mirror of
https://github.com/EnterpriseDB/repmgr.git
synced 2026-03-23 15:16:29 +00:00
Compare commits
228 Commits
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
16896510dc | ||
|
|
1c155a1088 | ||
|
|
31d57f4122 | ||
|
|
7b313b9d71 | ||
|
|
cf126642bd | ||
|
|
52281fcde8 | ||
|
|
de573edaaa | ||
|
|
4cb7f301ad | ||
|
|
87d8de4441 | ||
|
|
6db742f81e | ||
|
|
c79933685c | ||
|
|
04ba672b9f | ||
|
|
4f4111063a | ||
|
|
3a3a536e6d | ||
|
|
6f7206a5a1 | ||
|
|
f9fd1dd227 | ||
|
|
8140ba9c27 | ||
|
|
32dba444e1 | ||
|
|
8212ff8d8a | ||
|
|
1ccd0edad2 | ||
|
|
59b31dd1ca | ||
|
|
300b9f0cc2 | ||
|
|
0efee4cf65 | ||
|
|
0cb2584886 | ||
|
|
b88d27248c | ||
|
|
683c54325e | ||
|
|
70d398cd47 | ||
|
|
7b7d80e5f2 | ||
|
|
96b0e26084 | ||
|
|
91c498f6f1 | ||
|
|
d48093e732 | ||
|
|
3f0d1754a4 | ||
|
|
f27979bbe1 | ||
|
|
e9445a5d5e | ||
|
|
9a2717b5e3 | ||
|
|
dd6ea1cd77 | ||
|
|
de5908c122 | ||
|
|
4b5c84921c | ||
|
|
aaa8d70cef | ||
|
|
ca31b846e7 | ||
|
|
a27cecb559 | ||
|
|
cf0cdfa6a1 | ||
|
|
31489d92c0 | ||
|
|
b7fd13aed2 | ||
|
|
3c4bf27aa7 | ||
|
|
0ebd9c15d9 | ||
|
|
f9dba283d4 | ||
|
|
205f1cebbb | ||
|
|
4d97c1ebf7 | ||
|
|
12c395e91f | ||
|
|
bd1e4f71d6 | ||
|
|
cb49071ea4 | ||
|
|
5ad674edff | ||
|
|
ac09bad89c | ||
|
|
009d92fec8 | ||
|
|
b3d8a68a1d | ||
|
|
05b47cb2a8 | ||
|
|
dc542a1b7d | ||
|
|
6ce8058749 | ||
|
|
2edcac77f0 | ||
|
|
f740374392 | ||
|
|
c9c18d6216 | ||
|
|
d21f506614 | ||
|
|
fbad18085e | ||
|
|
ca08b1c3bb | ||
|
|
3d95fab0ac | ||
|
|
12d6ce4629 | ||
|
|
dfb34ae7b6 | ||
|
|
98c4eb002a | ||
|
|
faed8a65f7 | ||
|
|
a81cf04614 | ||
|
|
ca6cbcf965 | ||
|
|
16c1e13019 | ||
|
|
1375adcac8 | ||
|
|
e859a58405 | ||
|
|
1a6d830314 | ||
|
|
a96f478a43 | ||
|
|
8f20ab16dd | ||
|
|
3ec436f30d | ||
|
|
61e00bf1c7 | ||
|
|
5d71869fc1 | ||
|
|
7598e08b6f | ||
|
|
ba71e1eedf | ||
|
|
a4c07b23fb | ||
|
|
0c36f921f7 | ||
|
|
8ac5a5444e | ||
|
|
f60e7346e2 | ||
|
|
855ca8fe1a | ||
|
|
daa79d1a0f | ||
|
|
211768d911 | ||
|
|
f982708b35 | ||
|
|
995083d66c | ||
|
|
be58d6af96 | ||
|
|
a52e97e622 | ||
|
|
cc1ea00333 | ||
|
|
ec3596521f | ||
|
|
66245ccc03 | ||
|
|
c7542063be | ||
|
|
2633d994ef | ||
|
|
5359d45463 | ||
|
|
efa60d142c | ||
|
|
f3d0ab9ab9 | ||
|
|
7e6bac1be6 | ||
|
|
b72058dba8 | ||
|
|
79d1332f9c | ||
|
|
cde721e3fc | ||
|
|
7b2439b824 | ||
|
|
787cd94142 | ||
|
|
056e64f635 | ||
|
|
6b5a609d30 | ||
|
|
7a4d84379c | ||
|
|
490e12b1af | ||
|
|
7b9df3ac8f | ||
|
|
d6bf870316 | ||
|
|
b15e8debe1 | ||
|
|
310faf1bd9 | ||
|
|
35caeaa66a | ||
|
|
ba300c58f7 | ||
|
|
f2370de2fa | ||
|
|
3920deb803 | ||
|
|
e452bf6601 | ||
|
|
167b4efbb3 | ||
|
|
56b9ca7992 | ||
|
|
9c002c7e38 | ||
|
|
cfec04d19f | ||
|
|
4f1c67a1bf | ||
|
|
2f4fd2b7fa | ||
|
|
aca2b9547f | ||
|
|
c9db7f57d2 | ||
|
|
96ac39ba0f | ||
|
|
88a3378203 | ||
|
|
4db0efab47 | ||
|
|
864d57953a | ||
|
|
84d2a292b2 | ||
|
|
62d53b7622 | ||
|
|
77d52adb53 | ||
|
|
7a3e2f2a3a | ||
|
|
120688013e | ||
|
|
f6d1db5edb | ||
|
|
02729d299b | ||
|
|
88a6a1376e | ||
|
|
67df082ee9 | ||
|
|
9ed71d6317 | ||
|
|
933647d6de | ||
|
|
f99018b202 | ||
|
|
ced87373cd | ||
|
|
1db22546a9 | ||
|
|
7ae0df9c85 | ||
|
|
7a80f7a096 | ||
|
|
8710e067d0 | ||
|
|
793950eabd | ||
|
|
d1b4280182 | ||
|
|
64d038c823 | ||
|
|
46dd734b3d | ||
|
|
0a2e4466aa | ||
|
|
17ab86f7ac | ||
|
|
d433982af7 | ||
|
|
869b6a7a06 | ||
|
|
9018dc65de | ||
|
|
9cbd8df089 | ||
|
|
67a81d1d47 | ||
|
|
ab70007b75 | ||
|
|
0145aa0fc3 | ||
|
|
493c307b23 | ||
|
|
fc6225a511 | ||
|
|
e3111d37ba | ||
|
|
2a1a9f2e61 | ||
|
|
71a667ecb8 | ||
|
|
3ab91730c3 | ||
|
|
dd7f9b79ae | ||
|
|
8ab1901a93 | ||
|
|
e0cbdd5b31 | ||
|
|
d62aaeedd0 | ||
|
|
05cc7091b5 | ||
|
|
d192d5665c | ||
|
|
3848b9011b | ||
|
|
487aadc4b9 | ||
|
|
3f5920a395 | ||
|
|
617ea8cb78 | ||
|
|
142517fcca | ||
|
|
d722e2c74b | ||
|
|
abb02cab76 | ||
|
|
8e66e4811c | ||
|
|
ce5a541960 | ||
|
|
e12be52fa8 | ||
|
|
c0911d3286 | ||
|
|
6e94432282 | ||
|
|
29d9232e2f | ||
|
|
8973812144 | ||
|
|
e775a962ad | ||
|
|
12204f7e56 | ||
|
|
684f7590b7 | ||
|
|
9d589a780d | ||
|
|
83e6d15410 | ||
|
|
6a10fe0cd9 | ||
|
|
c664682c05 | ||
|
|
44acc8d719 | ||
|
|
b911483d5e | ||
|
|
ee9270fe8d | ||
|
|
d0a4eebeec | ||
|
|
0f5e71f029 | ||
|
|
dbd90d45f5 | ||
|
|
c8d0fb401f | ||
|
|
afda3419cc | ||
|
|
a86fa4ad4a | ||
|
|
7e3007f6e8 | ||
|
|
8c797a8fea | ||
|
|
56cec22f22 | ||
|
|
b61649a3e3 | ||
|
|
ded716e403 | ||
|
|
d639dc3342 | ||
|
|
17ed81ebb7 | ||
|
|
b00c507ee4 | ||
|
|
55d8b2ad9c | ||
|
|
c918aaad4a | ||
|
|
6e7eee4c01 | ||
|
|
5c59e8fc5b | ||
|
|
eba0b6bb1e | ||
|
|
3bc0b80a71 | ||
|
|
06b9e0a8ec | ||
|
|
120be2db1c | ||
|
|
12bd7da836 | ||
|
|
2fd905cf9e | ||
|
|
dd7ebdc1c7 | ||
|
|
1636805fa1 | ||
|
|
899d789699 | ||
|
|
cd7a3215df | ||
|
|
f8fd344d9f |
@@ -2,7 +2,7 @@ License and Contributions
|
|||||||
=========================
|
=========================
|
||||||
|
|
||||||
`repmgr` is licensed under the GPL v3. All of its code and documentation is
|
`repmgr` is licensed under the GPL v3. All of its code and documentation is
|
||||||
Copyright 2010-2015, 2ndQuadrant Limited. See the files COPYRIGHT and LICENSE for
|
Copyright 2010-2016, 2ndQuadrant Limited. See the files COPYRIGHT and LICENSE for
|
||||||
details.
|
details.
|
||||||
|
|
||||||
The development of repmgr has primarily been sponsored by 2ndQuadrant customers.
|
The development of repmgr has primarily been sponsored by 2ndQuadrant customers.
|
||||||
|
|||||||
@@ -1,4 +1,4 @@
|
|||||||
Copyright (c) 2010-2015, 2ndQuadrant Limited
|
Copyright (c) 2010-2016, 2ndQuadrant Limited
|
||||||
All rights reserved.
|
All rights reserved.
|
||||||
|
|
||||||
This program is free software: you can redistribute it and/or modify
|
This program is free software: you can redistribute it and/or modify
|
||||||
|
|||||||
238
FAILOVER.rst
238
FAILOVER.rst
@@ -1,237 +1 @@
|
|||||||
====================================================
|
The contents of this file have been incorporated into the main README.md document.
|
||||||
PostgreSQL Automatic Failover - User Documentation
|
|
||||||
====================================================
|
|
||||||
|
|
||||||
Automatic Failover
|
|
||||||
==================
|
|
||||||
|
|
||||||
repmgr allows for automatic failover when it detects the failure of the master node.
|
|
||||||
Following is a quick setup for this.
|
|
||||||
|
|
||||||
Installation
|
|
||||||
============
|
|
||||||
|
|
||||||
For convenience, we define:
|
|
||||||
|
|
||||||
**node1**
|
|
||||||
is the fully qualified domain name of the Master server, IP 192.168.1.10
|
|
||||||
**node2**
|
|
||||||
is the fully qualified domain name of the Standby server, IP 192.168.1.11
|
|
||||||
**witness**
|
|
||||||
is the fully qualified domain name of the server used as a witness, IP 192.168.1.12
|
|
||||||
|
|
||||||
**Note:** We don't recommend using names with the status of a server like «masterserver»,
|
|
||||||
because it would be confusing once a failover takes place and the Master is
|
|
||||||
now on the «standbyserver».
|
|
||||||
|
|
||||||
Summary
|
|
||||||
-------
|
|
||||||
|
|
||||||
2 PostgreSQL servers are involved in the replication. Automatic failover needs
|
|
||||||
a vote to decide what server it should promote, so an odd number is required.
|
|
||||||
A witness-repmgrd is installed in a third server where it uses a PostgreSQL
|
|
||||||
cluster to communicate with other repmgrd daemons.
|
|
||||||
|
|
||||||
1. Install PostgreSQL in all the servers involved (including the witness server)
|
|
||||||
|
|
||||||
2. Install repmgr in all the servers involved (including the witness server)
|
|
||||||
|
|
||||||
3. Configure the Master PostreSQL
|
|
||||||
|
|
||||||
4. Clone the Master to the Standby using "repmgr standby clone" command
|
|
||||||
|
|
||||||
5. Configure repmgr in all the servers involved (including the witness server)
|
|
||||||
|
|
||||||
6. Register Master and Standby nodes
|
|
||||||
|
|
||||||
7. Initiate witness server
|
|
||||||
|
|
||||||
8. Start the repmgrd daemons in all nodes
|
|
||||||
|
|
||||||
**Note** A complete High-Availability design needs at least 3 servers to still have
|
|
||||||
a backup node after a first failure.
|
|
||||||
|
|
||||||
Install PostgreSQL
|
|
||||||
------------------
|
|
||||||
|
|
||||||
You can install PostgreSQL using any of the recommended methods. You should ensure
|
|
||||||
it's 9.0 or later.
|
|
||||||
|
|
||||||
Install repmgr
|
|
||||||
--------------
|
|
||||||
|
|
||||||
Install repmgr following the steps in the README file.
|
|
||||||
|
|
||||||
Configure PostreSQL
|
|
||||||
-------------------
|
|
||||||
|
|
||||||
Log in to node1.
|
|
||||||
|
|
||||||
Edit the file postgresql.conf and modify the parameters::
|
|
||||||
|
|
||||||
listen_addresses='*'
|
|
||||||
wal_level = 'hot_standby'
|
|
||||||
archive_mode = on
|
|
||||||
archive_command = 'cd .' # we can also use exit 0, anything that
|
|
||||||
# just does nothing
|
|
||||||
max_wal_senders = 10
|
|
||||||
wal_keep_segments = 5000 # 80 GB required on pg_xlog
|
|
||||||
hot_standby = on
|
|
||||||
shared_preload_libraries = 'repmgr_funcs'
|
|
||||||
|
|
||||||
Edit the file pg_hba.conf and add lines for the replication::
|
|
||||||
|
|
||||||
host repmgr repmgr 127.0.0.1/32 trust
|
|
||||||
host repmgr repmgr 192.168.1.10/30 trust
|
|
||||||
host replication all 192.168.1.10/30 trust
|
|
||||||
|
|
||||||
**Note:** It is also possible to use a password authentication (md5), .pgpass file
|
|
||||||
should be edited to allow connection between each node.
|
|
||||||
|
|
||||||
Create the user and database to manage replication::
|
|
||||||
|
|
||||||
su - postgres
|
|
||||||
createuser -s repmgr
|
|
||||||
createdb -O repmgr repmgr
|
|
||||||
psql -f /usr/share/postgresql/9.0/contrib/repmgr_funcs.sql repmgr
|
|
||||||
|
|
||||||
Restart the PostgreSQL server::
|
|
||||||
|
|
||||||
pg_ctl -D $PGDATA restart
|
|
||||||
|
|
||||||
And check everything is fine in the server log.
|
|
||||||
|
|
||||||
Create the ssh-key for the postgres user and copy it to other servers::
|
|
||||||
|
|
||||||
su - postgres
|
|
||||||
ssh-keygen # /!\ do not use a passphrase /!\
|
|
||||||
cat ~/.ssh/id_rsa.pub > ~/.ssh/authorized_keys
|
|
||||||
chmod 600 ~/.ssh/authorized_keys
|
|
||||||
exit
|
|
||||||
rsync -avz ~postgres/.ssh/authorized_keys node2:~postgres/.ssh/
|
|
||||||
rsync -avz ~postgres/.ssh/authorized_keys witness:~postgres/.ssh/
|
|
||||||
rsync -avz ~postgres/.ssh/id_rsa* node2:~postgres/.ssh/
|
|
||||||
rsync -avz ~postgres/.ssh/id_rsa* witness:~postgres/.ssh/
|
|
||||||
|
|
||||||
Clone Master
|
|
||||||
------------
|
|
||||||
|
|
||||||
Log in to node2.
|
|
||||||
|
|
||||||
Clone node1 (the current Master)::
|
|
||||||
|
|
||||||
su - postgres
|
|
||||||
repmgr -d repmgr -U repmgr -h node1 standby clone
|
|
||||||
|
|
||||||
Start the PostgreSQL server::
|
|
||||||
|
|
||||||
pg_ctl -D $PGDATA start
|
|
||||||
|
|
||||||
And check everything is fine in the server log.
|
|
||||||
|
|
||||||
Configure repmgr
|
|
||||||
----------------
|
|
||||||
|
|
||||||
Log in to each server and configure repmgr by editing the file
|
|
||||||
/etc/repmgr/repmgr.conf::
|
|
||||||
|
|
||||||
cluster=my_cluster
|
|
||||||
node=1
|
|
||||||
node_name=earth
|
|
||||||
conninfo='host=192.168.1.10 dbname=repmgr user=repmgr'
|
|
||||||
master_response_timeout=60
|
|
||||||
reconnect_attempts=6
|
|
||||||
reconnect_interval=10
|
|
||||||
failover=automatic
|
|
||||||
promote_command='promote_command.sh'
|
|
||||||
follow_command='repmgr standby follow -f /etc/repmgr/repmgr.conf'
|
|
||||||
|
|
||||||
**cluster**
|
|
||||||
is the name of the current replication.
|
|
||||||
**node**
|
|
||||||
is the number of the current node (1, 2 or 3 in the current example).
|
|
||||||
**node_name**
|
|
||||||
is an identifier for every node.
|
|
||||||
**conninfo**
|
|
||||||
is used to connect to the local PostgreSQL server (where the configuration file is) from any node. In the witness server configuration you need to add a 'port=5499' to the conninfo.
|
|
||||||
**master_response_timeout**
|
|
||||||
is the maximum amount of time we are going to wait before deciding the master has died and start the failover procedure.
|
|
||||||
**reconnect_attempts**
|
|
||||||
is the number of times we will try to reconnect to master after a failure has been detected and before start the failover procedure.
|
|
||||||
**reconnect_interval**
|
|
||||||
is the amount of time between retries to reconnect to master after a failure has been detected and before start the failover procedure.
|
|
||||||
**failover**
|
|
||||||
configure behavior: *manual* or *automatic*.
|
|
||||||
**promote_command**
|
|
||||||
the command executed to do the failover (including the PostgreSQL failover itself). The command must return 0 on success.
|
|
||||||
**follow_command**
|
|
||||||
the command executed to address the current standby to another Master. The command must return 0 on success.
|
|
||||||
|
|
||||||
Register Master and Standby
|
|
||||||
---------------------------
|
|
||||||
|
|
||||||
Log in to node1.
|
|
||||||
|
|
||||||
Register the node as Master::
|
|
||||||
|
|
||||||
su - postgres
|
|
||||||
repmgr -f /etc/repmgr/repmgr.conf master register
|
|
||||||
|
|
||||||
Log in to node2. Register it as a standby::
|
|
||||||
|
|
||||||
su - postgres
|
|
||||||
repmgr -f /etc/repmgr/repmgr.conf standby register
|
|
||||||
|
|
||||||
Initialize witness server
|
|
||||||
-------------------------
|
|
||||||
|
|
||||||
Log in to witness.
|
|
||||||
|
|
||||||
Initialize the witness server::
|
|
||||||
|
|
||||||
su - postgres
|
|
||||||
repmgr -d repmgr -U repmgr -h 192.168.1.10 -D $WITNESS_PGDATA -f /etc/repmgr/repmgr.conf witness create
|
|
||||||
|
|
||||||
The witness server needs the following information from the command
|
|
||||||
line:
|
|
||||||
|
|
||||||
* Connection details for the current master, to copy the cluster
|
|
||||||
configuration.
|
|
||||||
* A location for initializing its own $PGDATA.
|
|
||||||
|
|
||||||
repmgr will also ask for the superuser password on the witness database so
|
|
||||||
it can reconnect when needed (the command line option --initdb-no-pwprompt
|
|
||||||
will set up a password-less superuser).
|
|
||||||
|
|
||||||
By default the witness server will listen on port 5499; this value can be
|
|
||||||
overridden by explicitly providing the port number in the conninfo string
|
|
||||||
in repmgr.conf. (Note that it is also possible to specify the port number
|
|
||||||
with the -l/--local-port option, however this option is now deprecated and
|
|
||||||
will be overridden by a port setting in the conninfo string).
|
|
||||||
|
|
||||||
Start the repmgrd daemons
|
|
||||||
-------------------------
|
|
||||||
|
|
||||||
Log in to node2 and witness::
|
|
||||||
|
|
||||||
su - postgres
|
|
||||||
repmgrd -f /etc/repmgr/repmgr.conf --daemonize -> /var/log/postgresql/repmgr.log 2>&1
|
|
||||||
|
|
||||||
**Note:** The Master does not need a repmgrd daemon.
|
|
||||||
|
|
||||||
Suspend Automatic behavior
|
|
||||||
==========================
|
|
||||||
|
|
||||||
Edit the repmgr.conf of the node to remove from automatic processing and change::
|
|
||||||
|
|
||||||
failover=manual
|
|
||||||
|
|
||||||
Then, signal repmgrd daemon::
|
|
||||||
|
|
||||||
su - postgres
|
|
||||||
kill -HUP $(pidof repmgrd)
|
|
||||||
|
|
||||||
Usage
|
|
||||||
=====
|
|
||||||
|
|
||||||
The repmgr documentation is in the README file (how to build, options, etc.)
|
|
||||||
|
|||||||
39
FAQ.md
39
FAQ.md
@@ -34,6 +34,11 @@ General
|
|||||||
replication slots, setting a higher figure will make adding new nodes
|
replication slots, setting a higher figure will make adding new nodes
|
||||||
easier.
|
easier.
|
||||||
|
|
||||||
|
- Does `repmgr` support hash indexes?
|
||||||
|
|
||||||
|
No. Hash indexes and replication do not mix well and their use is
|
||||||
|
explicitly discouraged; see:
|
||||||
|
http://www.postgresql.org/docs/current/interactive/sql-createindex.html#AEN74175
|
||||||
|
|
||||||
`repmgr`
|
`repmgr`
|
||||||
--------
|
--------
|
||||||
@@ -96,8 +101,9 @@ General
|
|||||||
is intended to support running the witness server as a separate
|
is intended to support running the witness server as a separate
|
||||||
instance on a normal node server, rather than on its own dedicated server.
|
instance on a normal node server, rather than on its own dedicated server.
|
||||||
|
|
||||||
To specify a port for the witness server, supply the port number to
|
To specify a different port for the witness server, supply the port number
|
||||||
repmgr with the `-l/--local-port` command line option.
|
in the `conninfo` string in `repmgr.conf`
|
||||||
|
(repmgr 3.0.1 and earlier: use the `-l/--local-port` option)
|
||||||
|
|
||||||
- Do I need to include `shared_preload_libraries = 'repmgr_funcs'`
|
- Do I need to include `shared_preload_libraries = 'repmgr_funcs'`
|
||||||
in `postgresql.conf` if I'm not using `repmgrd`?
|
in `postgresql.conf` if I'm not using `repmgrd`?
|
||||||
@@ -106,6 +112,30 @@ General
|
|||||||
If you later decide to run `repmgrd`, you just need to add
|
If you later decide to run `repmgrd`, you just need to add
|
||||||
`shared_preload_libraries = 'repmgr_funcs'` and restart PostgreSQL.
|
`shared_preload_libraries = 'repmgr_funcs'` and restart PostgreSQL.
|
||||||
|
|
||||||
|
- I've provided replication permission for the `repmgr` user in `pg_hba.conf`
|
||||||
|
but `repmgr`/`repmgrd` complains it can't connect to the server... Why?
|
||||||
|
|
||||||
|
`repmgr`/`repmgrd` need to be able to connect to the repmgr database
|
||||||
|
with a normal connection to query metadata. The `replication` connection
|
||||||
|
permission is for PostgreSQL's streaming replication and doesn't
|
||||||
|
necessarily need to be the `repmgr` user.
|
||||||
|
|
||||||
|
- When cloning a standby, why do I need to provide the connection parameters
|
||||||
|
for the primary server on the command line, not in the configuration file?
|
||||||
|
|
||||||
|
Cloning a standby is a one-time action; the role of the server being cloned
|
||||||
|
from could change, so fixing it in the configuration file would create
|
||||||
|
confusion. If `repmgr` needs to establish a connection to the primary
|
||||||
|
server, it can retrieve this from the `repl_nodes` table or if necessary
|
||||||
|
scan the replication cluster until it locates the active primary.
|
||||||
|
|
||||||
|
- Why is there no foreign key on the `node_id` column in the `repl_events`
|
||||||
|
table?
|
||||||
|
|
||||||
|
Under some circumstances event notifications can be generated for servers
|
||||||
|
which have not yet been registered; it's also useful to retain a record
|
||||||
|
of events which includes servers removed from the replication cluster
|
||||||
|
which no longer have an entry in the `repl_nodes` table.
|
||||||
|
|
||||||
`repmgrd`
|
`repmgrd`
|
||||||
---------
|
---------
|
||||||
@@ -134,3 +164,8 @@ General
|
|||||||
|
|
||||||
Note that after registering a delayed standby, `repmgrd` will only start
|
Note that after registering a delayed standby, `repmgrd` will only start
|
||||||
once the metadata added in the master node has been replicated.
|
once the metadata added in the master node has been replicated.
|
||||||
|
|
||||||
|
- How can I get `repmgrd` to rotate its logfile?
|
||||||
|
|
||||||
|
Configure your system's `logrotate` service to do this; see example
|
||||||
|
in README.md
|
||||||
|
|||||||
52
HISTORY
52
HISTORY
@@ -1,4 +1,50 @@
|
|||||||
3.0.2 2015-09-
|
3.1.3 2016-05-17
|
||||||
|
repmgrd: enable monitoring when a standby is catching up by
|
||||||
|
replaying archived WAL (Ian)
|
||||||
|
repmgrd: when upstream_node_id is NULL, assume upstream node
|
||||||
|
to be current master (Ian)
|
||||||
|
repmgrd: check for reappearance of the master node if standby
|
||||||
|
promotion fails (Ian)
|
||||||
|
improve handling of rsync failure conditions (Martín)
|
||||||
|
|
||||||
|
3.1.2 2016-04-12
|
||||||
|
Fix pg_ctl path generation in do_standby_switchover() (Ian)
|
||||||
|
Regularly sync witness server repl_nodes table (Ian)
|
||||||
|
Documentation improvements (Gianni, dhyannataraj)
|
||||||
|
(Experimental) ensure repmgr handles failover slots when copying
|
||||||
|
in rsync mode (Craig, Ian)
|
||||||
|
rsync mode handling fixes (Martín)
|
||||||
|
Enable repmgr to compile against 9.6devel (Ian)
|
||||||
|
|
||||||
|
3.1.1 2016-02-24
|
||||||
|
Add '-P/--pwprompt' option for "repmgr witness create" (Ian)
|
||||||
|
Prevent repmgr/repmgrd running as root (Ian)
|
||||||
|
|
||||||
|
3.1.0 2016-02-01
|
||||||
|
Add "repmgr standby switchover" command (Ian)
|
||||||
|
Revised README file (Ian)
|
||||||
|
Remove requirement for 'archive_mode' to be enabled (Ian)
|
||||||
|
Improve -?/--help output, showing default values if relevant (Ian)
|
||||||
|
Various bugfixes to command line/configuration parameter handling (Ian)
|
||||||
|
|
||||||
|
3.0.3 2016-01-04
|
||||||
|
Create replication slot if required before base backup is run (Abhijit)
|
||||||
|
standby clone: when using rsync, clean up "pg_replslot" directory (Ian)
|
||||||
|
Improve --help output (Ian)
|
||||||
|
Improve config file parsing (Ian)
|
||||||
|
Various logging output improvements, including explicit HINTS (Ian)
|
||||||
|
Add --log-level to explicitly set log level on command line (Ian)
|
||||||
|
Repurpose --verbose to display extra log output (Ian)
|
||||||
|
Add --terse to hide hints and other non-critical output (Ian)
|
||||||
|
Reference internal functions with explicit catalog path (Ian)
|
||||||
|
When following a new primary, have repmgr (not repmgrd) create the new slot (Ian)
|
||||||
|
Add /etc/repmgr.conf as a default configuration file location (Ian)
|
||||||
|
Prevent repmgrd's -v/--verbose option expecting a parameter (Ian)
|
||||||
|
Prevent invalid replication_lag values being written to the monitoring table (Ian)
|
||||||
|
Improve repmgrd behaviour when monitored standby node is temporarily
|
||||||
|
unavailable (Martín)
|
||||||
|
|
||||||
|
3.0.2 2015-10-02
|
||||||
Improve handling of --help/--version options; and improve help output (Ian)
|
Improve handling of --help/--version options; and improve help output (Ian)
|
||||||
Improve handling of situation where logfile can't be opened (Ian)
|
Improve handling of situation where logfile can't be opened (Ian)
|
||||||
Always pass -D/--pgdata option to pg_basebackup (Ian)
|
Always pass -D/--pgdata option to pg_basebackup (Ian)
|
||||||
@@ -12,7 +58,9 @@
|
|||||||
Update tablespace remapping in --rsync-only mode for 9.5 and later (Ian)
|
Update tablespace remapping in --rsync-only mode for 9.5 and later (Ian)
|
||||||
Deprecate `-l/--local-port` option - the port can be extracted
|
Deprecate `-l/--local-port` option - the port can be extracted
|
||||||
from the conninfo string in repmgr.conf (Ian)
|
from the conninfo string in repmgr.conf (Ian)
|
||||||
Add STANDBY UNREGISTE (Vik Fearing)
|
Add STANDBY UNREGISTER (Vik Fearing)
|
||||||
|
Don't fail with error when registering master if schema already defined (Ian)
|
||||||
|
Fixes to whitespace handling when parsing config file (Ian)
|
||||||
|
|
||||||
3.0.1 2015-04-16
|
3.0.1 2015-04-16
|
||||||
Prevent repmgrd from looping infinitely if node was not registered (Ian)
|
Prevent repmgrd from looping infinitely if node was not registered (Ian)
|
||||||
|
|||||||
48
Makefile
48
Makefile
@@ -1,6 +1,8 @@
|
|||||||
#
|
#
|
||||||
# Makefile
|
# Makefile
|
||||||
# Copyright (c) 2ndQuadrant, 2010-2015
|
# Copyright (c) 2ndQuadrant, 2010-2016
|
||||||
|
|
||||||
|
HEADERS = $(wildcard *.h)
|
||||||
|
|
||||||
repmgrd_OBJS = dbutils.o config.o repmgrd.o log.o strutil.o
|
repmgrd_OBJS = dbutils.o config.o repmgrd.o log.o strutil.o
|
||||||
repmgr_OBJS = dbutils.o check_dir.o config.o repmgr.o log.o strutil.o
|
repmgr_OBJS = dbutils.o check_dir.o config.o repmgr.o log.o strutil.o
|
||||||
@@ -8,17 +10,24 @@ repmgr_OBJS = dbutils.o check_dir.o config.o repmgr.o log.o strutil.o
|
|||||||
DATA = repmgr.sql uninstall_repmgr.sql
|
DATA = repmgr.sql uninstall_repmgr.sql
|
||||||
|
|
||||||
PG_CPPFLAGS = -I$(libpq_srcdir)
|
PG_CPPFLAGS = -I$(libpq_srcdir)
|
||||||
PG_LIBS = $(libpq_pgport)
|
PG_LIBS = $(libpq_pgport)
|
||||||
|
|
||||||
all: repmgrd repmgr
|
|
||||||
|
all: repmgrd repmgr
|
||||||
$(MAKE) -C sql
|
$(MAKE) -C sql
|
||||||
|
|
||||||
repmgrd: $(repmgrd_OBJS)
|
repmgrd: $(repmgrd_OBJS)
|
||||||
$(CC) $(CFLAGS) $(repmgrd_OBJS) $(PG_LIBS) $(LDFLAGS) $(LDFLAGS_EX) $(LIBS) -o repmgrd
|
$(CC) -o repmgrd $(CFLAGS) $(repmgrd_OBJS) $(PG_LIBS) $(LDFLAGS) $(LDFLAGS_EX) $(LIBS)
|
||||||
$(MAKE) -C sql
|
$(MAKE) -C sql
|
||||||
|
|
||||||
repmgr: $(repmgr_OBJS)
|
repmgr: $(repmgr_OBJS)
|
||||||
$(CC) $(CFLAGS) $(repmgr_OBJS) $(PG_LIBS) $(LDFLAGS) $(LDFLAGS_EX) $(LIBS) -o repmgr
|
$(CC) -o repmgr $(CFLAGS) $(repmgr_OBJS) $(PG_LIBS) $(LDFLAGS) $(LDFLAGS_EX) $(LIBS)
|
||||||
|
|
||||||
|
# Make all objects depend on all include files. This is a bit of a
|
||||||
|
# shotgun approach, but the codebase is small enough that a complete rebuild
|
||||||
|
# is very fast anyway.
|
||||||
|
$(repmgr_OBJS): $(HEADERS)
|
||||||
|
$(repmgrd_OBJS): $(HEADERS)
|
||||||
|
|
||||||
ifdef USE_PGXS
|
ifdef USE_PGXS
|
||||||
PG_CONFIG = pg_config
|
PG_CONFIG = pg_config
|
||||||
@@ -31,8 +40,8 @@ include $(top_builddir)/src/Makefile.global
|
|||||||
include $(top_srcdir)/contrib/contrib-global.mk
|
include $(top_srcdir)/contrib/contrib-global.mk
|
||||||
endif
|
endif
|
||||||
|
|
||||||
# XXX: Try to use PROGRAM construct (see pgxs.mk) someday. Right now
|
# XXX: This overrides the pgxs install target - we're building two binaries,
|
||||||
# is overriding pgxs install.
|
# which is not supported by pgxs.mk's PROGRAM construct.
|
||||||
install: install_prog install_ext
|
install: install_prog install_ext
|
||||||
|
|
||||||
install_prog:
|
install_prog:
|
||||||
@@ -43,6 +52,12 @@ install_prog:
|
|||||||
install_ext:
|
install_ext:
|
||||||
$(MAKE) -C sql install
|
$(MAKE) -C sql install
|
||||||
|
|
||||||
|
# Distribution-specific package building targets
|
||||||
|
# ----------------------------------------------
|
||||||
|
#
|
||||||
|
# XXX we recommend using the PGDG-supplied packages where possible;
|
||||||
|
# see README.md for details.
|
||||||
|
|
||||||
install_rhel:
|
install_rhel:
|
||||||
mkdir -p '$(DESTDIR)/etc/init.d/'
|
mkdir -p '$(DESTDIR)/etc/init.d/'
|
||||||
$(INSTALL_PROGRAM) RHEL/repmgrd.init '$(DESTDIR)/etc/init.d/repmgrd'
|
$(INSTALL_PROGRAM) RHEL/repmgrd.init '$(DESTDIR)/etc/init.d/repmgrd'
|
||||||
@@ -67,16 +82,21 @@ clean:
|
|||||||
rm -f repmgr
|
rm -f repmgr
|
||||||
$(MAKE) -C sql clean
|
$(MAKE) -C sql clean
|
||||||
|
|
||||||
|
# Get correct version numbers and install paths, depending on your postgres version
|
||||||
|
PG_VERSION = $(shell pg_config --version | cut -d ' ' -f 2 | cut -d '.' -f 1,2)
|
||||||
|
REPMGR_VERSION = $(shell grep REPMGR_VERSION version.h | cut -d ' ' -f 3 | cut -d '"' -f 2)
|
||||||
|
PKGLIBDIR = $(shell pg_config --pkglibdir)
|
||||||
|
SHAREDIR = $(shell pg_config --sharedir)
|
||||||
|
|
||||||
deb: repmgrd repmgr
|
deb: repmgrd repmgr
|
||||||
mkdir -p ./debian/usr/bin
|
mkdir -p ./debian/usr/bin
|
||||||
cp repmgrd repmgr ./debian/usr/bin/
|
cp repmgrd repmgr ./debian/usr/bin/
|
||||||
mkdir -p ./debian/usr/share/postgresql/9.0/contrib/
|
mkdir -p ./debian$(SHAREDIR)/contrib/
|
||||||
cp sql/repmgr_funcs.sql ./debian/usr/share/postgresql/9.0/contrib/
|
cp sql/repmgr_funcs.sql ./debian$(SHAREDIR)/contrib/
|
||||||
cp sql/uninstall_repmgr_funcs.sql ./debian/usr/share/postgresql/9.0/contrib/
|
cp sql/uninstall_repmgr_funcs.sql ./debian$(SHAREDIR)/contrib/
|
||||||
mkdir -p ./debian/usr/lib/postgresql/9.0/lib/
|
mkdir -p ./debian$(PKGLIBDIR)/
|
||||||
cp sql/repmgr_funcs.so ./debian/usr/lib/postgresql/9.0/lib/
|
cp sql/repmgr_funcs.so ./debian$(PKGLIBDIR)/
|
||||||
dpkg-deb --build debian
|
dpkg-deb --build debian
|
||||||
mv debian.deb ../postgresql-repmgr-9.0_1.0.0.deb
|
mv debian.deb ../postgresql-repmgr-$(PG_VERSION)_$(REPMGR_VERSION).deb
|
||||||
rm -rf ./debian/usr
|
rm -rf ./debian/usr
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
119
QUICKSTART.md
119
QUICKSTART.md
@@ -1,118 +1 @@
|
|||||||
repmgr quickstart guide
|
The contents of this file have been incorporated into the main README.md document.
|
||||||
=======================
|
|
||||||
|
|
||||||
This quickstart guide provides some annotated examples on basic
|
|
||||||
`repmgr` setup. It assumes you are familiar with PostgreSQL replication
|
|
||||||
concepts setup and Linux/UNIX system administration.
|
|
||||||
|
|
||||||
For the purposes of this guide, we'll assume the database user will be
|
|
||||||
`repmgr_usr` and the database will be `repmgr_db`.
|
|
||||||
|
|
||||||
|
|
||||||
Master setup
|
|
||||||
------------
|
|
||||||
|
|
||||||
1. Configure PostgreSQL
|
|
||||||
|
|
||||||
- create user and database:
|
|
||||||
|
|
||||||
```
|
|
||||||
CREATE ROLE repmgr_usr LOGIN SUPERUSER;
|
|
||||||
CREATE DATABASE repmgr_db OWNER repmgr_usr;
|
|
||||||
```
|
|
||||||
|
|
||||||
- configure `postgresql.conf` for replication (see README.md for sample
|
|
||||||
settings)
|
|
||||||
|
|
||||||
- update `pg_hba.conf`, e.g.:
|
|
||||||
|
|
||||||
```
|
|
||||||
host repmgr_db repmgr_usr 192.168.1.0/24 trust
|
|
||||||
host replication repmgr_usr 192.168.1.0/24 trust
|
|
||||||
```
|
|
||||||
|
|
||||||
Restart the PostgreSQL server after making these changes.
|
|
||||||
|
|
||||||
2. Create the `repmgr` configuration file:
|
|
||||||
|
|
||||||
$ cat /path/to/repmgr/node1/repmgr.conf
|
|
||||||
cluster=test
|
|
||||||
node=1
|
|
||||||
node_name=node1
|
|
||||||
conninfo='host=repmgr_node1 user=repmgr_usr dbname=repmgr_db'
|
|
||||||
pg_bindir=/path/to/postgres/bin
|
|
||||||
|
|
||||||
(For an annotated `repmgr.conf` file, see `repmgr.conf.sample` in the
|
|
||||||
repository's root directory).
|
|
||||||
|
|
||||||
3. Register the master node with `repmgr`:
|
|
||||||
|
|
||||||
$ repmgr -f /path/to/repmgr/node1/repmgr.conf --verbose master register
|
|
||||||
[2015-03-03 17:45:53] [INFO] repmgr connecting to master database
|
|
||||||
[2015-03-03 17:45:53] [INFO] repmgr connected to master, checking its state
|
|
||||||
[2015-03-03 17:45:53] [INFO] master register: creating database objects inside the repmgr_test schema
|
|
||||||
[2015-03-03 17:45:53] [NOTICE] Master node correctly registered for cluster test with id 1 (conninfo: host=localhost user=repmgr_usr dbname=repmgr_db)
|
|
||||||
|
|
||||||
Standby setup
|
|
||||||
-------------
|
|
||||||
|
|
||||||
1. Use `repmgr standby clone` to clone a standby from the master:
|
|
||||||
|
|
||||||
repmgr -D /path/to/standby/data -d repmgr_db -U repmgr_usr --verbose standby clone 192.168.1.2
|
|
||||||
[2015-03-03 18:18:21] [NOTICE] No configuration file provided and default file './repmgr.conf' not found - continuing with default values
|
|
||||||
[2015-03-03 18:18:21] [NOTICE] repmgr Destination directory ' /path/to/standby/data' provided
|
|
||||||
[2015-03-03 18:18:21] [INFO] repmgr connecting to upstream node
|
|
||||||
[2015-03-03 18:18:21] [INFO] repmgr connected to upstream node, checking its state
|
|
||||||
[2015-03-03 18:18:21] [INFO] Successfully connected to upstream node. Current installation size is 27 MB
|
|
||||||
[2015-03-03 18:18:21] [NOTICE] Starting backup...
|
|
||||||
[2015-03-03 18:18:21] [INFO] creating directory " /path/to/standby/data"...
|
|
||||||
[2015-03-03 18:18:21] [INFO] Executing: 'pg_basebackup -l "repmgr base backup" -h localhost -p 9595 -U repmgr_usr -D /path/to/standby/data '
|
|
||||||
NOTICE: pg_stop_backup complete, all required WAL segments have been archived
|
|
||||||
[2015-03-03 18:18:23] [NOTICE] repmgr standby clone (using pg_basebackup) complete
|
|
||||||
[2015-03-03 18:18:23] [NOTICE] HINT: You can now start your postgresql server
|
|
||||||
[2015-03-03 18:18:23] [NOTICE] for example : pg_ctl -D /path/to/standby/data start
|
|
||||||
|
|
||||||
Note that the `repmgr.conf` file is not required when cloning a standby.
|
|
||||||
However we recommend providing a valid `repmgr.conf` if you wish to use
|
|
||||||
replication slots, or want `repmgr` to log the clone event to the
|
|
||||||
`repl_events` table.
|
|
||||||
|
|
||||||
This will clone the PostgreSQL database files from the master, including its
|
|
||||||
`postgresql.conf` and `pg_hba.conf` files, and additionally automatically create
|
|
||||||
the `recovery.conf` file containing the correct parameters to start streaming
|
|
||||||
from the primary node.
|
|
||||||
|
|
||||||
2. Start the PostgreSQL server
|
|
||||||
|
|
||||||
3. Create the `repmgr` configuration file:
|
|
||||||
|
|
||||||
$ cat /path/to/repmgr/node2/repmgr.conf
|
|
||||||
cluster=test
|
|
||||||
node=2
|
|
||||||
node_name=node2
|
|
||||||
conninfo='host=repmgr_node2 user=repmgr_usr dbname=repmgr_db'
|
|
||||||
pg_bindir=/path/to/postgres/bin
|
|
||||||
|
|
||||||
4. Register the standby node with `repmgr`:
|
|
||||||
|
|
||||||
$ repmgr -f /path/to/repmgr/node2/repmgr.conf --verbose standby register
|
|
||||||
[2015-03-03 18:24:34] [NOTICE] Opening configuration file: /path/to/repmgr/node2/repmgr.conf
|
|
||||||
[2015-03-03 18:24:34] [INFO] repmgr connecting to standby database
|
|
||||||
[2015-03-03 18:24:34] [INFO] repmgr connecting to master database
|
|
||||||
[2015-03-03 18:24:34] [INFO] finding node list for cluster 'test'
|
|
||||||
[2015-03-03 18:24:34] [INFO] checking role of cluster node '1'
|
|
||||||
[2015-03-03 18:24:34] [INFO] repmgr connected to master, checking its state
|
|
||||||
[2015-03-03 18:24:34] [INFO] repmgr registering the standby
|
|
||||||
[2015-03-03 18:24:34] [INFO] repmgr registering the standby complete
|
|
||||||
[2015-03-03 18:24:34] [NOTICE] Standby node correctly registered for cluster test with id 2 (conninfo: host=localhost user=repmgr_usr dbname=repmgr_db)
|
|
||||||
|
|
||||||
|
|
||||||
This concludes the basic `repmgr` setup of master and standby. The records
|
|
||||||
created in the `repl_nodes` table should look something like this:
|
|
||||||
|
|
||||||
repmgr_db=# SELECT * from repmgr_test.repl_nodes;
|
|
||||||
id | type | upstream_node_id | cluster | name | conninfo | slot_name | priority | active
|
|
||||||
----+---------+------------------+---------+-------+----------------------------------------------------+-----------+----------+--------
|
|
||||||
1 | primary | | test | node1 | host=repmgr_node1 user=repmgr_usr dbname=repmgr_db | | 0 | t
|
|
||||||
2 | standby | 1 | test | node2 | host=repmgr_node2 user=repmgr_usr dbname=repmgr_db | | 0 | t
|
|
||||||
(2 rows)
|
|
||||||
|
|||||||
35
TODO
35
TODO
@@ -7,6 +7,7 @@ Known issues in repmgr
|
|||||||
|
|
||||||
* PGPASSFILE may not be passed to pg_basebackup
|
* PGPASSFILE may not be passed to pg_basebackup
|
||||||
|
|
||||||
|
|
||||||
Planned feature improvements
|
Planned feature improvements
|
||||||
============================
|
============================
|
||||||
|
|
||||||
@@ -39,6 +40,34 @@ Planned feature improvements
|
|||||||
* make old master node ID available for event notification commands
|
* make old master node ID available for event notification commands
|
||||||
(See github issue #80).
|
(See github issue #80).
|
||||||
|
|
||||||
* Have pg_basebackup use replication slots, if and when support for
|
* repmgr standby clone: possibility to use barman instead of performing a new base backup
|
||||||
this is added; see:
|
|
||||||
http://www.postgresql.org/message-id/555DD2B2.7020000@gmx.net
|
* possibility to transform a failed master into a new standby with pg_rewind
|
||||||
|
|
||||||
|
* "repmgr standby switchover" to promote a standby in a controlled manner
|
||||||
|
and convert the existing primary into a standby
|
||||||
|
|
||||||
|
* make repmgrd more robust
|
||||||
|
|
||||||
|
* repmgr: when cloning a standby using pg_basebackup and replication slots are
|
||||||
|
requested, activate the replication slot using pg_receivexlog to negate the
|
||||||
|
need to set `wal_keep_segments` just for the initial clone (9.4 and 9.5).
|
||||||
|
|
||||||
|
* Take into account the fact that a standby can obtain WAL from an archive,
|
||||||
|
so even if direct streaming replication is interrupted, it may be up-to-date
|
||||||
|
|
||||||
|
Usability improvements
|
||||||
|
======================
|
||||||
|
|
||||||
|
* repmgr: add interrupt handler, so that if the program is interrupted
|
||||||
|
while running a backup, an attempt can be made to execute pg_stop_backup()
|
||||||
|
on the primary, to avoid leaving it in an orphaned backup state.
|
||||||
|
|
||||||
|
* repmgr: when unregistering a node, delete any entries in the repl_monitoring
|
||||||
|
table.
|
||||||
|
|
||||||
|
* repmgr: for "standby unregister", accept connection parameters for the
|
||||||
|
primary and perform metadata updates (and slot removal) directly on
|
||||||
|
the primary, to allow a shutdown standby to be unregistered
|
||||||
|
(currently the standby must still be running, which means the replication
|
||||||
|
slot can't be dropped).
|
||||||
|
|||||||
10
check_dir.c
10
check_dir.c
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* check_dir.c - Directories management functions
|
* check_dir.c - Directories management functions
|
||||||
* Copyright (C) 2ndQuadrant, 2010-2015
|
* Copyright (C) 2ndQuadrant, 2010-2016
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -320,10 +320,10 @@ _create_pg_dir(char *dir, bool force, bool for_witness)
|
|||||||
}
|
}
|
||||||
else if (pg_dir && !force)
|
else if (pg_dir && !force)
|
||||||
{
|
{
|
||||||
log_warning(_("\nThis looks like a PostgreSQL directory.\n"
|
log_hint(_("This looks like a PostgreSQL directory.\n"
|
||||||
"If you are sure you want to clone here, "
|
"If you are sure you want to clone here, "
|
||||||
"please check there is no PostgreSQL server "
|
"please check there is no PostgreSQL server "
|
||||||
"running and use the --force option\n"));
|
"running and use the -F/--force option\n"));
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|||||||
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* check_dir.h
|
* check_dir.h
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2015
|
* Copyright (c) 2ndQuadrant, 2010-2016
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
|
|||||||
461
config.c
461
config.c
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* config.c - Functions to parse the config file
|
* config.c - Functions to parse the config file
|
||||||
* Copyright (C) 2ndQuadrant, 2010-2015
|
* Copyright (C) 2ndQuadrant, 2010-2016
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -26,9 +26,25 @@
|
|||||||
|
|
||||||
static void parse_event_notifications_list(t_configuration_options *options, const char *arg);
|
static void parse_event_notifications_list(t_configuration_options *options, const char *arg);
|
||||||
static void tablespace_list_append(t_configuration_options *options, const char *arg);
|
static void tablespace_list_append(t_configuration_options *options, const char *arg);
|
||||||
|
static void exit_with_errors(ErrorList *config_errors);
|
||||||
|
|
||||||
|
/* Program name as stored by set_progname(); NULL until that has been called. */
static const char *_progname = NULL;
|
||||||
static char config_file_path[MAXPGPATH];
|
static char config_file_path[MAXPGPATH];
|
||||||
static bool config_file_provided = false;
|
static bool config_file_provided = false;
|
||||||
|
bool config_file_found = false;
|
||||||
|
|
||||||
|
|
||||||
|
void
|
||||||
|
set_progname(const char *argv0)
|
||||||
|
{
|
||||||
|
_progname = get_progname(argv0);
|
||||||
|
}
|
||||||
|
|
||||||
|
const char *
|
||||||
|
progname(void)
|
||||||
|
{
|
||||||
|
return _progname;
|
||||||
|
}
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* load_config()
|
* load_config()
|
||||||
@@ -40,61 +56,123 @@ static bool config_file_provided = false;
|
|||||||
*
|
*
|
||||||
* Any configuration options changed in this function must also be changed in
|
* Any configuration options changed in this function must also be changed in
|
||||||
* reload_config()
|
* reload_config()
|
||||||
|
*
|
||||||
|
* NOTE: this function is called before the logger is set up, so we need
|
||||||
|
* to handle the verbose option ourselves; also the default log level is NOTICE,
|
||||||
|
* so we can't use DEBUG.
|
||||||
*/
|
*/
|
||||||
bool
|
bool
|
||||||
load_config(const char *config_file, t_configuration_options *options, char *argv0)
|
load_config(const char *config_file, bool verbose, t_configuration_options *options, char *argv0)
|
||||||
{
|
{
|
||||||
struct stat config;
|
struct stat stat_config;
|
||||||
/* Sanity checks */
|
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* If a configuration file was provided, check it exists, otherwise
|
* If a configuration file was provided, check it exists, otherwise
|
||||||
* emit an error and terminate
|
* emit an error and terminate. We assume that if a user explicitly
|
||||||
|
* provides a configuration file, they'll want to make sure it's
|
||||||
|
* used and not fall back to any of the defaults.
|
||||||
*/
|
*/
|
||||||
if (config_file[0])
|
if (config_file[0])
|
||||||
{
|
{
|
||||||
strncpy(config_file_path, config_file, MAXPGPATH);
|
strncpy(config_file_path, config_file, MAXPGPATH);
|
||||||
canonicalize_path(config_file_path);
|
canonicalize_path(config_file_path);
|
||||||
|
|
||||||
if (stat(config_file_path, &config) != 0)
|
if (stat(config_file_path, &stat_config) != 0)
|
||||||
{
|
{
|
||||||
log_err(_("provided configuration file '%s' not found: %s\n"),
|
log_err(_("provided configuration file \"%s\" not found: %s\n"),
|
||||||
config_file,
|
config_file,
|
||||||
strerror(errno)
|
strerror(errno)
|
||||||
);
|
);
|
||||||
exit(ERR_BAD_CONFIG);
|
exit(ERR_BAD_CONFIG);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
if (verbose == true)
|
||||||
|
{
|
||||||
|
log_notice(_("using configuration file \"%s\"\n"), config_file);
|
||||||
|
}
|
||||||
|
|
||||||
config_file_provided = true;
|
config_file_provided = true;
|
||||||
|
config_file_found = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* If no configuration file was provided, attempt to find a default file
|
* If no configuration file was provided, attempt to find a default file
|
||||||
|
* in this order:
|
||||||
|
* - current directory
|
||||||
|
* - /etc/repmgr.conf
|
||||||
|
* - default sysconfdir
|
||||||
|
*
|
||||||
|
* here we just check for the existence of the file; parse_config()
|
||||||
|
* will handle read errors etc.
|
||||||
*/
|
*/
|
||||||
if (config_file_provided == false)
|
if (config_file_provided == false)
|
||||||
{
|
{
|
||||||
char my_exec_path[MAXPGPATH];
|
char my_exec_path[MAXPGPATH];
|
||||||
char etc_path[MAXPGPATH];
|
char sysconf_etc_path[MAXPGPATH];
|
||||||
|
|
||||||
/* First check if one is in the default sysconfdir */
|
/* 1. "./repmgr.conf" */
|
||||||
|
if (verbose == true)
|
||||||
|
{
|
||||||
|
log_notice(_("looking for configuration file in current directory\n"));
|
||||||
|
}
|
||||||
|
|
||||||
|
snprintf(config_file_path, MAXPGPATH, "./%s", CONFIG_FILE_NAME);
|
||||||
|
canonicalize_path(config_file_path);
|
||||||
|
|
||||||
|
if (stat(config_file_path, &stat_config) == 0)
|
||||||
|
{
|
||||||
|
config_file_found = true;
|
||||||
|
goto end_search;
|
||||||
|
}
|
||||||
|
|
||||||
|
/* 2. "/etc/repmgr.conf" */
|
||||||
|
if (verbose == true)
|
||||||
|
{
|
||||||
|
log_notice(_("looking for configuration file in /etc\n"));
|
||||||
|
}
|
||||||
|
|
||||||
|
snprintf(config_file_path, MAXPGPATH, "/etc/%s", CONFIG_FILE_NAME);
|
||||||
|
if (stat(config_file_path, &stat_config) == 0)
|
||||||
|
{
|
||||||
|
config_file_found = true;
|
||||||
|
goto end_search;
|
||||||
|
}
|
||||||
|
|
||||||
|
/* 3. default sysconfdir */
|
||||||
if (find_my_exec(argv0, my_exec_path) < 0)
|
if (find_my_exec(argv0, my_exec_path) < 0)
|
||||||
{
|
{
|
||||||
fprintf(stderr, _("%s: could not find own program executable\n"), argv0);
|
fprintf(stderr, _("%s: could not find own program executable\n"), argv0);
|
||||||
exit(EXIT_FAILURE);
|
exit(EXIT_FAILURE);
|
||||||
}
|
}
|
||||||
|
|
||||||
get_etc_path(my_exec_path, etc_path);
|
get_etc_path(my_exec_path, sysconf_etc_path);
|
||||||
|
|
||||||
snprintf(config_file_path, MAXPGPATH, "%s/repmgr.conf", etc_path);
|
if (verbose == true)
|
||||||
|
|
||||||
log_debug(_("Looking for configuration file in %s\n"), etc_path);
|
|
||||||
|
|
||||||
if (stat(config_file_path, &config) != 0)
|
|
||||||
{
|
{
|
||||||
/* Not found - default to ./repmgr.conf */
|
log_notice(_("looking for configuration file in %s\n"), sysconf_etc_path);
|
||||||
strncpy(config_file_path, DEFAULT_CONFIG_FILE, MAXPGPATH);
|
}
|
||||||
canonicalize_path(config_file_path);
|
|
||||||
log_debug(_("Looking for configuration file in %s\n"), config_file_path);
|
snprintf(config_file_path, MAXPGPATH, "%s/%s", sysconf_etc_path, CONFIG_FILE_NAME);
|
||||||
|
if (stat(config_file_path, &stat_config) == 0)
|
||||||
|
{
|
||||||
|
config_file_found = true;
|
||||||
|
goto end_search;
|
||||||
|
}
|
||||||
|
|
||||||
|
end_search:
|
||||||
|
if (config_file_found == true)
|
||||||
|
{
|
||||||
|
if (verbose == true)
|
||||||
|
{
|
||||||
|
log_notice(_("configuration file found at: %s\n"), config_file_path);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
if (verbose == true)
|
||||||
|
{
|
||||||
|
log_notice(_("no configuration file provided or found\n"));
|
||||||
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -102,49 +180,39 @@ load_config(const char *config_file, t_configuration_options *options, char *arg
|
|||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Parse configuration file; if any errors are encountered,
|
||||||
|
* list them and exit.
|
||||||
|
*
|
||||||
|
* Ensure any default values set here are synced with repmgr.conf.sample
|
||||||
|
* and any other documentation.
|
||||||
|
*/
|
||||||
bool
|
bool
|
||||||
parse_config(t_configuration_options *options)
|
parse_config(t_configuration_options *options)
|
||||||
{
|
{
|
||||||
FILE *fp;
|
FILE *fp;
|
||||||
char *s,
|
char *s,
|
||||||
buff[MAXLINELENGTH];
|
buf[MAXLINELENGTH];
|
||||||
char name[MAXLEN];
|
char name[MAXLEN];
|
||||||
char value[MAXLEN];
|
char value[MAXLEN];
|
||||||
|
|
||||||
/* For sanity-checking provided conninfo string */
|
/* For sanity-checking provided conninfo string */
|
||||||
PQconninfoOption *conninfo_options;
|
PQconninfoOption *conninfo_options;
|
||||||
char *conninfo_errmsg = NULL;
|
char *conninfo_errmsg = NULL;
|
||||||
|
|
||||||
fp = fopen(config_file_path, "r");
|
/* Collate configuration file errors here for friendlier reporting */
|
||||||
|
static ErrorList config_errors = { NULL, NULL };
|
||||||
|
|
||||||
/*
|
bool node_found = false;
|
||||||
* Since some commands don't require a config file at all, not having one
|
|
||||||
* isn't necessarily a problem.
|
/* Initialize configuration options with sensible defaults
|
||||||
*
|
* note: the default log level is set in log.c and does not need
|
||||||
* If the user explictly provided a configuration file and we can't
|
* to be initialised here
|
||||||
* read it we'll raise an error.
|
|
||||||
*
|
|
||||||
* If no configuration file was provided, we'll try and read the default\
|
|
||||||
* file if it exists and is readable, but won't worry if it's not.
|
|
||||||
*/
|
*/
|
||||||
if (fp == NULL)
|
|
||||||
{
|
|
||||||
if (config_file_provided)
|
|
||||||
{
|
|
||||||
log_err(_("unable to open provided configuration file '%s'; terminating\n"), config_file_path);
|
|
||||||
exit(ERR_BAD_CONFIG);
|
|
||||||
}
|
|
||||||
|
|
||||||
log_notice(_("no configuration file provided and default file '%s' not found - "
|
|
||||||
"continuing with default values\n"),
|
|
||||||
DEFAULT_CONFIG_FILE);
|
|
||||||
return false;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* Initialize configuration options with sensible defaults */
|
|
||||||
memset(options->cluster_name, 0, sizeof(options->cluster_name));
|
memset(options->cluster_name, 0, sizeof(options->cluster_name));
|
||||||
options->node = -1;
|
options->node = -1;
|
||||||
options->upstream_node = NO_UPSTREAM_NODE;
|
options->upstream_node = NO_UPSTREAM_NODE;
|
||||||
|
options->use_replication_slots = 0;
|
||||||
memset(options->conninfo, 0, sizeof(options->conninfo));
|
memset(options->conninfo, 0, sizeof(options->conninfo));
|
||||||
options->failover = MANUAL_FAILOVER;
|
options->failover = MANUAL_FAILOVER;
|
||||||
options->priority = DEFAULT_PRIORITY;
|
options->priority = DEFAULT_PRIORITY;
|
||||||
@@ -162,25 +230,58 @@ parse_config(t_configuration_options *options)
|
|||||||
|
|
||||||
/* default to 6 reconnection attempts at intervals of 10 seconds */
|
/* default to 6 reconnection attempts at intervals of 10 seconds */
|
||||||
options->reconnect_attempts = 6;
|
options->reconnect_attempts = 6;
|
||||||
options->reconnect_intvl = 10;
|
options->reconnect_interval = 10;
|
||||||
|
|
||||||
options->monitor_interval_secs = 2;
|
options->monitor_interval_secs = 2;
|
||||||
options->retry_promote_interval_secs = 300;
|
options->retry_promote_interval_secs = 300;
|
||||||
|
|
||||||
|
/* default to resyncing repl_nodes table every 30 seconds on the witness server */
|
||||||
|
options->witness_repl_nodes_sync_interval_secs = 30;
|
||||||
|
|
||||||
memset(options->event_notification_command, 0, sizeof(options->event_notification_command));
|
memset(options->event_notification_command, 0, sizeof(options->event_notification_command));
|
||||||
|
|
||||||
options->tablespace_mapping.head = NULL;
|
options->tablespace_mapping.head = NULL;
|
||||||
options->tablespace_mapping.tail = NULL;
|
options->tablespace_mapping.tail = NULL;
|
||||||
|
|
||||||
|
/*
|
||||||
|
* If no configuration file available (user didn't specify and none found
|
||||||
|
* in the default locations), return with default values
|
||||||
|
*/
|
||||||
|
if (config_file_found == false)
|
||||||
|
{
|
||||||
|
log_verbose(LOG_NOTICE, _("no configuration file provided and no default file found - "
|
||||||
|
"continuing with default values\n"));
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
|
fp = fopen(config_file_path, "r");
|
||||||
|
|
||||||
/* Read next line */
|
/*
|
||||||
while ((s = fgets(buff, sizeof buff, fp)) != NULL)
|
* A configuration file has been found, either provided by the user
|
||||||
|
* or found in one of the default locations. If we can't open it,
|
||||||
|
* fail with an error.
|
||||||
|
*/
|
||||||
|
if (fp == NULL)
|
||||||
|
{
|
||||||
|
if (config_file_provided)
|
||||||
|
{
|
||||||
|
log_err(_("unable to open provided configuration file \"%s\"; terminating\n"), config_file_path);
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
log_err(_("unable to open default configuration file \"%s\"; terminating\n"), config_file_path);
|
||||||
|
}
|
||||||
|
|
||||||
|
exit(ERR_BAD_CONFIG);
|
||||||
|
}
|
||||||
|
|
||||||
|
/* Read file */
|
||||||
|
while ((s = fgets(buf, sizeof buf, fp)) != NULL)
|
||||||
{
|
{
|
||||||
bool known_parameter = true;
|
bool known_parameter = true;
|
||||||
|
|
||||||
/* Parse name/value pair from line */
|
/* Parse name/value pair from line */
|
||||||
parse_line(buff, name, value);
|
parse_line(buf, name, value);
|
||||||
|
|
||||||
/* Skip blank lines */
|
/* Skip blank lines */
|
||||||
if (!strlen(name))
|
if (!strlen(name))
|
||||||
@@ -194,9 +295,12 @@ parse_config(t_configuration_options *options)
|
|||||||
if (strcmp(name, "cluster") == 0)
|
if (strcmp(name, "cluster") == 0)
|
||||||
strncpy(options->cluster_name, value, MAXLEN);
|
strncpy(options->cluster_name, value, MAXLEN);
|
||||||
else if (strcmp(name, "node") == 0)
|
else if (strcmp(name, "node") == 0)
|
||||||
options->node = atoi(value);
|
{
|
||||||
|
options->node = repmgr_atoi(value, "node", &config_errors, false);
|
||||||
|
node_found = true;
|
||||||
|
}
|
||||||
else if (strcmp(name, "upstream_node") == 0)
|
else if (strcmp(name, "upstream_node") == 0)
|
||||||
options->upstream_node = atoi(value);
|
options->upstream_node = repmgr_atoi(value, "upstream_node", &config_errors, false);
|
||||||
else if (strcmp(name, "conninfo") == 0)
|
else if (strcmp(name, "conninfo") == 0)
|
||||||
strncpy(options->conninfo, value, MAXLEN);
|
strncpy(options->conninfo, value, MAXLEN);
|
||||||
else if (strcmp(name, "rsync_options") == 0)
|
else if (strcmp(name, "rsync_options") == 0)
|
||||||
@@ -223,12 +327,11 @@ parse_config(t_configuration_options *options)
|
|||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
log_err(_("value for 'failover' must be 'automatic' or 'manual'\n"));
|
error_list_append(&config_errors,_("value for 'failover' must be 'automatic' or 'manual'\n"));
|
||||||
exit(ERR_BAD_CONFIG);
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
else if (strcmp(name, "priority") == 0)
|
else if (strcmp(name, "priority") == 0)
|
||||||
options->priority = atoi(value);
|
options->priority = repmgr_atoi(value, "priority", &config_errors, true);
|
||||||
else if (strcmp(name, "node_name") == 0)
|
else if (strcmp(name, "node_name") == 0)
|
||||||
strncpy(options->node_name, value, MAXLEN);
|
strncpy(options->node_name, value, MAXLEN);
|
||||||
else if (strcmp(name, "promote_command") == 0)
|
else if (strcmp(name, "promote_command") == 0)
|
||||||
@@ -236,11 +339,16 @@ parse_config(t_configuration_options *options)
|
|||||||
else if (strcmp(name, "follow_command") == 0)
|
else if (strcmp(name, "follow_command") == 0)
|
||||||
strncpy(options->follow_command, value, MAXLEN);
|
strncpy(options->follow_command, value, MAXLEN);
|
||||||
else if (strcmp(name, "master_response_timeout") == 0)
|
else if (strcmp(name, "master_response_timeout") == 0)
|
||||||
options->master_response_timeout = atoi(value);
|
options->master_response_timeout = repmgr_atoi(value, "master_response_timeout", &config_errors, false);
|
||||||
|
/* 'primary_response_timeout' as synonym for 'master_response_timeout' -
|
||||||
|
* we'll switch terminology in a future release (3.1?)
|
||||||
|
*/
|
||||||
|
else if (strcmp(name, "primary_response_timeout") == 0)
|
||||||
|
options->master_response_timeout = repmgr_atoi(value, "primary_response_timeout", &config_errors, false);
|
||||||
else if (strcmp(name, "reconnect_attempts") == 0)
|
else if (strcmp(name, "reconnect_attempts") == 0)
|
||||||
options->reconnect_attempts = atoi(value);
|
options->reconnect_attempts = repmgr_atoi(value, "reconnect_attempts", &config_errors, false);
|
||||||
else if (strcmp(name, "reconnect_interval") == 0)
|
else if (strcmp(name, "reconnect_interval") == 0)
|
||||||
options->reconnect_intvl = atoi(value);
|
options->reconnect_interval = repmgr_atoi(value, "reconnect_interval", &config_errors, false);
|
||||||
else if (strcmp(name, "pg_bindir") == 0)
|
else if (strcmp(name, "pg_bindir") == 0)
|
||||||
strncpy(options->pg_bindir, value, MAXLEN);
|
strncpy(options->pg_bindir, value, MAXLEN);
|
||||||
else if (strcmp(name, "pg_ctl_options") == 0)
|
else if (strcmp(name, "pg_ctl_options") == 0)
|
||||||
@@ -250,11 +358,14 @@ parse_config(t_configuration_options *options)
|
|||||||
else if (strcmp(name, "logfile") == 0)
|
else if (strcmp(name, "logfile") == 0)
|
||||||
strncpy(options->logfile, value, MAXLEN);
|
strncpy(options->logfile, value, MAXLEN);
|
||||||
else if (strcmp(name, "monitor_interval_secs") == 0)
|
else if (strcmp(name, "monitor_interval_secs") == 0)
|
||||||
options->monitor_interval_secs = atoi(value);
|
options->monitor_interval_secs = repmgr_atoi(value, "monitor_interval_secs", &config_errors, false);
|
||||||
else if (strcmp(name, "retry_promote_interval_secs") == 0)
|
else if (strcmp(name, "retry_promote_interval_secs") == 0)
|
||||||
options->retry_promote_interval_secs = atoi(value);
|
options->retry_promote_interval_secs = repmgr_atoi(value, "retry_promote_interval_secs", &config_errors, false);
|
||||||
|
else if (strcmp(name, "witness_repl_nodes_sync_interval_secs") == 0)
|
||||||
|
options->witness_repl_nodes_sync_interval_secs = repmgr_atoi(value, "witness_repl_nodes_sync_interval_secs", &config_errors, false);
|
||||||
else if (strcmp(name, "use_replication_slots") == 0)
|
else if (strcmp(name, "use_replication_slots") == 0)
|
||||||
options->use_replication_slots = atoi(value);
|
/* XXX we should have a dedicated boolean argument format */
|
||||||
|
options->use_replication_slots = repmgr_atoi(value, "use_replication_slots", &config_errors, false);
|
||||||
else if (strcmp(name, "event_notification_command") == 0)
|
else if (strcmp(name, "event_notification_command") == 0)
|
||||||
strncpy(options->event_notification_command, value, MAXLEN);
|
strncpy(options->event_notification_command, value, MAXLEN);
|
||||||
else if (strcmp(name, "event_notifications") == 0)
|
else if (strcmp(name, "event_notifications") == 0)
|
||||||
@@ -274,76 +385,54 @@ parse_config(t_configuration_options *options)
|
|||||||
* as currently e.g. an empty `node` value will be converted to '0'.
|
* as currently e.g. an empty `node` value will be converted to '0'.
|
||||||
*/
|
*/
|
||||||
if (known_parameter == true && !strlen(value)) {
|
if (known_parameter == true && !strlen(value)) {
|
||||||
log_err(_("no value provided for parameter '%s'\n"), name);
|
char error_message_buf[MAXLEN] = "";
|
||||||
exit(ERR_BAD_CONFIG);
|
snprintf(error_message_buf,
|
||||||
|
MAXLEN,
|
||||||
|
_("no value provided for parameter \"%s\""),
|
||||||
|
name);
|
||||||
|
|
||||||
|
error_list_append(&config_errors, error_message_buf);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
fclose(fp);
|
fclose(fp);
|
||||||
|
|
||||||
/* Check config settings */
|
|
||||||
|
|
||||||
/* The following checks are for the presence of the parameter */
|
if (node_found == false)
|
||||||
if (*options->cluster_name == '\0')
|
|
||||||
{
|
{
|
||||||
log_err(_("required parameter 'cluster' was not found\n"));
|
error_list_append(&config_errors, _("\"node\": parameter was not found"));
|
||||||
exit(ERR_BAD_CONFIG);
|
}
|
||||||
|
else if (options->node == 0)
|
||||||
|
{
|
||||||
|
error_list_append(&config_errors, _("\"node\": must be greater than zero"));
|
||||||
}
|
}
|
||||||
|
|
||||||
if (options->node == -1)
|
if (strlen(options->conninfo))
|
||||||
{
|
{
|
||||||
log_err(_("required parameter 'node' was not found\n"));
|
|
||||||
exit(ERR_BAD_CONFIG);
|
/* Sanity check the provided conninfo string
|
||||||
|
*
|
||||||
|
* NOTE: PQconninfoParse() verifies the string format and checks for valid options
|
||||||
|
* but does not sanity check values
|
||||||
|
*/
|
||||||
|
conninfo_options = PQconninfoParse(options->conninfo, &conninfo_errmsg);
|
||||||
|
if (conninfo_options == NULL)
|
||||||
|
{
|
||||||
|
char error_message_buf[MAXLEN] = "";
|
||||||
|
snprintf(error_message_buf,
|
||||||
|
MAXLEN,
|
||||||
|
_("\"conninfo\": %s"),
|
||||||
|
conninfo_errmsg);
|
||||||
|
|
||||||
|
error_list_append(&config_errors, error_message_buf);
|
||||||
|
}
|
||||||
|
|
||||||
|
PQconninfoFree(conninfo_options);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (options->node == 0)
|
if (config_errors.head != NULL)
|
||||||
{
|
{
|
||||||
log_err(_("'node' must be an integer greater than zero\n"));
|
exit_with_errors(&config_errors);
|
||||||
exit(ERR_BAD_CONFIG);
|
|
||||||
}
|
|
||||||
|
|
||||||
if (*options->node_name == '\0')
|
|
||||||
{
|
|
||||||
log_err(_("required parameter 'node_name' was not found\n"));
|
|
||||||
exit(ERR_BAD_CONFIG);
|
|
||||||
}
|
|
||||||
|
|
||||||
if (*options->conninfo == '\0')
|
|
||||||
{
|
|
||||||
log_err(_("required parameter 'conninfo' was not found\n"));
|
|
||||||
exit(ERR_BAD_CONFIG);
|
|
||||||
}
|
|
||||||
|
|
||||||
/* Sanity check the provided conninfo string
|
|
||||||
*
|
|
||||||
* NOTE: this verifies the string format and checks for valid options
|
|
||||||
* but does not sanity check values
|
|
||||||
*/
|
|
||||||
conninfo_options = PQconninfoParse(options->conninfo, &conninfo_errmsg);
|
|
||||||
if (conninfo_options == NULL)
|
|
||||||
{
|
|
||||||
log_err(_("Parameter 'conninfo' is invalid: %s"), conninfo_errmsg);
|
|
||||||
exit(ERR_BAD_CONFIG);
|
|
||||||
}
|
|
||||||
PQconninfoFree(conninfo_options);
|
|
||||||
|
|
||||||
/* The following checks are for valid parameter values */
|
|
||||||
if (options->master_response_timeout <= 0)
|
|
||||||
{
|
|
||||||
log_err(_("'master_response_timeout' must be greater than zero\n"));
|
|
||||||
exit(ERR_BAD_CONFIG);
|
|
||||||
}
|
|
||||||
|
|
||||||
if (options->reconnect_attempts < 0)
|
|
||||||
{
|
|
||||||
log_err(_("'reconnect_attempts' must be zero or greater\n"));
|
|
||||||
exit(ERR_BAD_CONFIG);
|
|
||||||
}
|
|
||||||
|
|
||||||
if (options->reconnect_intvl < 0)
|
|
||||||
{
|
|
||||||
log_err(_("'reconnect_interval' must be zero or greater\n"));
|
|
||||||
exit(ERR_BAD_CONFIG);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
return true;
|
return true;
|
||||||
@@ -378,7 +467,7 @@ trim(char *s)
|
|||||||
}
|
}
|
||||||
|
|
||||||
void
|
void
|
||||||
parse_line(char *buff, char *name, char *value)
|
parse_line(char *buf, char *name, char *value)
|
||||||
{
|
{
|
||||||
int i = 0;
|
int i = 0;
|
||||||
int j = 0;
|
int j = 0;
|
||||||
@@ -389,10 +478,10 @@ parse_line(char *buff, char *name, char *value)
|
|||||||
for (; i < MAXLEN; ++i)
|
for (; i < MAXLEN; ++i)
|
||||||
{
|
{
|
||||||
|
|
||||||
if (buff[i] == '=')
|
if (buf[i] == '=')
|
||||||
break;
|
break;
|
||||||
|
|
||||||
switch(buff[i])
|
switch(buf[i])
|
||||||
{
|
{
|
||||||
/* Ignore whitespace */
|
/* Ignore whitespace */
|
||||||
case ' ':
|
case ' ':
|
||||||
@@ -401,7 +490,7 @@ parse_line(char *buff, char *name, char *value)
|
|||||||
case '\t':
|
case '\t':
|
||||||
continue;
|
continue;
|
||||||
default:
|
default:
|
||||||
name[j++] = buff[i];
|
name[j++] = buf[i];
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
name[j] = '\0';
|
name[j] = '\0';
|
||||||
@@ -411,9 +500,9 @@ parse_line(char *buff, char *name, char *value)
|
|||||||
*/
|
*/
|
||||||
for (; i < MAXLEN; ++i)
|
for (; i < MAXLEN; ++i)
|
||||||
{
|
{
|
||||||
if (buff[i+1] == ' ')
|
if (buf[i+1] == ' ')
|
||||||
continue;
|
continue;
|
||||||
if (buff[i+1] == '\t')
|
if (buf[i+1] == '\t')
|
||||||
continue;
|
continue;
|
||||||
|
|
||||||
break;
|
break;
|
||||||
@@ -424,12 +513,12 @@ parse_line(char *buff, char *name, char *value)
|
|||||||
*/
|
*/
|
||||||
j = 0;
|
j = 0;
|
||||||
for (++i; i < MAXLEN; ++i)
|
for (++i; i < MAXLEN; ++i)
|
||||||
if (buff[i] == '\'')
|
if (buf[i] == '\'')
|
||||||
continue;
|
continue;
|
||||||
else if (buff[i] == '#')
|
else if (buf[i] == '#')
|
||||||
break;
|
break;
|
||||||
else if (buff[i] != '\n')
|
else if (buf[i] != '\n')
|
||||||
value[j++] = buff[i];
|
value[j++] = buf[i];
|
||||||
else
|
else
|
||||||
break;
|
break;
|
||||||
value[j] = '\0';
|
value[j] = '\0';
|
||||||
@@ -491,7 +580,7 @@ reload_config(t_configuration_options *orig_options)
|
|||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
|
||||||
if (new_options.reconnect_intvl < 0)
|
if (new_options.reconnect_interval < 0)
|
||||||
{
|
{
|
||||||
log_warning(_("new value for 'reconnect_interval' must be zero or greater\n"));
|
log_warning(_("new value for 'reconnect_interval' must be zero or greater\n"));
|
||||||
return false;
|
return false;
|
||||||
@@ -610,10 +699,10 @@ reload_config(t_configuration_options *orig_options)
|
|||||||
config_changed = true;
|
config_changed = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
/* reconnect_intvl */
|
/* reconnect_interval */
|
||||||
if (orig_options->reconnect_intvl != new_options.reconnect_intvl)
|
if (orig_options->reconnect_interval != new_options.reconnect_interval)
|
||||||
{
|
{
|
||||||
orig_options->reconnect_intvl = new_options.reconnect_intvl;
|
orig_options->reconnect_interval = new_options.reconnect_interval;
|
||||||
config_changed = true;
|
config_changed = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -665,6 +754,96 @@ reload_config(t_configuration_options *orig_options)
|
|||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
void
|
||||||
|
error_list_append(ErrorList *error_list, char *error_message)
|
||||||
|
{
|
||||||
|
ErrorListCell *cell;
|
||||||
|
|
||||||
|
cell = (ErrorListCell *) pg_malloc0(sizeof(ErrorListCell));
|
||||||
|
|
||||||
|
if (cell == NULL)
|
||||||
|
{
|
||||||
|
log_err(_("unable to allocate memory; terminating.\n"));
|
||||||
|
exit(ERR_BAD_CONFIG);
|
||||||
|
}
|
||||||
|
|
||||||
|
cell->error_message = pg_malloc0(MAXLEN);
|
||||||
|
strncpy(cell->error_message, error_message, MAXLEN);
|
||||||
|
|
||||||
|
if (error_list->tail)
|
||||||
|
{
|
||||||
|
error_list->tail->next = cell;
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
error_list->head = cell;
|
||||||
|
}
|
||||||
|
|
||||||
|
error_list->tail = cell;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Convert provided string to an integer using strtol;
|
||||||
|
* on error, if a callback is provided, pass the error message to that,
|
||||||
|
* otherwise exit
|
||||||
|
*/
|
||||||
|
int
|
||||||
|
repmgr_atoi(const char *value, const char *config_item, ErrorList *error_list, bool allow_negative)
|
||||||
|
{
|
||||||
|
char *endptr;
|
||||||
|
long longval = 0;
|
||||||
|
char error_message_buf[MAXLEN] = "";
|
||||||
|
|
||||||
|
/* It's possible that some versions of strtol() don't treat an empty
|
||||||
|
* string as an error.
|
||||||
|
*/
|
||||||
|
|
||||||
|
if (*value == '\0')
|
||||||
|
{
|
||||||
|
snprintf(error_message_buf,
|
||||||
|
MAXLEN,
|
||||||
|
_("no value provided for \"%s\""),
|
||||||
|
config_item);
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
errno = 0;
|
||||||
|
longval = strtol(value, &endptr, 10);
|
||||||
|
|
||||||
|
if (value == endptr || errno)
|
||||||
|
{
|
||||||
|
snprintf(error_message_buf,
|
||||||
|
MAXLEN,
|
||||||
|
_("\"%s\": invalid value (provided: \"%s\")"),
|
||||||
|
config_item, value);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/* Disallow negative values for most parameters */
|
||||||
|
if (allow_negative == false && longval < 0)
|
||||||
|
{
|
||||||
|
snprintf(error_message_buf,
|
||||||
|
MAXLEN,
|
||||||
|
_("\"%s\" must be zero or greater (provided: %s)"),
|
||||||
|
config_item, value);
|
||||||
|
}
|
||||||
|
|
||||||
|
/* Error message buffer is set */
|
||||||
|
if (error_message_buf[0] != '\0')
|
||||||
|
{
|
||||||
|
if (error_list == NULL)
|
||||||
|
{
|
||||||
|
log_err("%s\n", error_message_buf);
|
||||||
|
exit(ERR_BAD_CONFIG);
|
||||||
|
}
|
||||||
|
|
||||||
|
error_list_append(error_list, error_message_buf);
|
||||||
|
}
|
||||||
|
|
||||||
|
return (int32) longval;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* Split argument into old_dir and new_dir and append to tablespace mapping
|
* Split argument into old_dir and new_dir and append to tablespace mapping
|
||||||
@@ -797,3 +976,21 @@ parse_event_notifications_list(t_configuration_options *options, const char *arg
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
static void
|
||||||
|
exit_with_errors(ErrorList *config_errors)
|
||||||
|
{
|
||||||
|
ErrorListCell *cell;
|
||||||
|
|
||||||
|
log_err(_("%s: following errors were found in the configuration file.\n"), progname());
|
||||||
|
|
||||||
|
for (cell = config_errors->head; cell; cell = cell->next)
|
||||||
|
{
|
||||||
|
log_err("%s\n", cell->error_message);
|
||||||
|
}
|
||||||
|
|
||||||
|
exit(ERR_BAD_CONFIG);
|
||||||
|
}
|
||||||
|
|
||||||
|
|||||||
29
config.h
29
config.h
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* config.h
|
* config.h
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2015
|
* Copyright (c) 2ndQuadrant, 2010-2016
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -24,6 +24,7 @@
|
|||||||
|
|
||||||
#include "strutil.h"
|
#include "strutil.h"
|
||||||
|
|
||||||
|
#define CONFIG_FILE_NAME "repmgr.conf"
|
||||||
|
|
||||||
typedef struct EventNotificationListCell
|
typedef struct EventNotificationListCell
|
||||||
{
|
{
|
||||||
@@ -67,26 +68,46 @@ typedef struct
|
|||||||
char ssh_options[QUERY_STR_LEN];
|
char ssh_options[QUERY_STR_LEN];
|
||||||
int master_response_timeout;
|
int master_response_timeout;
|
||||||
int reconnect_attempts;
|
int reconnect_attempts;
|
||||||
int reconnect_intvl;
|
int reconnect_interval;
|
||||||
char pg_bindir[MAXLEN];
|
char pg_bindir[MAXLEN];
|
||||||
char pg_ctl_options[MAXLEN];
|
char pg_ctl_options[MAXLEN];
|
||||||
char pg_basebackup_options[MAXLEN];
|
char pg_basebackup_options[MAXLEN];
|
||||||
char logfile[MAXLEN];
|
char logfile[MAXLEN];
|
||||||
int monitor_interval_secs;
|
int monitor_interval_secs;
|
||||||
int retry_promote_interval_secs;
|
int retry_promote_interval_secs;
|
||||||
|
int witness_repl_nodes_sync_interval_secs;
|
||||||
int use_replication_slots;
|
int use_replication_slots;
|
||||||
char event_notification_command[MAXLEN];
|
char event_notification_command[MAXLEN];
|
||||||
EventNotificationList event_notifications;
|
EventNotificationList event_notifications;
|
||||||
TablespaceList tablespace_mapping;
|
TablespaceList tablespace_mapping;
|
||||||
} t_configuration_options;
|
} t_configuration_options;
|
||||||
|
|
||||||
#define T_CONFIGURATION_OPTIONS_INITIALIZER { "", -1, NO_UPSTREAM_NODE, "", MANUAL_FAILOVER, -1, "", "", "", "", "", "", "", -1, -1, -1, "", "", "", "", 0, 0, 0, "", { NULL, NULL }, {NULL, NULL} }
|
#define T_CONFIGURATION_OPTIONS_INITIALIZER { "", -1, NO_UPSTREAM_NODE, "", MANUAL_FAILOVER, -1, "", "", "", "", "", "", "", -1, -1, -1, "", "", "", "", 0, 0, 0, 0, "", { NULL, NULL }, {NULL, NULL} }
|
||||||
|
|
||||||
|
typedef struct ErrorListCell
|
||||||
|
{
|
||||||
|
struct ErrorListCell *next;
|
||||||
|
char *error_message;
|
||||||
|
} ErrorListCell;
|
||||||
|
|
||||||
bool load_config(const char *config_file, t_configuration_options *options, char *argv0);
|
typedef struct ErrorList
|
||||||
|
{
|
||||||
|
ErrorListCell *head;
|
||||||
|
ErrorListCell *tail;
|
||||||
|
} ErrorList;
|
||||||
|
|
||||||
|
void set_progname(const char *argv0);
|
||||||
|
const char * progname(void);
|
||||||
|
|
||||||
|
bool load_config(const char *config_file, bool verbose, t_configuration_options *options, char *argv0);
|
||||||
bool reload_config(t_configuration_options *orig_options);
|
bool reload_config(t_configuration_options *orig_options);
|
||||||
bool parse_config(t_configuration_options *options);
|
bool parse_config(t_configuration_options *options);
|
||||||
void parse_line(char *buff, char *name, char *value);
|
void parse_line(char *buff, char *name, char *value);
|
||||||
char *trim(char *s);
|
char *trim(char *s);
|
||||||
|
void error_list_append(ErrorList *error_list, char *error_message);
|
||||||
|
int repmgr_atoi(const char *s,
|
||||||
|
const char *config_item,
|
||||||
|
ErrorList *error_list,
|
||||||
|
bool allow_negative);
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|||||||
82
dbutils.h
82
dbutils.h
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* dbutils.h
|
* dbutils.h
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2015
|
* Copyright (c) 2ndQuadrant, 2010-2016
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -20,13 +20,71 @@
|
|||||||
#ifndef _REPMGR_DBUTILS_H_
|
#ifndef _REPMGR_DBUTILS_H_
|
||||||
#define _REPMGR_DBUTILS_H_
|
#define _REPMGR_DBUTILS_H_
|
||||||
|
|
||||||
|
#include "access/xlogdefs.h"
|
||||||
|
|
||||||
#include "config.h"
|
#include "config.h"
|
||||||
#include "strutil.h"
|
#include "strutil.h"
|
||||||
|
|
||||||
|
|
||||||
|
typedef enum {
|
||||||
|
UNKNOWN = 0,
|
||||||
|
MASTER,
|
||||||
|
STANDBY,
|
||||||
|
WITNESS
|
||||||
|
} t_server_type;
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Struct to store node information
|
||||||
|
*/
|
||||||
|
typedef struct s_node_info
|
||||||
|
{
|
||||||
|
int node_id;
|
||||||
|
int upstream_node_id;
|
||||||
|
t_server_type type;
|
||||||
|
char name[MAXLEN];
|
||||||
|
char conninfo_str[MAXLEN];
|
||||||
|
char slot_name[MAXLEN];
|
||||||
|
int priority;
|
||||||
|
bool active;
|
||||||
|
bool is_ready;
|
||||||
|
bool is_visible;
|
||||||
|
XLogRecPtr xlog_location;
|
||||||
|
} t_node_info;
|
||||||
|
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Struct to store replication slot information
|
||||||
|
*/
|
||||||
|
|
||||||
|
typedef struct s_replication_slot
|
||||||
|
{
|
||||||
|
char slot_name[MAXLEN];
|
||||||
|
char slot_type[MAXLEN];
|
||||||
|
bool active;
|
||||||
|
} t_replication_slot;
|
||||||
|
|
||||||
|
|
||||||
|
#define T_NODE_INFO_INITIALIZER { \
|
||||||
|
NODE_NOT_FOUND, \
|
||||||
|
NO_UPSTREAM_NODE, \
|
||||||
|
UNKNOWN, \
|
||||||
|
"", \
|
||||||
|
"", \
|
||||||
|
"", \
|
||||||
|
DEFAULT_PRIORITY, \
|
||||||
|
true, \
|
||||||
|
false, \
|
||||||
|
false, \
|
||||||
|
InvalidXLogRecPtr \
|
||||||
|
}
|
||||||
|
|
||||||
|
PGconn *_establish_db_connection(const char *conninfo,
|
||||||
|
const bool exit_on_error,
|
||||||
|
const bool log_notice);
|
||||||
PGconn *establish_db_connection(const char *conninfo,
|
PGconn *establish_db_connection(const char *conninfo,
|
||||||
const bool exit_on_error);
|
const bool exit_on_error);
|
||||||
|
PGconn *test_db_connection(const char *conninfo,
|
||||||
|
const bool exit_on_error);
|
||||||
PGconn *establish_db_connection_by_params(const char *keywords[],
|
PGconn *establish_db_connection_by_params(const char *keywords[],
|
||||||
const char *values[],
|
const char *values[],
|
||||||
const bool exit_on_error);
|
const bool exit_on_error);
|
||||||
@@ -45,7 +103,7 @@ int guc_set(PGconn *conn, const char *parameter, const char *op,
|
|||||||
const char *value);
|
const char *value);
|
||||||
int guc_set_typed(PGconn *conn, const char *parameter, const char *op,
|
int guc_set_typed(PGconn *conn, const char *parameter, const char *op,
|
||||||
const char *value, const char *datatype);
|
const char *value, const char *datatype);
|
||||||
|
bool get_conninfo_value(const char *conninfo, const char *keyword, char *output);
|
||||||
PGconn *get_upstream_connection(PGconn *standby_conn, char *cluster,
|
PGconn *get_upstream_connection(PGconn *standby_conn, char *cluster,
|
||||||
int node_id,
|
int node_id,
|
||||||
int *upstream_node_id_ptr,
|
int *upstream_node_id_ptr,
|
||||||
@@ -57,16 +115,22 @@ int wait_connection_availability(PGconn *conn, long long timeout);
|
|||||||
bool cancel_query(PGconn *conn, int timeout);
|
bool cancel_query(PGconn *conn, int timeout);
|
||||||
char *get_repmgr_schema(void);
|
char *get_repmgr_schema(void);
|
||||||
char *get_repmgr_schema_quoted(PGconn *conn);
|
char *get_repmgr_schema_quoted(PGconn *conn);
|
||||||
bool create_replication_slot(PGconn *conn, char *slot_name);
|
bool create_replication_slot(PGconn *conn, char *slot_name, int server_version_num);
|
||||||
|
int get_slot_record(PGconn *conn, char *slot_name, t_replication_slot *record);
|
||||||
|
bool drop_replication_slot(PGconn *conn, char *slot_name);
|
||||||
bool start_backup(PGconn *conn, char *first_wal_segment, bool fast_checkpoint);
|
bool start_backup(PGconn *conn, char *first_wal_segment, bool fast_checkpoint);
|
||||||
bool stop_backup(PGconn *conn, char *last_wal_segment);
|
bool stop_backup(PGconn *conn, char *last_wal_segment);
|
||||||
bool set_config_bool(PGconn *conn, const char *config_param, bool state);
|
bool set_config_bool(PGconn *conn, const char *config_param, bool state);
|
||||||
bool copy_configuration(PGconn *masterconn, PGconn *witnessconn, char *cluster_name);
|
bool witness_copy_node_records(PGconn *masterconn, PGconn *witnessconn, char *cluster_name);
|
||||||
bool create_node_record(PGconn *conn, char *action, int node, char *type, int upstream_node, char *cluster_name, char *node_name, char *conninfo, int priority, char *slot_name);
|
bool create_node_record(PGconn *conn, char *action, int node, char *type, int upstream_node, char *cluster_name, char *node_name, char *conninfo, int priority, char *slot_name, bool active);
|
||||||
bool delete_node_record(PGconn *conn, int node, char *action);
|
bool delete_node_record(PGconn *conn, int node, char *action);
|
||||||
bool create_event_record(PGconn *conn, t_configuration_options *options, int node_id, char *event, bool successful, char *details);
|
int get_node_record(PGconn *conn, char *cluster, int node_id, t_node_info *node_info);
|
||||||
|
bool update_node_record_status(PGconn *conn, char *cluster_name, int this_node_id, char *type, int upstream_node_id, bool active);
|
||||||
bool update_node_record_set_upstream(PGconn *conn, char *cluster_name, int this_node_id, int new_upstream_node_id);
|
bool update_node_record_set_upstream(PGconn *conn, char *cluster_name, int this_node_id, int new_upstream_node_id);
|
||||||
PGresult * get_node_record(PGconn *conn, char *cluster, int node_id);
|
bool create_event_record(PGconn *conn, t_configuration_options *options, int node_id, char *event, bool successful, char *details);
|
||||||
|
|
||||||
|
int get_node_replication_state(PGconn *conn, char *node_name, char *output);
|
||||||
|
t_server_type parse_node_type(const char *type);
|
||||||
|
int get_data_checksum_version(const char *data_directory);
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
|||||||
6
debian/DEBIAN/control
vendored
6
debian/DEBIAN/control
vendored
@@ -1,9 +1,9 @@
|
|||||||
Package: repmgr-auto
|
Package: repmgr-auto
|
||||||
Version: 2.0beta2
|
Version: 3.0.1
|
||||||
Section: database
|
Section: database
|
||||||
Priority: optional
|
Priority: optional
|
||||||
Architecture: all
|
Architecture: all
|
||||||
Depends: rsync, postgresql-9.0 | postgresql-9.1 | postgresql-9.2 | postgresql-9.3 | postgresql-9.4
|
Depends: rsync, postgresql-9.3 | postgresql-9.4
|
||||||
Maintainer: Jaime Casanova <jaime@2ndQuadrant.com>
|
Maintainer: Self built package <user@localhost>
|
||||||
Description: PostgreSQL replication setup, magament and monitoring
|
Description: PostgreSQL replication setup, magament and monitoring
|
||||||
has two main executables
|
has two main executables
|
||||||
|
|||||||
2
debian/repmgr.repmgrd.init
vendored
2
debian/repmgr.repmgrd.init
vendored
@@ -59,7 +59,7 @@ do_stop()
|
|||||||
# 0 if daemon has been stopped
|
# 0 if daemon has been stopped
|
||||||
# 1 if daemon was already stopped
|
# 1 if daemon was already stopped
|
||||||
# other if daemon could not be stopped or a failure occurred
|
# other if daemon could not be stopped or a failure occurred
|
||||||
start-stop-daemon --stop --quiet --retry=TERM/30/KILL/5 --pidfile $REPMGRD_PIDFILE --exec $REPMGRD_BIN
|
start-stop-daemon --stop --quiet --retry=TERM/30/KILL/5 --pidfile $REPMGRD_PIDFILE --name "$(basename $REPMGRD_BIN)"
|
||||||
}
|
}
|
||||||
|
|
||||||
case "$1" in
|
case "$1" in
|
||||||
|
|||||||
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* errcode.h
|
* errcode.h
|
||||||
* Copyright (C) 2ndQuadrant, 2010-2015
|
* Copyright (C) 2ndQuadrant, 2010-2016
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -36,5 +36,7 @@
|
|||||||
#define ERR_SYS_FAILURE 13
|
#define ERR_SYS_FAILURE 13
|
||||||
#define ERR_BAD_BASEBACKUP 14
|
#define ERR_BAD_BASEBACKUP 14
|
||||||
#define ERR_INTERNAL 15
|
#define ERR_INTERNAL 15
|
||||||
|
#define ERR_MONITORING_FAIL 16
|
||||||
|
#define ERR_BAD_BACKUP_LABEL 17
|
||||||
|
|
||||||
#endif /* _ERRCODE_H_ */
|
#endif /* _ERRCODE_H_ */
|
||||||
|
|||||||
133
log.c
133
log.c
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* log.c - Logging methods
|
* log.c - Logging methods
|
||||||
* Copyright (C) 2ndQuadrant, 2010-2015
|
* Copyright (C) 2ndQuadrant, 2010-2016
|
||||||
*
|
*
|
||||||
* This module is a set of methods for logging (currently only syslog)
|
* This module is a set of methods for logging (currently only syslog)
|
||||||
*
|
*
|
||||||
@@ -39,13 +39,38 @@
|
|||||||
|
|
||||||
/* #define REPMGR_DEBUG */
|
/* #define REPMGR_DEBUG */
|
||||||
|
|
||||||
void
|
static int detect_log_facility(const char *facility);
|
||||||
|
static void _stderr_log_with_level(const char *level_name, int level, const char *fmt, va_list ap)
|
||||||
|
__attribute__((format(PG_PRINTF_ATTRIBUTE, 3, 0)));
|
||||||
|
|
||||||
|
int log_type = REPMGR_STDERR;
|
||||||
|
int log_level = LOG_NOTICE;
|
||||||
|
int last_log_level = LOG_NOTICE;
|
||||||
|
int verbose_logging = false;
|
||||||
|
int terse_logging = false;
|
||||||
|
|
||||||
|
extern void
|
||||||
stderr_log_with_level(const char *level_name, int level, const char *fmt, ...)
|
stderr_log_with_level(const char *level_name, int level, const char *fmt, ...)
|
||||||
|
{
|
||||||
|
va_list arglist;
|
||||||
|
|
||||||
|
va_start(arglist, fmt);
|
||||||
|
_stderr_log_with_level(level_name, level, fmt, arglist);
|
||||||
|
va_end(arglist);
|
||||||
|
}
|
||||||
|
|
||||||
|
static void
|
||||||
|
_stderr_log_with_level(const char *level_name, int level, const char *fmt, va_list ap)
|
||||||
{
|
{
|
||||||
time_t t;
|
time_t t;
|
||||||
struct tm *tm;
|
struct tm *tm;
|
||||||
char buff[100];
|
char buff[100];
|
||||||
va_list ap;
|
|
||||||
|
/*
|
||||||
|
* Store the requested level so that if there's a subsequent
|
||||||
|
* log_hint(), we can suppress that if appropriate.
|
||||||
|
*/
|
||||||
|
last_log_level = level;
|
||||||
|
|
||||||
if (log_level >= level)
|
if (log_level >= level)
|
||||||
{
|
{
|
||||||
@@ -54,24 +79,74 @@ stderr_log_with_level(const char *level_name, int level, const char *fmt, ...)
|
|||||||
strftime(buff, 100, "[%Y-%m-%d %H:%M:%S]", tm);
|
strftime(buff, 100, "[%Y-%m-%d %H:%M:%S]", tm);
|
||||||
fprintf(stderr, "%s [%s] ", buff, level_name);
|
fprintf(stderr, "%s [%s] ", buff, level_name);
|
||||||
|
|
||||||
va_start(ap, fmt);
|
|
||||||
vfprintf(stderr, fmt, ap);
|
vfprintf(stderr, fmt, ap);
|
||||||
va_end(ap);
|
|
||||||
|
|
||||||
fflush(stderr);
|
fflush(stderr);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
void
|
||||||
|
log_hint(const char *fmt, ...)
|
||||||
|
{
|
||||||
|
va_list ap;
|
||||||
|
|
||||||
static int detect_log_level(const char *level);
|
if (terse_logging == false)
|
||||||
static int detect_log_facility(const char *facility);
|
{
|
||||||
|
va_start(ap, fmt);
|
||||||
|
_stderr_log_with_level("HINT", last_log_level, fmt, ap);
|
||||||
|
va_end(ap);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
void
|
||||||
|
log_verbose(int level, const char *fmt, ...)
|
||||||
|
{
|
||||||
|
va_list ap;
|
||||||
|
|
||||||
|
va_start(ap, fmt);
|
||||||
|
|
||||||
|
if (verbose_logging == true)
|
||||||
|
{
|
||||||
|
switch(level)
|
||||||
|
{
|
||||||
|
case LOG_EMERG:
|
||||||
|
_stderr_log_with_level("EMERG", level, fmt, ap);
|
||||||
|
break;
|
||||||
|
case LOG_ALERT:
|
||||||
|
_stderr_log_with_level("ALERT", level, fmt, ap);
|
||||||
|
break;
|
||||||
|
case LOG_CRIT:
|
||||||
|
_stderr_log_with_level("CRIT", level, fmt, ap);
|
||||||
|
break;
|
||||||
|
case LOG_ERR:
|
||||||
|
_stderr_log_with_level("ERR", level, fmt, ap);
|
||||||
|
break;
|
||||||
|
case LOG_WARNING:
|
||||||
|
_stderr_log_with_level("WARNING", level, fmt, ap);
|
||||||
|
break;
|
||||||
|
case LOG_NOTICE:
|
||||||
|
_stderr_log_with_level("NOTICE", level, fmt, ap);
|
||||||
|
break;
|
||||||
|
case LOG_INFO:
|
||||||
|
_stderr_log_with_level("INFO", level, fmt, ap);
|
||||||
|
break;
|
||||||
|
case LOG_DEBUG:
|
||||||
|
_stderr_log_with_level("DEBUG", level, fmt, ap);
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
va_end(ap);
|
||||||
|
}
|
||||||
|
|
||||||
int log_type = REPMGR_STDERR;
|
|
||||||
int log_level = LOG_NOTICE;
|
|
||||||
|
|
||||||
bool
|
bool
|
||||||
logger_init(t_configuration_options * opts, const char *ident, const char *level, const char *facility)
|
logger_init(t_configuration_options * opts, const char *ident)
|
||||||
{
|
{
|
||||||
|
char *level = opts->loglevel;
|
||||||
|
char *facility = opts->logfacility;
|
||||||
|
|
||||||
int l;
|
int l;
|
||||||
int f;
|
int f;
|
||||||
|
|
||||||
@@ -95,10 +170,10 @@ logger_init(t_configuration_options * opts, const char *ident, const char *level
|
|||||||
printf("Assigned level for logger: %d\n", l);
|
printf("Assigned level for logger: %d\n", l);
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
if (l > 0)
|
if (l >= 0)
|
||||||
log_level = l;
|
log_level = l;
|
||||||
else
|
else
|
||||||
stderr_log_warning(_("Cannot detect log level %s (use any of DEBUG, INFO, NOTICE, WARNING, ERR, ALERT, CRIT or EMERG)\n"), level);
|
stderr_log_warning(_("Invalid log level \"%s\" (available values: DEBUG, INFO, NOTICE, WARNING, ERR, ALERT, CRIT or EMERG)\n"), level);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (facility && *facility)
|
if (facility && *facility)
|
||||||
@@ -174,9 +249,9 @@ logger_init(t_configuration_options * opts, const char *ident, const char *level
|
|||||||
}
|
}
|
||||||
|
|
||||||
return true;
|
return true;
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
bool
|
bool
|
||||||
logger_shutdown(void)
|
logger_shutdown(void)
|
||||||
{
|
{
|
||||||
@@ -189,17 +264,32 @@ logger_shutdown(void)
|
|||||||
}
|
}
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* Set a minimum logging level. Intended for command line verbosity
|
* Indicate whether extra-verbose logging is required. This will
|
||||||
* options, which might increase requested logging over what's specified
|
* generate a lot of output, particularly debug logging, and should
|
||||||
* in the regular configuration file.
|
* not be permanently enabled in production.
|
||||||
|
*
|
||||||
|
* NOTE: in previous repmgr versions, this option forced the log
|
||||||
|
* level to INFO.
|
||||||
*/
|
*/
|
||||||
void
|
void
|
||||||
logger_min_verbose(int minimum)
|
logger_set_verbose(void)
|
||||||
{
|
{
|
||||||
if (log_level < minimum)
|
verbose_logging = true;
|
||||||
log_level = minimum;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Indicate whether some non-critical log messages can be omitted.
|
||||||
|
* Currently this includes warnings about irrelevant command line
|
||||||
|
* options and hints.
|
||||||
|
*/
|
||||||
|
|
||||||
|
void logger_set_terse(void)
|
||||||
|
{
|
||||||
|
terse_logging = true;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
int
|
int
|
||||||
detect_log_level(const char *level)
|
detect_log_level(const char *level)
|
||||||
{
|
{
|
||||||
@@ -220,17 +310,16 @@ detect_log_level(const char *level)
|
|||||||
if (!strcmp(level, "EMERG"))
|
if (!strcmp(level, "EMERG"))
|
||||||
return LOG_EMERG;
|
return LOG_EMERG;
|
||||||
|
|
||||||
return 0;
|
return -1;
|
||||||
}
|
}
|
||||||
|
|
||||||
int
|
static int
|
||||||
detect_log_facility(const char *facility)
|
detect_log_facility(const char *facility)
|
||||||
{
|
{
|
||||||
int local = 0;
|
int local = 0;
|
||||||
|
|
||||||
if (!strncmp(facility, "LOCAL", 5) && strlen(facility) == 6)
|
if (!strncmp(facility, "LOCAL", 5) && strlen(facility) == 6)
|
||||||
{
|
{
|
||||||
|
|
||||||
local = atoi(&facility[5]);
|
local = atoi(&facility[5]);
|
||||||
|
|
||||||
switch (local)
|
switch (local)
|
||||||
|
|||||||
18
log.h
18
log.h
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* log.h
|
* log.h
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2015
|
* Copyright (c) 2ndQuadrant, 2010-2016
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -25,7 +25,7 @@
|
|||||||
#define REPMGR_SYSLOG 1
|
#define REPMGR_SYSLOG 1
|
||||||
#define REPMGR_STDERR 2
|
#define REPMGR_STDERR 2
|
||||||
|
|
||||||
void
|
extern void
|
||||||
stderr_log_with_level(const char *level_name, int level, const char *fmt,...)
|
stderr_log_with_level(const char *level_name, int level, const char *fmt,...)
|
||||||
__attribute__((format(PG_PRINTF_ATTRIBUTE, 3, 4)));
|
__attribute__((format(PG_PRINTF_ATTRIBUTE, 3, 4)));
|
||||||
|
|
||||||
@@ -112,13 +112,21 @@ __attribute__((format(PG_PRINTF_ATTRIBUTE, 3, 4)));
|
|||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
|
||||||
|
int detect_log_level(const char *level);
|
||||||
|
|
||||||
/* Logger initialisation and shutdown */
|
/* Logger initialisation and shutdown */
|
||||||
|
|
||||||
|
bool logger_init(t_configuration_options * opts, const char *ident);
|
||||||
|
|
||||||
bool logger_shutdown(void);
|
bool logger_shutdown(void);
|
||||||
|
|
||||||
bool logger_init(t_configuration_options * opts, const char *ident,
|
void logger_set_verbose(void);
|
||||||
const char *level, const char *facility);
|
void logger_set_terse(void);
|
||||||
|
|
||||||
void logger_min_verbose(int minimum);
|
void log_hint(const char *fmt, ...)
|
||||||
|
__attribute__((format(PG_PRINTF_ATTRIBUTE, 1, 2)));
|
||||||
|
void log_verbose(int level, const char *fmt, ...)
|
||||||
|
__attribute__((format(PG_PRINTF_ATTRIBUTE, 2, 3)));
|
||||||
|
|
||||||
extern int log_type;
|
extern int log_type;
|
||||||
extern int log_level;
|
extern int log_level;
|
||||||
|
|||||||
@@ -2,6 +2,10 @@
|
|||||||
# Replication Manager sample configuration file
|
# Replication Manager sample configuration file
|
||||||
###################################################
|
###################################################
|
||||||
|
|
||||||
|
# Some configuration items will be set with a default value; this
|
||||||
|
# is noted for each item. Where no default value is shown, the
|
||||||
|
# parameter will be treated as empty or false.
|
||||||
|
|
||||||
# Required configuration items
|
# Required configuration items
|
||||||
# ============================
|
# ============================
|
||||||
#
|
#
|
||||||
@@ -11,17 +15,21 @@
|
|||||||
# schema (pattern: "repmgr_{cluster}"); while this name will be quoted
|
# schema (pattern: "repmgr_{cluster}"); while this name will be quoted
|
||||||
# to preserve case, we recommend using lower case and avoiding whitespace
|
# to preserve case, we recommend using lower case and avoiding whitespace
|
||||||
# to facilitate easier querying of the repmgr views and tables.
|
# to facilitate easier querying of the repmgr views and tables.
|
||||||
cluster=example_cluster
|
#cluster=example_cluster
|
||||||
|
|
||||||
# Node ID and name
|
# Node ID and name
|
||||||
# (Note: we recommend to avoid naming nodes after their initial
|
# (Note: we recommend to avoid naming nodes after their initial
|
||||||
# replication funcion, as this will cause confusion when e.g.
|
# replication funcion, as this will cause confusion when e.g.
|
||||||
# "standby2" is promoted to master)
|
# "standby2" is promoted to primary)
|
||||||
node=2
|
#node=2 # a unique integer
|
||||||
node_name=node2
|
#node_name=node2 # an arbitrary (but unique) string; we recommend using
|
||||||
|
# the server's hostname or another identifier unambiguously
|
||||||
|
# associated with the server to avoid confusion
|
||||||
|
|
||||||
# Database connection information
|
# Database connection information as a conninfo string
|
||||||
conninfo='host=192.168.204.104 dbname=repmgr_db user=repmgr_usr'
|
# This must be accessible to all servers in the cluster; for details see:
|
||||||
|
# http://www.postgresql.org/docs/current/static/libpq-connect.html#LIBPQ-CONNSTRING
|
||||||
|
#conninfo='host=192.168.204.104 dbname=repmgr_db user=repmgr_usr'
|
||||||
|
|
||||||
# Optional configuration items
|
# Optional configuration items
|
||||||
# ============================
|
# ============================
|
||||||
@@ -29,33 +37,34 @@ conninfo='host=192.168.204.104 dbname=repmgr_db user=repmgr_usr'
|
|||||||
# Replication settings
|
# Replication settings
|
||||||
# ---------------------
|
# ---------------------
|
||||||
|
|
||||||
# when using cascading replication and a standby is to be connected to an
|
# When using cascading replication, a standby can connect to another
|
||||||
# upstream standby, specify that node's ID with 'upstream_node'. The node
|
# upstream standby node which is specified by setting 'upstream_node'.
|
||||||
# must exist before the new standby can be registered. If a standby is
|
# In that case, the upstream node must exist before the new standby
|
||||||
# to connect directly to a master node, this parameter is not required.
|
# can be registered. If 'upstream_node' is not set, then the standby
|
||||||
#
|
# will connect directly to the primary node.
|
||||||
# upstream_node=1
|
#upstream_node=1
|
||||||
|
|
||||||
# physical replication slots - PostgreSQL 9.4 and later only
|
# use physical replication slots - PostgreSQL 9.4 and later only
|
||||||
# (default: 0)
|
# (default: 0)
|
||||||
#
|
#use_replication_slots=0
|
||||||
# use_replication_slots=0
|
|
||||||
|
|
||||||
|
# NOTE: 'max_replication_slots' should be configured for at least the
|
||||||
|
# number of standbys which will connect to the primary.
|
||||||
|
|
||||||
# Logging and monitoring settings
|
# Logging and monitoring settings
|
||||||
# -------------------------------
|
# -------------------------------
|
||||||
|
|
||||||
# Log level: possible values are DEBUG, INFO, NOTICE, WARNING, ERR, ALERT, CRIT or EMERG
|
# Log level: possible values are DEBUG, INFO, NOTICE, WARNING, ERR, ALERT, CRIT or EMERG
|
||||||
# (default: NOTICE)
|
# (default: NOTICE)
|
||||||
loglevel=NOTICE
|
#loglevel=NOTICE
|
||||||
|
|
||||||
# Logging facility: possible values are STDERR or - for Syslog integration - one of LOCAL0, LOCAL1, ..., LOCAL7, USER
|
# Logging facility: possible values are STDERR or - for Syslog integration - one of LOCAL0, LOCAL1, ..., LOCAL7, USER
|
||||||
# (default: STDERR)
|
# (default: STDERR)
|
||||||
logfacility=STDERR
|
#logfacility=STDERR
|
||||||
|
|
||||||
# stderr can be redirected to an arbitrary file:
|
# stderr can be redirected to an arbitrary file:
|
||||||
#
|
#
|
||||||
# logfile='/var/log/repmgr.log'
|
#logfile='/var/log/repmgr/repmgr.log'
|
||||||
|
|
||||||
# event notifications can be passed to an arbitrary external program
|
# event notifications can be passed to an arbitrary external program
|
||||||
# together with the following parameters:
|
# together with the following parameters:
|
||||||
@@ -69,12 +78,12 @@ logfacility=STDERR
|
|||||||
# the values provided for "%t" and "%d" will probably contain spaces,
|
# the values provided for "%t" and "%d" will probably contain spaces,
|
||||||
# so should be quoted in the provided command configuration, e.g.:
|
# so should be quoted in the provided command configuration, e.g.:
|
||||||
#
|
#
|
||||||
# event_notification_command='/path/to/some/script %n %e %s "%t" "%d"'
|
#event_notification_command='/path/to/some/script %n %e %s "%t" "%d"'
|
||||||
|
|
||||||
# By default, all notifications will be passed; the notification types
|
# By default, all notifications will be passed; the notification types
|
||||||
# can be filtered to explicitly named ones:
|
# can be filtered to explicitly named ones:
|
||||||
#
|
#
|
||||||
# event_notifications=master_register,standby_register,witness_create
|
#event_notifications=master_register,standby_register,witness_create
|
||||||
|
|
||||||
|
|
||||||
# Environment/command settings
|
# Environment/command settings
|
||||||
@@ -82,17 +91,17 @@ logfacility=STDERR
|
|||||||
|
|
||||||
# path to PostgreSQL binary directory (location of pg_ctl, pg_basebackup etc.)
|
# path to PostgreSQL binary directory (location of pg_ctl, pg_basebackup etc.)
|
||||||
# (if not provided, defaults to system $PATH)
|
# (if not provided, defaults to system $PATH)
|
||||||
# pg_bindir=/usr/bin/
|
#pg_bindir=/usr/bin/
|
||||||
|
|
||||||
# external command options
|
# external command options
|
||||||
|
|
||||||
# rsync_options=--archive --checksum --compress --progress --rsh="ssh -o \"StrictHostKeyChecking no\""
|
#rsync_options=--archive --checksum --compress --progress --rsh="ssh -o \"StrictHostKeyChecking no\""
|
||||||
# ssh_options=-o "StrictHostKeyChecking no"
|
#ssh_options=-o "StrictHostKeyChecking no"
|
||||||
|
|
||||||
# external command arguments
|
# external command arguments. Values shown are examples.
|
||||||
|
|
||||||
# pg_ctl_options='-s'
|
#pg_ctl_options='-s'
|
||||||
# pg_basebackup_options='--xlog-method=s'
|
#pg_basebackup_options='--xlog-method=s'
|
||||||
|
|
||||||
|
|
||||||
# Standby clone settings
|
# Standby clone settings
|
||||||
@@ -108,30 +117,36 @@ logfacility=STDERR
|
|||||||
# Failover settings (repmgrd)
|
# Failover settings (repmgrd)
|
||||||
# ---------------------------
|
# ---------------------------
|
||||||
#
|
#
|
||||||
# These settings are only applied when repmgrd is running.
|
# These settings are only applied when repmgrd is running. Values shown
|
||||||
|
# are defaults.
|
||||||
|
|
||||||
# How many seconds we wait for master response before declaring master failure
|
# Number of seconds to wait for a response from the primary server before
|
||||||
master_response_timeout=60
|
# deciding it has failed.
|
||||||
|
|
||||||
# How many times we try to reconnect to master before starting failover procedure
|
#master_response_timeout=60
|
||||||
reconnect_attempts=6
|
|
||||||
reconnect_interval=10
|
# Number of attempts, and the interval between them (in seconds), to try and
|
||||||
|
# connect to a server to establish its status (e.g. master
|
||||||
|
# during failover)
|
||||||
|
#reconnect_attempts=6
|
||||||
|
#reconnect_interval=10
|
||||||
|
|
||||||
# Autofailover options
|
# Autofailover options
|
||||||
failover=automatic # one of 'automatic', 'manual'
|
#failover=manual # one of 'automatic', 'manual'
|
||||||
priority=100 # a value of zero or less prevents the node being promoted to master
|
# (default: manual)
|
||||||
promote_command='repmgr standby promote -f /path/to/repmgr.conf'
|
#priority=100 # a value of zero or less prevents the node being promoted to primary
|
||||||
follow_command='repmgr standby follow -f /path/to/repmgr.conf -W'
|
# (default: 100)
|
||||||
|
#promote_command='repmgr standby promote -f /path/to/repmgr.conf'
|
||||||
|
#follow_command='repmgr standby follow -f /path/to/repmgr.conf -W'
|
||||||
|
|
||||||
# monitoring interval; default is 2s
|
# monitoring interval in seconds; default is 2
|
||||||
#
|
#monitor_interval_secs=2
|
||||||
# monitor_interval_secs=2
|
|
||||||
|
|
||||||
# change wait time for master; before we bail out and exit when the master
|
# change wait time for primary; before we bail out and exit when the primary
|
||||||
# disappears, we wait 'reconnect_attempts' * 'retry_promote_interval_secs'
|
# disappears, we wait 'reconnect_attempts' * 'retry_promote_interval_secs'
|
||||||
# seconds; by default this would be half an hour, as 'retry_promote_interval_secs'
|
# seconds; by default this would be half an hour, as 'retry_promote_interval_secs'
|
||||||
# default value is 300
|
# default value is 300
|
||||||
#
|
#retry_promote_interval_secs=300
|
||||||
# retry_promote_interval_secs=300
|
|
||||||
|
|
||||||
|
|
||||||
|
# Number of seconds after which the witness server resyncs the repl_nodes table
|
||||||
|
#witness_repl_nodes_sync_interval_secs=15
|
||||||
|
|||||||
66
repmgr.h
66
repmgr.h
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* repmgr.h
|
* repmgr.h
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2015
|
* Copyright (c) 2ndQuadrant, 2010-2016
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -32,15 +32,10 @@
|
|||||||
#define MIN_SUPPORTED_VERSION "9.3"
|
#define MIN_SUPPORTED_VERSION "9.3"
|
||||||
#define MIN_SUPPORTED_VERSION_NUM 90300
|
#define MIN_SUPPORTED_VERSION_NUM 90300
|
||||||
|
|
||||||
#include "config.h"
|
|
||||||
#define MAXFILENAME 1024
|
|
||||||
#define ERRBUFF_SIZE 512
|
#define ERRBUFF_SIZE 512
|
||||||
|
|
||||||
#define DEFAULT_CONFIG_FILE "./repmgr.conf"
|
|
||||||
#define DEFAULT_WAL_KEEP_SEGMENTS "5000"
|
#define DEFAULT_WAL_KEEP_SEGMENTS "5000"
|
||||||
#define DEFAULT_DEST_DIR "."
|
#define DEFAULT_DEST_DIR "."
|
||||||
#define DEFAULT_MASTER_PORT "5432"
|
|
||||||
#define DEFAULT_DBNAME "postgres"
|
|
||||||
#define DEFAULT_REPMGR_SCHEMA_PREFIX "repmgr_"
|
#define DEFAULT_REPMGR_SCHEMA_PREFIX "repmgr_"
|
||||||
#define DEFAULT_PRIORITY 100
|
#define DEFAULT_PRIORITY 100
|
||||||
#define FAILOVER_NODES_MAX_CHECK 50
|
#define FAILOVER_NODES_MAX_CHECK 50
|
||||||
@@ -49,14 +44,7 @@
|
|||||||
#define AUTOMATIC_FAILOVER 1
|
#define AUTOMATIC_FAILOVER 1
|
||||||
#define NODE_NOT_FOUND -1
|
#define NODE_NOT_FOUND -1
|
||||||
#define NO_UPSTREAM_NODE -1
|
#define NO_UPSTREAM_NODE -1
|
||||||
|
#define UNKNOWN_NODE_ID -1
|
||||||
|
|
||||||
typedef enum {
|
|
||||||
UNKNOWN = 0,
|
|
||||||
MASTER,
|
|
||||||
STANDBY,
|
|
||||||
WITNESS
|
|
||||||
} t_server_type;
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
@@ -67,44 +55,60 @@ typedef struct
|
|||||||
char dbname[MAXLEN];
|
char dbname[MAXLEN];
|
||||||
char host[MAXLEN];
|
char host[MAXLEN];
|
||||||
char username[MAXLEN];
|
char username[MAXLEN];
|
||||||
char dest_dir[MAXFILENAME];
|
char dest_dir[MAXPGPATH];
|
||||||
char config_file[MAXFILENAME];
|
char config_file[MAXPGPATH];
|
||||||
char remote_user[MAXLEN];
|
char remote_user[MAXLEN];
|
||||||
char superuser[MAXLEN];
|
char superuser[MAXLEN];
|
||||||
char wal_keep_segments[MAXLEN];
|
char wal_keep_segments[MAXLEN];
|
||||||
bool verbose;
|
bool verbose;
|
||||||
|
bool terse;
|
||||||
bool force;
|
bool force;
|
||||||
bool wait_for_master;
|
bool wait_for_master;
|
||||||
bool ignore_rsync_warn;
|
bool ignore_rsync_warn;
|
||||||
bool initdb_no_pwprompt;
|
bool witness_pwprompt;
|
||||||
bool rsync_only;
|
bool rsync_only;
|
||||||
bool fast_checkpoint;
|
bool fast_checkpoint;
|
||||||
bool ignore_external_config_files;
|
bool ignore_external_config_files;
|
||||||
|
char pg_ctl_mode[MAXLEN];
|
||||||
char masterport[MAXLEN];
|
char masterport[MAXLEN];
|
||||||
char localport[MAXLEN];
|
/*
|
||||||
|
* configuration file parameters which can be overridden on the
|
||||||
|
* command line
|
||||||
|
*/
|
||||||
|
char loglevel[MAXLEN];
|
||||||
|
|
||||||
|
/* parameter used by STANDBY SWITCHOVER */
|
||||||
|
char remote_config_file[MAXLEN];
|
||||||
|
char pg_rewind[MAXPGPATH];
|
||||||
|
/* parameter used by STANDBY {ARCHIVE_CONFIG | RESTORE_CONFIG} */
|
||||||
|
char config_archive_dir[MAXLEN];
|
||||||
/* parameter used by CLUSTER CLEANUP */
|
/* parameter used by CLUSTER CLEANUP */
|
||||||
int keep_history;
|
int keep_history;
|
||||||
|
|
||||||
char pg_bindir[MAXLEN];
|
char pg_bindir[MAXLEN];
|
||||||
|
|
||||||
char recovery_min_apply_delay[MAXLEN];
|
char recovery_min_apply_delay[MAXLEN];
|
||||||
|
|
||||||
|
/* deprecated command line options */
|
||||||
|
char localport[MAXLEN];
|
||||||
|
bool initdb_no_pwprompt;
|
||||||
} t_runtime_options;
|
} t_runtime_options;
|
||||||
|
|
||||||
#define T_RUNTIME_OPTIONS_INITIALIZER { "", "", "", "", "", "", "", DEFAULT_WAL_KEEP_SEGMENTS, false, false, false, false, false, false, false, false, "", "", 0, "", "" }
|
#define T_RUNTIME_OPTIONS_INITIALIZER { "", "", "", "", "", "", "", DEFAULT_WAL_KEEP_SEGMENTS, false, false, false, false, false, false, false, false, false, "smart", "", "", "", "", "", 0, "", "", "", false }
|
||||||
|
|
||||||
|
struct BackupLabel
|
||||||
|
{
|
||||||
|
XLogRecPtr start_wal_location;
|
||||||
|
char start_wal_file[MAXLEN];
|
||||||
|
XLogRecPtr checkpoint_location;
|
||||||
|
char backup_from[MAXLEN];
|
||||||
|
char backup_method[MAXLEN];
|
||||||
|
char start_time[MAXLEN];
|
||||||
|
char label[MAXLEN];
|
||||||
|
XLogRecPtr min_failover_slot_lsn;
|
||||||
|
};
|
||||||
|
|
||||||
extern char repmgr_schema[MAXLEN];
|
extern char repmgr_schema[MAXLEN];
|
||||||
|
extern bool config_file_found;
|
||||||
typedef struct ErrorListCell
|
|
||||||
{
|
|
||||||
struct ErrorListCell *next;
|
|
||||||
char *error_message;
|
|
||||||
} ErrorListCell;
|
|
||||||
|
|
||||||
typedef struct ErrorList
|
|
||||||
{
|
|
||||||
ErrorListCell *head;
|
|
||||||
ErrorListCell *tail;
|
|
||||||
} ErrorList;
|
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|||||||
11
repmgr.sql
11
repmgr.sql
@@ -1,7 +1,7 @@
|
|||||||
/*
|
/*
|
||||||
* repmgr.sql
|
* repmgr.sql
|
||||||
*
|
*
|
||||||
* Copyright (C) 2ndQuadrant, 2010-2015
|
* Copyright (C) 2ndQuadrant, 2010-2016
|
||||||
*
|
*
|
||||||
*/
|
*/
|
||||||
|
|
||||||
@@ -59,3 +59,12 @@ WHERE (standby_node, last_monitor_time) IN (SELECT standby_node, MAX(last_monito
|
|||||||
ALTER VIEW repl_status OWNER TO repmgr;
|
ALTER VIEW repl_status OWNER TO repmgr;
|
||||||
|
|
||||||
CREATE INDEX idx_repl_status_sort ON repl_monitor(last_monitor_time, standby_node);
|
CREATE INDEX idx_repl_status_sort ON repl_monitor(last_monitor_time, standby_node);
|
||||||
|
|
||||||
|
/*
|
||||||
|
* This view shows the list of nodes with the information of which one is the upstream
|
||||||
|
* in each case (when applicable)
|
||||||
|
*/
|
||||||
|
CREATE VIEW repl_show_nodes AS
|
||||||
|
SELECT rn.id, rn.conninfo, rn.type, rn.name, rn.cluster,
|
||||||
|
rn.priority, rn.active, sq.name AS upstream_node_name
|
||||||
|
FROM repl_nodes as rn LEFT JOIN repl_nodes AS sq ON sq.id=rn.upstream_node_id;
|
||||||
|
|||||||
@@ -1,7 +1,7 @@
|
|||||||
#
|
#
|
||||||
# Makefile
|
# Makefile
|
||||||
#
|
#
|
||||||
# Copyright (c) 2ndQuadrant, 2010-2015
|
# Copyright (c) 2ndQuadrant, 2010-2016
|
||||||
#
|
#
|
||||||
|
|
||||||
MODULE_big = repmgr_funcs
|
MODULE_big = repmgr_funcs
|
||||||
|
|||||||
35
sql/repmgr3.0_repmgr3.1.sql
Normal file
35
sql/repmgr3.0_repmgr3.1.sql
Normal file
@@ -0,0 +1,35 @@
|
|||||||
|
/*
|
||||||
|
* Update a repmgr 3.0 installation to repmgr 3.1
|
||||||
|
* ----------------------------------------------
|
||||||
|
*
|
||||||
|
* The new repmgr package should be installed first. Then
|
||||||
|
* carry out these steps:
|
||||||
|
*
|
||||||
|
* 1. (If repmgrd is used) stop any running repmgrd instances
|
||||||
|
* 2. On the master node, execute the SQL statements listed below
|
||||||
|
* 3. (If repmgrd is used) restart repmgrd
|
||||||
|
*/
|
||||||
|
|
||||||
|
/*
|
||||||
|
* If your repmgr installation is not included in your repmgr
|
||||||
|
* user's search path, please set the search path to the name
|
||||||
|
* of the repmgr schema to ensure objects are installed in
|
||||||
|
* the correct location.
|
||||||
|
*
|
||||||
|
* The repmgr schema is "repmgr_" + the cluster name defined in
|
||||||
|
* 'repmgr.conf'.
|
||||||
|
*/
|
||||||
|
|
||||||
|
-- SET search_path TO 'name_of_repmgr_schema';
|
||||||
|
|
||||||
|
BEGIN;
|
||||||
|
|
||||||
|
-- New view "repl_show_nodes" which also displays the server's
|
||||||
|
-- upstream node
|
||||||
|
|
||||||
|
CREATE VIEW repl_show_nodes AS
|
||||||
|
SELECT rn.id, rn.conninfo, rn.type, rn.name, rn.cluster,
|
||||||
|
rn.priority, rn.active, sq.name AS upstream_node_name
|
||||||
|
FROM repl_nodes as rn LEFT JOIN repl_nodes AS sq ON sq.id=rn.upstream_node_id;
|
||||||
|
|
||||||
|
COMMIT;
|
||||||
31
sql/repmgr3.1.1_repmgr3.1.2.sql
Normal file
31
sql/repmgr3.1.1_repmgr3.1.2.sql
Normal file
@@ -0,0 +1,31 @@
|
|||||||
|
/*
|
||||||
|
* Update a repmgr 3.1.1 installation to repmgr 3.1.2
|
||||||
|
* --------------------------------------------------
|
||||||
|
*
|
||||||
|
* This update is only required if repmgrd is being used in conjunction
|
||||||
|
* with a witness server.
|
||||||
|
*
|
||||||
|
* The new repmgr package should be installed first. Then
|
||||||
|
* carry out these steps:
|
||||||
|
*
|
||||||
|
* 1. (If repmgrd is used) stop any running repmgrd instances
|
||||||
|
* 2. On the master node, execute the SQL statement listed below
|
||||||
|
* 3. (If repmgrd is used) restart repmgrd
|
||||||
|
*/
|
||||||
|
|
||||||
|
/*
|
||||||
|
* If your repmgr installation is not included in your repmgr
|
||||||
|
* user's search path, please set the search path to the name
|
||||||
|
* of the repmgr schema to ensure objects are installed in
|
||||||
|
* the correct location.
|
||||||
|
*
|
||||||
|
* The repmgr schema is "repmgr_" + the cluster name defined in
|
||||||
|
* 'repmgr.conf'.
|
||||||
|
*/
|
||||||
|
|
||||||
|
-- SET search_path TO 'name_of_repmgr_schema';
|
||||||
|
|
||||||
|
BEGIN;
|
||||||
|
|
||||||
|
ALTER TABLE repl_nodes ALTER CONSTRAINT repl_nodes_upstream_node_id_fkey DEFERRABLE;
|
||||||
|
COMMIT;
|
||||||
@@ -83,7 +83,12 @@ _PG_init(void)
|
|||||||
* resources in repmgr_shmem_startup().
|
* resources in repmgr_shmem_startup().
|
||||||
*/
|
*/
|
||||||
RequestAddinShmemSpace(repmgr_memsize());
|
RequestAddinShmemSpace(repmgr_memsize());
|
||||||
|
|
||||||
|
#if (PG_VERSION_NUM >= 90600)
|
||||||
|
RequestNamedLWLockTranche("repmgr", 1);
|
||||||
|
#else
|
||||||
RequestAddinLWLocks(1);
|
RequestAddinLWLocks(1);
|
||||||
|
#endif
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* Install hooks.
|
* Install hooks.
|
||||||
@@ -128,7 +133,11 @@ repmgr_shmem_startup(void)
|
|||||||
if (!found)
|
if (!found)
|
||||||
{
|
{
|
||||||
/* First time through ... */
|
/* First time through ... */
|
||||||
|
#if (PG_VERSION_NUM >= 90600)
|
||||||
|
shared_state->lock = &(GetNamedLWLockTranche("repmgr"))->lock;
|
||||||
|
#else
|
||||||
shared_state->lock = LWLockAssign();
|
shared_state->lock = LWLockAssign();
|
||||||
|
#endif
|
||||||
snprintf(shared_state->location,
|
snprintf(shared_state->location,
|
||||||
sizeof(shared_state->location), "%X/%X", 0, 0);
|
sizeof(shared_state->location), "%X/%X", 0, 0);
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* repmgr_function.sql
|
* repmgr_function.sql
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2015
|
* Copyright (c) 2ndQuadrant, 2010-2016
|
||||||
*
|
*
|
||||||
*/
|
*/
|
||||||
|
|
||||||
|
|||||||
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* uninstall_repmgr_funcs.sql
|
* uninstall_repmgr_funcs.sql
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2015
|
* Copyright (c) 2ndQuadrant, 2010-2016
|
||||||
*
|
*
|
||||||
*/
|
*/
|
||||||
|
|
||||||
|
|||||||
@@ -1,7 +1,7 @@
|
|||||||
/*
|
/*
|
||||||
* strutil.c
|
* strutil.c
|
||||||
*
|
*
|
||||||
* Copyright (C) 2ndQuadrant, 2010-2015
|
* Copyright (C) 2ndQuadrant, 2010-2016
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
|
|||||||
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* strutil.h
|
* strutil.h
|
||||||
* Copyright (C) 2ndQuadrant, 2010-2015
|
* Copyright (C) 2ndQuadrant, 2010-2016
|
||||||
*
|
*
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
@@ -24,12 +24,17 @@
|
|||||||
#include <stdlib.h>
|
#include <stdlib.h>
|
||||||
#include "errcode.h"
|
#include "errcode.h"
|
||||||
|
|
||||||
|
|
||||||
#define QUERY_STR_LEN 8192
|
#define QUERY_STR_LEN 8192
|
||||||
#define MAXLEN 1024
|
#define MAXLEN 1024
|
||||||
#define MAXLINELENGTH 4096
|
#define MAXLINELENGTH 4096
|
||||||
#define MAXVERSIONSTR 16
|
#define MAXVERSIONSTR 16
|
||||||
#define MAXCONNINFO 1024
|
#define MAXCONNINFO 1024
|
||||||
|
|
||||||
|
/* Why? http://stackoverflow.com/a/5459929/398670 */
|
||||||
|
#define STR(x) CppAsString(x)
|
||||||
|
|
||||||
|
#define MAXLEN_STR STR(MAXLEN)
|
||||||
|
|
||||||
extern int
|
extern int
|
||||||
xsnprintf(char *str, size_t size, const char *format,...)
|
xsnprintf(char *str, size_t size, const char *format,...)
|
||||||
|
|||||||
@@ -1,7 +1,7 @@
|
|||||||
/*
|
/*
|
||||||
* uninstall_repmgr.sql
|
* uninstall_repmgr.sql
|
||||||
*
|
*
|
||||||
* Copyright (C) 2ndQuadrant, 2010-2015
|
* Copyright (C) 2ndQuadrant, 2010-2016
|
||||||
*
|
*
|
||||||
*/
|
*/
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user