mirror of
https://github.com/EnterpriseDB/repmgr.git
synced 2026-03-23 07:06:30 +00:00
Compare commits
99 Commits
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
9c28d3626b | ||
|
|
0916d8f2ad | ||
|
|
1964f890be | ||
|
|
976a61005e | ||
|
|
0c82278fd4 | ||
|
|
0abfde3773 | ||
|
|
1746831486 | ||
|
|
8c8e368a69 | ||
|
|
0ef532dcff | ||
|
|
478407fd86 | ||
|
|
05bfdfab2c | ||
|
|
29740dc41b | ||
|
|
ad6ecef2ab | ||
|
|
5318d37462 | ||
|
|
7244dda20f | ||
|
|
e651284927 | ||
|
|
72a2ac284a | ||
|
|
cec01c6620 | ||
|
|
989f683bc6 | ||
|
|
fa30382f2c | ||
|
|
defc2653e0 | ||
|
|
67e8ca73b5 | ||
|
|
a1a1d64e1f | ||
|
|
76509038cc | ||
|
|
7f8e50c882 | ||
|
|
5deb6c8ce4 | ||
|
|
175ee8acfc | ||
|
|
d1491f51a3 | ||
|
|
bc9febdc48 | ||
|
|
b6cf22ac90 | ||
|
|
d89a73cbf4 | ||
|
|
1f09e92e3f | ||
|
|
1bdc72a07b | ||
|
|
a6f1c6e483 | ||
|
|
6e14f0bc5d | ||
|
|
a336d22bd9 | ||
|
|
e88a8a9708 | ||
|
|
8f3f4eb4a3 | ||
|
|
dc18e5b791 | ||
|
|
9da0914976 | ||
|
|
666e71a589 | ||
|
|
062af91d36 | ||
|
|
571ad698db | ||
|
|
742f7e167f | ||
|
|
1fb2801639 | ||
|
|
e3031f0204 | ||
|
|
79748f28f1 | ||
|
|
46740b64a9 | ||
|
|
6557099832 | ||
|
|
083e288ac3 | ||
|
|
f5e3d7c041 | ||
|
|
402e02f4b7 | ||
|
|
a21b16f960 | ||
|
|
be58af701b | ||
|
|
eb2cdf8a98 | ||
|
|
7cc0400c03 | ||
|
|
9788b2bd29 | ||
|
|
227f0190f7 | ||
|
|
d6dbc70916 | ||
|
|
d2f4eda224 | ||
|
|
2588853e83 | ||
|
|
b54f98ed8a | ||
|
|
26f73686e5 | ||
|
|
e274a2cbcb | ||
|
|
d502bbe614 | ||
|
|
2594411820 | ||
|
|
d22535de00 | ||
|
|
fce1f0cd4a | ||
|
|
bb842c3989 | ||
|
|
556ff3c311 | ||
|
|
251486546d | ||
|
|
53d3e71cd3 | ||
|
|
b986ce81b2 | ||
|
|
7ddb060bdc | ||
|
|
6b02faf37c | ||
|
|
0cde0068dd | ||
|
|
20d66df0ef | ||
|
|
3f7c30b84d | ||
|
|
a63baf7fcb | ||
|
|
e19c643389 | ||
|
|
f058833451 | ||
|
|
96c14adfdb | ||
|
|
50119056a5 | ||
|
|
a279c42df9 | ||
|
|
f70b6ea136 | ||
|
|
e4cb6d7130 | ||
|
|
502c056753 | ||
|
|
871ec47ff5 | ||
|
|
f435abb3ec | ||
|
|
a217b4d0a9 | ||
|
|
2dcb75f889 | ||
|
|
b509ce6382 | ||
|
|
1150bf272a | ||
|
|
09ac6cd145 | ||
|
|
2fae788bc4 | ||
|
|
eb90f864c9 | ||
|
|
ba89758366 | ||
|
|
84595fe711 | ||
|
|
9523894808 |
@@ -2,7 +2,7 @@ License and Contributions
|
||||
=========================
|
||||
|
||||
`repmgr` is licensed under the GPL v3. All of its code and documentation is
|
||||
Copyright 2010-2016, 2ndQuadrant Limited. See the files COPYRIGHT and LICENSE for
|
||||
Copyright 2010-2017, 2ndQuadrant Limited. See the files COPYRIGHT and LICENSE for
|
||||
details.
|
||||
|
||||
The development of repmgr has primarily been sponsored by 2ndQuadrant customers.
|
||||
|
||||
@@ -1,4 +1,4 @@
|
||||
Copyright (c) 2010-2016, 2ndQuadrant Limited
|
||||
Copyright (c) 2010-2017, 2ndQuadrant Limited
|
||||
All rights reserved.
|
||||
|
||||
This program is free software: you can redistribute it and/or modify
|
||||
|
||||
48
HISTORY
48
HISTORY
@@ -1,4 +1,40 @@
|
||||
3.2 2016-
|
||||
3.3.1 2017-03-
|
||||
repmgrd: prevent invalid apply lag value being written to the
|
||||
monitoring table (Ian)
|
||||
repmgrd: fix error in XLogRecPtr conversion when calculating
|
||||
monitoring statistics (Ian)
|
||||
repmgr: if replication slots in use, where possible delete slot on old
|
||||
upstream node after following new upstream (Ian)
|
||||
repmgr: improve logging of rsync actions (Ian)
|
||||
repmgr: improve `standby clone` when synchronous replication in use (Ian)
|
||||
repmgr: stricter checking of allowed node id values
|
||||
repmgr: enable `master register --force` when there is a foreign key
|
||||
dependency from a standby node (Ian)
|
||||
|
||||
3.3 2016-12-27
|
||||
repmgr: always log to STDERR even if log facility defined (Ian)
|
||||
repmgr: add --log-to-file to log repmgr output to the defined
|
||||
log facility (Ian)
|
||||
repmgr: improve handling of command line parameter errors (Ian)
|
||||
repmgr: add option --upstream-conninfo to explicitly set
|
||||
'primary_conninfo' in recovery.conf (Ian)
|
||||
repmgr: enable a standby to be registered which isn't running (Ian)
|
||||
repmgr: enable `standby register --force` to update a node record
|
||||
with cascaded downstream node records (Ian)
|
||||
repmgr: add option `--no-conninfo-password` (Abhijit, Ian)
|
||||
repmgr: add initial support for PostgreSQL 10.0 (Ian)
|
||||
repmgr: escape values in primary_conninfo if needed (Ian)
|
||||
|
||||
3.2.1 2016-10-24
|
||||
repmgr: require a valid repmgr cluster name unless -F/--force
|
||||
supplied (Ian)
|
||||
repmgr: check master server is registered with repmgr before
|
||||
cloning (Ian)
|
||||
repmgr: ensure data directory defaults to that of the source node (Ian)
|
||||
repmgr: various fixes to Barman cloning mode (Gianni, Ian)
|
||||
repmgr: fix `repmgr cluster crosscheck` output (Ian)
|
||||
|
||||
3.2 2016-10-05
|
||||
repmgr: add support for cloning from a Barman backup (Gianni)
|
||||
repmgr: add commands `standby matrix` and `standby crosscheck` (Gianni)
|
||||
repmgr: suppress connection error display in `repmgr cluster show`
|
||||
@@ -15,10 +51,16 @@
|
||||
the standby (Ian)
|
||||
repmgr: add option `--copy-external-config-files` for files outside
|
||||
of the data directory (Ian)
|
||||
repmgr: add configuration options to override the default pg_ctl
|
||||
commands (Jarkko Oranen)
|
||||
repmgr: only require `wal_keep_segments` to be set in certain corner
|
||||
cases (Ian)
|
||||
repmgr: better support cloning from a node other than the one to
|
||||
stream from (Ian)
|
||||
repmgrd: add configuration options to override the default pg_ctl
|
||||
commands (Jarkko Oranen, Ian)
|
||||
repmgrd: don't start if node is inactive and failover=automatic (Ian)
|
||||
packaging: improve "repmgr-auto" Debian package (Gianni)
|
||||
|
||||
|
||||
3.1.5 2016-08-15
|
||||
repmgrd: in a failover situation, prevent endless looping when
|
||||
attempting to establish the status of a node with
|
||||
|
||||
4
Makefile
4
Makefile
@@ -1,11 +1,11 @@
|
||||
#
|
||||
# Makefile
|
||||
# Copyright (c) 2ndQuadrant, 2010-2016
|
||||
# Copyright (c) 2ndQuadrant, 2010-2017
|
||||
|
||||
HEADERS = $(wildcard *.h)
|
||||
|
||||
repmgrd_OBJS = dbutils.o config.o repmgrd.o log.o strutil.o
|
||||
repmgr_OBJS = dbutils.o check_dir.o config.o repmgr.o log.o strutil.o dirmod.o
|
||||
repmgr_OBJS = dbutils.o check_dir.o config.o repmgr.o log.o strutil.o dirmod.o compat.o
|
||||
|
||||
DATA = repmgr.sql uninstall_repmgr.sql
|
||||
|
||||
|
||||
279
README.md
279
README.md
@@ -7,8 +7,8 @@ replication capabilities with utilities to set up standby servers, monitor
|
||||
replication, and perform administrative tasks such as failover or switchover
|
||||
operations.
|
||||
|
||||
The current `repmgr` version, 3.1.5, supports all PostgreSQL versions from
|
||||
9.3, including the upcoming 9.6.
|
||||
The current `repmgr` version (3.3) supports all PostgreSQL versions from
|
||||
9.3 to 9.6.
|
||||
|
||||
Overview
|
||||
--------
|
||||
@@ -121,7 +121,8 @@ views:
|
||||
status for each node
|
||||
|
||||
The `repmgr` metadata schema can be stored in an existing database or in its own
|
||||
dedicated database.
|
||||
dedicated database. Note that the `repmgr` metadata schema cannot reside on a database
|
||||
server which is not part of the replication cluster managed by `repmgr`.
|
||||
|
||||
A dedicated database superuser is required to own the meta-database as well as carry
|
||||
out administrative actions.
|
||||
@@ -229,15 +230,29 @@ The configuration file will be searched for in the following locations:
|
||||
|
||||
Note that if a file is explicitly specified with `-f/--config-file`, an error will
|
||||
be raised if it is not found or not readable and no attempt will be made to check
|
||||
default locations; this is to prevent `repmgr` reading the wrong file.
|
||||
default locations; this is to prevent `repmgr` unexpectedly reading the wrong file.
|
||||
|
||||
For a full list of annotated configuration items, see the file `repmgr.conf.sample`.
|
||||
|
||||
The following parameters in the configuration file can be overridden with
|
||||
command line options:
|
||||
|
||||
- `-L/--log-level`
|
||||
- `-b/--pg_bindir`
|
||||
- `log_level` with `-L/--log-level`
|
||||
- `pg_bindir` with `-b/--pg_bindir`
|
||||
|
||||
|
||||
### Logging
|
||||
|
||||
By default `repmgr` and `repmgrd` will log directly to `STDERR`. For `repmgrd`
|
||||
we recommend capturing output in a logfile or using your system's log facility;
|
||||
see `repmgr.conf.sample` for details.
|
||||
|
||||
As a command line utility, `repmgr` will log directly to the console by default
|
||||
(this is a change in behaviour from versions before 3.3, where it would always
|
||||
log to the same location as `repmgrd`). However in some circumstances, such as
|
||||
when `repmgr` is executed by `repmgrd` during a failover event, it makes sense to
|
||||
capture `repmgr`'s log output - this can be done by supplying the command-line
|
||||
option `--log-to-file` to `repmgr`.
|
||||
|
||||
|
||||
### Command line options and environment variables
|
||||
@@ -274,14 +289,14 @@ Setting up a simple replication cluster with repmgr
|
||||
The following section will describe how to set up a basic replication cluster
|
||||
with a master and a standby server using the `repmgr` command line tool.
|
||||
It is assumed PostgreSQL is installed on both servers in the cluster,
|
||||
`rsync` is available and password-less SSH connections are possible between
|
||||
`rsync` is available and passwordless SSH connections are possible between
|
||||
both servers.
|
||||
|
||||
* * *
|
||||
|
||||
> *TIP*: for testing `repmgr`, it's possible to use multiple PostgreSQL
|
||||
> instances running on different ports on the same computer, with
|
||||
> password-less SSH access to `localhost` enabled.
|
||||
> passwordless SSH access to `localhost` enabled.
|
||||
|
||||
* * *
|
||||
|
||||
@@ -318,10 +333,11 @@ The following replication settings may need to be adjusted:
|
||||
archive_command = '/bin/true'
|
||||
|
||||
# If cloning using rsync, or you have configured `pg_basebackup_options`
|
||||
# in `repmgr.conf` to include the setting `--xlog-method=fetch`, *and*
|
||||
# you have not set `restore_command` in `repmgr.conf`to fetch WAL files
|
||||
# from another source such as Barman, you'll need to set `wal_keep_segments`
|
||||
# to a high enough value to ensure that all WAL files generated while
|
||||
# in `repmgr.conf` to include the setting `--xlog-method=fetch` (from
|
||||
# PostgreSQL 10 `--wal-method=fetch`), *and* you have not set
|
||||
# `restore_command` in `repmgr.conf` to fetch WAL files from another
|
||||
# source such as Barman, you'll need to set `wal_keep_segments` to a
|
||||
# high enough value to ensure that all WAL files generated while
|
||||
# the standby is being cloned are retained until the standby starts up.
|
||||
|
||||
# wal_keep_segments = 5000
|
||||
@@ -375,7 +391,8 @@ least the following parameters:
|
||||
|
||||
- `cluster`: an arbitrary name for the replication cluster; this must be identical
|
||||
on all nodes
|
||||
- `node`: a unique integer identifying the node
|
||||
- `node`: a unique integer identifying the node; note this must be a positive
|
||||
32 bit signed integer between 1 and 2147483647
|
||||
- `node_name`: a unique string identifying the node; we recommend a name
|
||||
specific to the server (e.g. 'server_1'); avoid names indicating the
|
||||
current replication role like 'master' or 'standby' as the server's
|
||||
@@ -412,7 +429,7 @@ be registered with `repmgr`, which creates the `repmgr` database and adds
|
||||
a metadata record for the server:
|
||||
|
||||
$ repmgr -f repmgr.conf master register
|
||||
[2016-01-07 16:56:46] [NOTICE] master node correctly registered for cluster test with id 1 (conninfo: host=repmgr_node1 user=repmgr dbname=repmgr)
|
||||
NOTICE: master node correctly registered for cluster test with id 1 (conninfo: host=repmgr_node1 user=repmgr dbname=repmgr)
|
||||
|
||||
The metadata record looks like this:
|
||||
|
||||
@@ -439,13 +456,13 @@ the values `node`, `node_name` and `conninfo` adjusted accordingly, e.g.:
|
||||
Clone the standby with:
|
||||
|
||||
$ repmgr -h repmgr_node1 -U repmgr -d repmgr -D /path/to/node2/data/ -f /etc/repmgr.conf standby clone
|
||||
[2016-01-07 17:21:26] [NOTICE] destination directory '/path/to/node2/data/' provided
|
||||
[2016-01-07 17:21:26] [NOTICE] starting backup...
|
||||
[2016-01-07 17:21:26] [HINT] this may take some time; consider using the -c/--fast-checkpoint option
|
||||
NOTICE: destination directory '/path/to/node2/data/' provided
|
||||
NOTICE: starting backup...
|
||||
HINT: this may take some time; consider using the -c/--fast-checkpoint option
|
||||
NOTICE: pg_stop_backup complete, all required WAL segments have been archived
|
||||
[2016-01-07 17:21:28] [NOTICE] standby clone (using pg_basebackup) complete
|
||||
[2016-01-07 17:21:28] [NOTICE] you can now start your PostgreSQL server
|
||||
[2016-01-07 17:21:28] [HINT] for example : pg_ctl -D /path/to/node2/data/ start
|
||||
NOTICE: standby clone (using pg_basebackup) complete
|
||||
NOTICE: you can now start your PostgreSQL server
|
||||
HINT: for example : pg_ctl -D /path/to/node2/data/ start
|
||||
|
||||
This will clone the PostgreSQL data directory files from the master at `repmgr_node1`
|
||||
using PostgreSQL's `pg_basebackup` utility. A `recovery.conf` file containing the
|
||||
@@ -486,7 +503,8 @@ place. To ensure this happens when using the default `pg_basebackup` method,
|
||||
`repmgr` will set `pg_basebackup`'s `--xlog-method` parameter to `stream`,
|
||||
which will ensure all WAL files generated during the cloning process are
|
||||
streamed in parallel with the main backup. Note that this requires two
|
||||
replication connections to be available.
|
||||
replication connections to be available (`repmgr` will verify sufficient
|
||||
connections are available before attempting to clone).
|
||||
|
||||
To override this behaviour, in `repmgr.conf` set `pg_basebackup`'s
|
||||
`--xlog-method` parameter to `fetch`:
|
||||
@@ -498,6 +516,9 @@ See the `pg_basebackup` documentation for details:
|
||||
|
||||
https://www.postgresql.org/docs/current/static/app-pgbasebackup.html
|
||||
|
||||
> *NOTE*: From PostgreSQL 10, `pg_basebackup`'s `--xlog-method` parameter
|
||||
> has been renamed to `--wal-method`.
|
||||
|
||||
Make any adjustments to the standby's PostgreSQL configuration files now,
|
||||
then start the server.
|
||||
|
||||
@@ -540,8 +561,8 @@ Connect to the master server and execute:
|
||||
|
||||
Register the standby server with:
|
||||
|
||||
repmgr -f /etc/repmgr.conf standby register
|
||||
[2016-01-08 11:13:16] [NOTICE] standby node correctly registered for cluster test with id 2 (conninfo: host=repmgr_node2 user=repmgr dbname=repmgr)
|
||||
$ repmgr -f /etc/repmgr.conf standby register
|
||||
NOTICE: standby node correctly registered for cluster test with id 2 (conninfo: host=repmgr_node2 user=repmgr dbname=repmgr)
|
||||
|
||||
Connect to the standby server's `repmgr` database and check the `repl_nodes`
|
||||
table:
|
||||
@@ -572,6 +593,21 @@ to effectively manage cascading replication (see below).
|
||||
|
||||
* * *
|
||||
|
||||
Under some circumstances you may wish to register a standby which is not
|
||||
yet running; this can be the case when using provisioning tools to create
|
||||
a complex replication cluster. In this case, by using the `-F/--force`
|
||||
option and providing the connection parameters to the master server,
|
||||
the standby can be registered.
|
||||
|
||||
Similarly, with cascading replication it may be necessary to register
|
||||
a standby whose upstream node has not yet been registered - in this case,
|
||||
using `-F/--force` will result in the creation of an inactive placeholder
|
||||
record for the upstream node, which will however later need to be registered
|
||||
with the `-F/--force` option too.
|
||||
|
||||
When used with `standby register`, care should be taken that use of the
|
||||
`-F/--force` option does not result in an incorrectly configured cluster.
|
||||
|
||||
### Using Barman to clone a standby
|
||||
|
||||
`repmgr standby clone` also supports Barman, the Backup and
|
||||
@@ -580,13 +616,13 @@ base backups and WAL files.
|
||||
|
||||
Barman support provides the following advantages:
|
||||
|
||||
- the primary node does not need to perform a new backup every time a
|
||||
- the master node does not need to perform a new backup every time a
|
||||
new standby is cloned;
|
||||
- a standby node can be disconnected for longer periods without losing
|
||||
the ability to catch up, and without causing accumulation of WAL
|
||||
files on the primary node;
|
||||
files on the master node;
|
||||
- therefore, `repmgr` does not need to use replication slots, and the
|
||||
primary node does not need to set `wal_keep_segments`.
|
||||
master node does not need to set `wal_keep_segments`.
|
||||
|
||||
> *NOTE*: In view of the above, Barman support is incompatible with
|
||||
> the `use_replication_slots` setting in `repmgr.conf`.
|
||||
@@ -599,8 +635,8 @@ ensure that:
|
||||
- the `barman_server` setting in `repmgr.conf` is set to the SSH
|
||||
hostname of the Barman server;
|
||||
- the `restore_command` setting in `repmgr.conf` is configured to
|
||||
use a copy of the `barman-wal-restore.py` script shipped with Barman
|
||||
(see below);
|
||||
use a copy of the `barman-wal-restore` script shipped with the
|
||||
`barman-cli` package (see below);
|
||||
- the Barman catalogue includes at least one valid backup for this
|
||||
server.
|
||||
|
||||
@@ -616,39 +652,37 @@ ensure that:
|
||||
> corresponding to the value of `barman_server` in `repmgr.conf`. See
|
||||
> the "Host" section in `man 5 ssh_config` for more details.
|
||||
|
||||
`barman-wal-restore.py` is a Python script provided by the Barman
|
||||
development team, which must be copied in a location accessible to
|
||||
`repmgr`, and marked as executable; `restore_command` must then be
|
||||
set in `repmgr.conf` as follows:
|
||||
`barman-wal-restore` is a Python script provided by the Barman
|
||||
development team as part of the `barman-cli` package (Barman 2.0
|
||||
and later; for Barman 1.x the script is provided separately as
|
||||
`barman-wal-restore.py`).
|
||||
|
||||
`restore_command` must then be set in `repmgr.conf` as follows:
|
||||
|
||||
<script> <Barman hostname> <cluster_name> %f %p
|
||||
|
||||
For instance, suppose that we have installed Barman on the `barmansrv`
|
||||
host, and that we have placed a copy of `barman-wal-restore.py` into
|
||||
the `/usr/local/bin` directory. First, we ensure that the script is
|
||||
executable:
|
||||
|
||||
sudo chmod +x /usr/local/bin/barman-wal-restore.py
|
||||
|
||||
Then we check that `repmgr.conf` includes the following lines:
|
||||
host, and that `barman-wal-restore` is located as an executable at
|
||||
`/usr/bin/barman-wal-restore`; `repmgr.conf` should include the following
|
||||
lines:
|
||||
|
||||
barman_server=barmansrv
|
||||
restore_command=/usr/local/bin/barman-wal-restore.py barmansrv test %f %p
|
||||
restore_command=/usr/bin/barman-wal-restore barmansrv test %f %p
|
||||
|
||||
To use a non-default Barman configuration file on the Barman server,
|
||||
NOTE: to use a non-default Barman configuration file on the Barman server,
|
||||
specify this in `repmgr.conf` with `barman_config`:
|
||||
|
||||
barman_config=/path/to/barman.conf
|
||||
|
||||
Now we can clone a standby using the Barman server:
|
||||
|
||||
$ repmgr -h node1 -D 9.5/main -f /etc/repmgr.conf standby clone
|
||||
[2016-06-12 20:08:35] [NOTICE] destination directory '9.5/main' provided
|
||||
[2016-06-12 20:08:35] [NOTICE] getting backup from Barman...
|
||||
[2016-06-12 20:08:36] [NOTICE] standby clone (from Barman) complete
|
||||
[2016-06-12 20:08:36] [NOTICE] you can now start your PostgreSQL server
|
||||
[2016-06-12 20:08:36] [HINT] for example : pg_ctl -D 9.5/data start
|
||||
[2016-06-12 20:08:36] [HINT] After starting the server, you need to register this standby with "repmgr standby register"
|
||||
$ repmgr -h node1 -d repmgr -D 9.5/main -f /etc/repmgr.conf standby clone
|
||||
NOTICE: destination directory '9.5/main' provided
|
||||
NOTICE: getting backup from Barman...
|
||||
NOTICE: standby clone (from Barman) complete
|
||||
NOTICE: you can now start your PostgreSQL server
|
||||
HINT: for example : pg_ctl -D 9.5/data start
|
||||
HINT: After starting the server, you need to register this standby with "repmgr standby register"
|
||||
|
||||
|
||||
|
||||
@@ -688,24 +722,10 @@ and destination server as the contents of files existing on both servers need
|
||||
to be compared, meaning this method is not necessarily faster than making a
|
||||
fresh clone with `pg_basebackup`.
|
||||
|
||||
> *NOTE*: `barman-wal-restore.py` supports command line switches to
|
||||
> *NOTE*: `barman-wal-restore` supports command line switches to
|
||||
> control parallelism (`--parallel=N`) and compression (`--bzip2`,
|
||||
> `--gzip`).
|
||||
|
||||
### Dealing with PostgreSQL configuration files
|
||||
|
||||
By default, `repmgr` will attempt to copy the standard configuration files
|
||||
(`postgresql.conf`, `pg_hba.conf` and `pg_ident.conf`) even if they are located
|
||||
outside of the data directory (though currently they will be copied
|
||||
into the standby's data directory). To prevent this happening, when executing
|
||||
`repmgr standby clone` provide the `--ignore-external-config-files` option.
|
||||
|
||||
If using `rsync` to clone a standby, additional control over which files
|
||||
not to transfer is possible by configuring `rsync_options` in `repmgr.conf`,
|
||||
which enables any valid `rsync` options to be passed to that command, e.g.:
|
||||
|
||||
rsync_options='--exclude=postgresql.local.conf'
|
||||
|
||||
### Controlling `primary_conninfo` in `recovery.conf`
|
||||
|
||||
The `primary_conninfo` setting in `recovery.conf` generated by `repmgr`
|
||||
@@ -722,13 +742,22 @@ string passed to `repmgr` with `-d/--dbname` (see above for details), and/or set
|
||||
appropriate environment variables.
|
||||
|
||||
Note that PostgreSQL will always set explicit defaults for `sslmode` and
|
||||
`sslcompression`.
|
||||
`sslcompression` (and from PostgreSQL 10.0 also `target_session_attrs`).
|
||||
|
||||
If `application_name` is set in the standby's `conninfo` parameter in
|
||||
`repmgr.conf`, this value will be appended to `primary_conninfo`, otherwise
|
||||
`repmgr` will set `application_name` to the same value as the `node_name`
|
||||
parameter.
|
||||
|
||||
By default `repmgr` assumes the user who owns the `repmgr` metadatabase will
|
||||
also be the replication user; a different replication user can be specified
|
||||
with `--replication-user`.
|
||||
|
||||
If the upstream server requires a password, and this was provided via
|
||||
`PGPASSWORD`, `.pgpass` etc., by default `repmgr` will include this in
|
||||
`primary_conninfo`. Use the command line option `--no-conninfo-password` to
|
||||
suppress this.
|
||||
|
||||
|
||||
Setting up cascading replication with repmgr
|
||||
--------------------------------------------
|
||||
@@ -762,15 +791,15 @@ created standby. Clone this standby (using the connection parameters
|
||||
for the existing standby) and register it:
|
||||
|
||||
$ repmgr -h repmgr_node2 -U repmgr -d repmgr -D /path/to/node3/data/ -f /etc/repmgr.conf standby clone
|
||||
[2016-01-08 13:44:52] [NOTICE] destination directory 'node_3/data/' provided
|
||||
[2016-01-08 13:44:52] [NOTICE] starting backup (using pg_basebackup)...
|
||||
[2016-01-08 13:44:52] [HINT] this may take some time; consider using the -c/--fast-checkpoint option
|
||||
[2016-01-08 13:44:52] [NOTICE] standby clone (using pg_basebackup) complete
|
||||
[2016-01-08 13:44:52] [NOTICE] you can now start your PostgreSQL server
|
||||
[2016-01-08 13:44:52] [HINT] for example : pg_ctl -D /path/to/node_3/data start
|
||||
NOTICE: destination directory 'node_3/data/' provided
|
||||
NOTICE: starting backup (using pg_basebackup)...
|
||||
HINT: this may take some time; consider using the -c/--fast-checkpoint option
|
||||
NOTICE: standby clone (using pg_basebackup) complete
|
||||
NOTICE: you can now start your PostgreSQL server
|
||||
HINT: for example : pg_ctl -D /path/to/node_3/data start
|
||||
|
||||
$ repmgr -f /etc/repmgr.conf standby register
|
||||
[2016-01-08 14:04:32] [NOTICE] standby node correctly registered for cluster test with id 3 (conninfo: host=repmgr_node3 dbname=repmgr user=repmgr)
|
||||
NOTICE: standby node correctly registered for cluster test with id 3 (conninfo: host=repmgr_node3 dbname=repmgr user=repmgr)
|
||||
|
||||
After starting the standby, the `repl_nodes` table will look like this:
|
||||
|
||||
@@ -782,6 +811,15 @@ After starting the standby, the `repl_nodes` table will look like this:
|
||||
3 | standby | 2 | test | node3 | host=repmgr_node3 dbname=repmgr user=repmgr | | 100 | t
|
||||
(3 rows)
|
||||
|
||||
* * *
|
||||
|
||||
> *TIP*: under some circumstances when setting up a cascading replication
|
||||
> cluster, you may wish to clone a downstream standby whose upstream node
|
||||
> does not yet exist. In this case you can clone from the master (or
|
||||
> another upstream node) and provide the parameter `--upstream-conninfo`
|
||||
> to explicitly set the upstream's `primary_conninfo` string in `recovery.conf`.
|
||||
|
||||
* * *
|
||||
|
||||
Using replication slots with repmgr
|
||||
-----------------------------------
|
||||
@@ -867,19 +905,19 @@ Promote the first standby with:
|
||||
|
||||
This will produce output similar to the following:
|
||||
|
||||
[2016-01-08 16:07:31] [ERROR] connection to database failed: could not connect to server: Connection refused
|
||||
ERROR: connection to database failed: could not connect to server: Connection refused
|
||||
Is the server running on host "repmgr_node1" (192.161.2.1) and accepting
|
||||
TCP/IP connections on port 5432?
|
||||
could not connect to server: Connection refused
|
||||
Is the server running on host "repmgr_node1" (192.161.2.1) and accepting
|
||||
TCP/IP connections on port 5432?
|
||||
|
||||
[2016-01-08 16:07:31] [NOTICE] promoting standby
|
||||
[2016-01-08 16:07:31] [NOTICE] promoting server using '/usr/bin/postgres/pg_ctl -D /path/to/node_2/data promote'
|
||||
NOTICE: promoting standby
|
||||
NOTICE: promoting server using '/usr/bin/postgres/pg_ctl -D /path/to/node_2/data promote'
|
||||
server promoting
|
||||
[2016-01-08 16:07:33] [NOTICE] STANDBY PROMOTE successful
|
||||
NOTICE: STANDBY PROMOTE successful
|
||||
|
||||
Note: the first `[ERROR]` is `repmgr` attempting to connect to the current
|
||||
Note: the first `ERROR` is `repmgr` attempting to connect to the current
|
||||
master to verify that it has failed. If a valid master is found, `repmgr`
|
||||
will refuse to promote a standby.
|
||||
|
||||
@@ -911,7 +949,7 @@ end of the preceding section ("Promoting a standby server with repmgr"),
|
||||
execute this:
|
||||
|
||||
$ repmgr -f /etc/repmgr.conf -D /path/to/node_3/data/ -h repmgr_node2 -U repmgr -d repmgr standby follow
|
||||
[2016-01-08 16:57:06] [NOTICE] restarting server using '/usr/bin/postgres/pg_ctl -D /path/to/node_3/data/ -w -m fast restart'
|
||||
NOTICE: restarting server using '/usr/bin/postgres/pg_ctl -D /path/to/node_3/data/ -w -m fast restart'
|
||||
waiting for server to shut down.... done
|
||||
server stopped
|
||||
waiting for server to start.... done
|
||||
@@ -983,26 +1021,26 @@ local server, as well as the normal default locations. `repmgr` will check
|
||||
this file can be found before performing any further actions.
|
||||
|
||||
$ repmgr -f /etc/repmgr.conf -C /etc/repmgr.conf standby switchover -v
|
||||
[2016-01-27 16:38:33] [NOTICE] using configuration file "/etc/repmgr.conf"
|
||||
[2016-01-27 16:38:33] [NOTICE] switching current node 2 to master server and demoting current master to standby...
|
||||
[2016-01-27 16:38:34] [NOTICE] 5 files copied to /tmp/repmgr-node1-archive
|
||||
[2016-01-27 16:38:34] [NOTICE] connection to database failed: FATAL: the database system is shutting down
|
||||
NOTICE: using configuration file "/etc/repmgr.conf"
|
||||
NOTICE: switching current node 2 to master server and demoting current master to standby...
|
||||
NOTICE: 5 files copied to /tmp/repmgr-node1-archive
|
||||
NOTICE: connection to database failed: FATAL: the database system is shutting down
|
||||
|
||||
[2016-01-27 16:38:34] [NOTICE] current master has been stopped
|
||||
[2016-01-27 16:38:34] [ERROR] connection to database failed: FATAL: the database system is shutting down
|
||||
NOTICE: current master has been stopped
|
||||
ERROR: connection to database failed: FATAL: the database system is shutting down
|
||||
|
||||
[2016-01-27 16:38:34] [NOTICE] promoting standby
|
||||
[2016-01-27 16:38:34] [NOTICE] promoting server using '/usr/local/bin/pg_ctl -D /var/lib/postgresql/9.5/node_2/data promote'
|
||||
NOTICE: promoting standby
|
||||
NOTICE: promoting server using '/usr/local/bin/pg_ctl -D /var/lib/postgresql/9.5/node_2/data promote'
|
||||
server promoting
|
||||
[2016-01-27 16:38:36] [NOTICE] STANDBY PROMOTE successful
|
||||
[2016-01-27 16:38:36] [NOTICE] Executing pg_rewind on old master server
|
||||
[2016-01-27 16:38:36] [NOTICE] 5 files copied to /var/lib/postgresql/9.5/data
|
||||
[2016-01-27 16:38:36] [NOTICE] restarting server using '/usr/local/bin/pg_ctl -w -D /var/lib/postgresql/9.5/node_1/data -m fast restart'
|
||||
NOTICE: STANDBY PROMOTE successful
|
||||
NOTICE: Executing pg_rewind on old master server
|
||||
NOTICE: 5 files copied to /var/lib/postgresql/9.5/data
|
||||
NOTICE: restarting server using '/usr/local/bin/pg_ctl -w -D /var/lib/postgresql/9.5/node_1/data -m fast restart'
|
||||
pg_ctl: PID file "/var/lib/postgresql/9.5/node_1/data/postmaster.pid" does not exist
|
||||
Is server running?
|
||||
starting server anyway
|
||||
[2016-01-27 16:38:37] [NOTICE] node 1 is replicating in state "streaming"
|
||||
[2016-01-27 16:38:37] [NOTICE] switchover was successful
|
||||
NOTICE: node 1 is replicating in state "streaming"
|
||||
NOTICE: switchover was successful
|
||||
|
||||
Messages containing the line `connection to database failed: FATAL: the database
|
||||
system is shutting down` are not errors - `repmgr` is polling the old master database
|
||||
@@ -1028,7 +1066,7 @@ should have been updated to reflect this:
|
||||
at a two-server master/standby replication cluster and currently does
|
||||
not support additional standbys.
|
||||
- `repmgr standby switchover` is designed to use the `pg_rewind` utility,
|
||||
standard in 9.5 and later and available for separately in 9.3 and 9.4
|
||||
standard in 9.5 and later and available separately in 9.3 and 9.4
|
||||
(see note below)
|
||||
- `pg_rewind` *requires* that either `wal_log_hints` is enabled, or that
|
||||
data checksums were enabled when the cluster was initialized. See the
|
||||
@@ -1088,8 +1126,9 @@ This will remove the standby record from `repmgr`'s internal metadata
|
||||
table (`repl_nodes`). A `standby_unregister` event notification will be
|
||||
recorded in the `repl_events` table.
|
||||
|
||||
Note that this command will not stop the server itself or remove
|
||||
it from the replication cluster.
|
||||
Note that this command will not stop the server itself or remove it from
|
||||
the replication cluster. Also, if the standby was using a replication
|
||||
slot, this will not be removed.
|
||||
|
||||
If the standby is not running, the command can be executed on another
|
||||
node by providing the id of the node to be unregistered using
|
||||
@@ -1107,19 +1146,23 @@ Automatic failover with `repmgrd`
|
||||
and which can automate actions such as failover and updating standbys to
|
||||
follow the new master.
|
||||
|
||||
To use `repmgrd` for automatic failover, the following `repmgrd` options must
|
||||
be set in `repmgr.conf`:
|
||||
|
||||
failover=automatic
|
||||
promote_command='repmgr standby promote -f /etc/repmgr.conf'
|
||||
follow_command='repmgr standby follow -f /etc/repmgr.conf'
|
||||
|
||||
(See `repmgr.conf.sample` for further `repmgrd`-specific settings).
|
||||
|
||||
Additionally, `postgresql.conf` must contain the following line:
|
||||
To use `repmgrd` for automatic failover, `postgresql.conf` must contain the
|
||||
following line:
|
||||
|
||||
shared_preload_libraries = 'repmgr_funcs'
|
||||
|
||||
(changing this setting requires a restart of PostgreSQL).
|
||||
|
||||
Additionally the following `repmgrd` options must be set in `repmgr.conf`:
|
||||
|
||||
failover=automatic
|
||||
promote_command='repmgr standby promote -f /etc/repmgr.conf --log-to-file'
|
||||
follow_command='repmgr standby follow -f /etc/repmgr.conf --log-to-file'
|
||||
|
||||
Note that the `--log-to-file` option will cause `repmgr`'s output to be logged to
|
||||
the destination configured to receive log output for `repmgrd`.
|
||||
See `repmgr.conf.sample` for further `repmgrd`-specific settings.
|
||||
|
||||
When `failover` is set to `automatic`, upon detecting failure of the current
|
||||
master, `repmgrd` will execute one of `promote_command` or `follow_command`,
|
||||
depending on whether the current server is becoming the new master or
|
||||
@@ -1421,7 +1464,9 @@ functionality will be included in a feature release (e.g. 3.0.x to 3.1.x).
|
||||
|
||||
In general `repmgr` can be upgraded as-is without any further action required,
|
||||
however feature releases may require the `repmgr` database to be upgraded.
|
||||
An SQL script will be provided - please check the release notes for details.
|
||||
An SQL script will be provided - please check the release notes for details:
|
||||
|
||||
* http://repmgr.org/release-notes-3.3.html#UPGRADING
|
||||
|
||||
|
||||
Distribution-specific configuration
|
||||
@@ -1524,7 +1569,7 @@ which contains connection details for the local database.
|
||||
bootstrapping new installations. To update an existing but 'stale'
|
||||
data directory (for example belonging to a failed master), `rsync`
|
||||
must be used by specifying `--rsync-only`. In this case,
|
||||
password-less SSH connections between servers are required.
|
||||
passwordless SSH connections between servers are required.
|
||||
|
||||
* `standby promote`
|
||||
|
||||
@@ -1538,13 +1583,13 @@ which contains connection details for the local database.
|
||||
by using `standby follow` (see below); if `repmgrd` is active, it will
|
||||
handle this.
|
||||
|
||||
This command will not function if the current master is still running.
|
||||
This command will fail with an error if the current master is still running.
|
||||
|
||||
* `standby switchover`
|
||||
|
||||
Promotes a standby to master and demotes the existing master to a standby.
|
||||
This command must be run on the standby to be promoted, and requires a
|
||||
password-less SSH connection to the current master. Additionally the
|
||||
passwordless SSH connection to the current master. Additionally the
|
||||
location of the master's `repmgr.conf` file must be provided with
|
||||
`-C/--remote-config-file`.
|
||||
|
||||
@@ -1651,7 +1696,7 @@ which contains connection details for the local database.
|
||||
overview of connections between all databases in the cluster.
|
||||
|
||||
These commands require a valid `repmgr.conf` file on each node.
|
||||
Additionally password-less `ssh` connections are required between
|
||||
Additionally passwordless `ssh` connections are required between
|
||||
all nodes.
|
||||
|
||||
Example 1 (all nodes up):
|
||||
@@ -1745,6 +1790,21 @@ which contains connection details for the local database.
|
||||
the current working directory; no additional arguments are required.
|
||||
|
||||
|
||||
### Further documentation
|
||||
|
||||
As well as this README, the `repmgr` source contains the following additional
|
||||
documentation files:
|
||||
|
||||
* FAQ.md - frequently asked questions
|
||||
* CONTRIBUTING.md - how to contribute to `repmgr`
|
||||
* PACKAGES.md - details on building packages
|
||||
* SSH-RSYNC.md - how to set up passwordless SSH between nodes
|
||||
* docs/repmgrd-failover-mechanism.md - how repmgrd picks which node to promote
|
||||
* docs/repmgrd-node-fencing.md - how to "fence" a failed master node
|
||||
|
||||
|
||||
|
||||
|
||||
### Error codes
|
||||
|
||||
`repmgr` or `repmgrd` will return one of the following error codes on program
|
||||
@@ -1814,6 +1874,7 @@ Thanks from the repmgr core team.
|
||||
Further reading
|
||||
---------------
|
||||
|
||||
* http://blog.2ndquadrant.com/repmgr-3-2-is-here-barman-support-brand-new-high-availability-features/
|
||||
* http://blog.2ndquadrant.com/improvements-in-repmgr-3-1-4/
|
||||
* http://blog.2ndquadrant.com/managing-useful-clusters-repmgr/
|
||||
* http://blog.2ndquadrant.com/easier_postgresql_90_clusters/
|
||||
|
||||
@@ -1,6 +1,6 @@
|
||||
/*
|
||||
* check_dir.c - Directories management functions
|
||||
* Copyright (C) 2ndQuadrant, 2010-2016
|
||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||
*
|
||||
* This program is free software: you can redistribute it and/or modify
|
||||
* it under the terms of the GNU General Public License as published by
|
||||
|
||||
@@ -1,6 +1,6 @@
|
||||
/*
|
||||
* check_dir.h
|
||||
* Copyright (c) 2ndQuadrant, 2010-2016
|
||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||
*
|
||||
* This program is free software: you can redistribute it and/or modify
|
||||
* it under the terms of the GNU General Public License as published by
|
||||
|
||||
107
compat.c
Normal file
107
compat.c
Normal file
@@ -0,0 +1,107 @@
|
||||
/*
|
||||
*
|
||||
* compat.c
|
||||
* Provides a couple of useful string utility functions adapted
|
||||
* from the backend code, which are not publicly exposed. They're
|
||||
* unlikely to change but it would be worth keeping an eye on them
|
||||
* for any fixes/improvements
|
||||
*
|
||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||
*
|
||||
* Portions Copyright (c) 1996-2013, PostgreSQL Global Development Group
|
||||
* Portions Copyright (c) 1994, Regents of the University of California
|
||||
*
|
||||
* This program is free software: you can redistribute it and/or modify
|
||||
* it under the terms of the GNU General Public License as published by
|
||||
* the Free Software Foundation, either version 3 of the License, or
|
||||
* (at your option) any later version.
|
||||
*
|
||||
* This program is distributed in the hope that it will be useful,
|
||||
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||
* GNU General Public License for more details.
|
||||
*
|
||||
* You should have received a copy of the GNU General Public License
|
||||
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||
*
|
||||
*/
|
||||
|
||||
#include "repmgr.h"
|
||||
#include "compat.h"
|
||||
|
||||
/*
|
||||
* Append the given string to the buffer, with suitable quoting for passing
|
||||
* the string as a value in a keyword/value pair in a libpq connection
|
||||
* string
|
||||
*
|
||||
* buf: PQExpBuffer which receives the (possibly quoted) value
|
||||
* str: NUL-terminated value to append; it is only read, never modified
|
||||
*
|
||||
* Values consisting solely of letters, digits, '_' and '.' are appended
|
||||
* unchanged; anything else (including the empty string) is wrapped in
|
||||
* single quotes, with embedded single quotes and backslashes
|
||||
* backslash-escaped.
|
||||
*
|
||||
* This function is adapted from src/fe_utils/string_utils.c (before 9.6
|
||||
* located in: src/bin/pg_dump/dumputils.c)
|
||||
*/
|
||||
void
|
||||
appendConnStrVal(PQExpBuffer buf, const char *str)
|
||||
{
|
||||
const char *s;
|
||||
bool needquotes;
|
||||
|
||||
/*
|
||||
* If the string is one or more plain ASCII characters, no need to quote
|
||||
* it. This is quite conservative, but better safe than sorry.
|
||||
*
|
||||
* "Plain" here means letters, digits, '_' and '.' only. An empty string
|
||||
* never enters the loop, so needquotes keeps its initial value of true
|
||||
* and the value is emitted as a pair of single quotes.
|
||||
*/
|
||||
needquotes = true;
|
||||
for (s = str; *s; s++)
|
||||
{
|
||||
if (!((*s >= 'a' && *s <= 'z') || (*s >= 'A' && *s <= 'Z') ||
|
||||
(*s >= '0' && *s <= '9') || *s == '_' || *s == '.'))
|
||||
{
|
||||
needquotes = true;
|
||||
break;
|
||||
}
|
||||
needquotes = false;
|
||||
}
|
||||
|
||||
if (needquotes)
|
||||
{
|
||||
appendPQExpBufferChar(buf, '\'');
|
||||
while (*str)
|
||||
{
|
||||
/* ' and \ must be escaped to \' and \\ */
|
||||
if (*str == '\'' || *str == '\\')
|
||||
appendPQExpBufferChar(buf, '\\');
|
||||
|
||||
appendPQExpBufferChar(buf, *str);
|
||||
str++;
|
||||
}
|
||||
appendPQExpBufferChar(buf, '\'');
|
||||
}
|
||||
else
|
||||
appendPQExpBufferStr(buf, str);
|
||||
}
|
||||
|
||||
/*
|
||||
* Append the given string to the buffer as a single-quoted shell argument
|
||||
*
|
||||
* buf: PQExpBuffer which receives the quoted argument
|
||||
* str: NUL-terminated argument text; it is only read, never modified
|
||||
*
|
||||
* The whole value is wrapped in single quotes. Each embedded single quote
|
||||
* is replaced by a five-character sequence which ends the quoted run,
|
||||
* supplies the quote character inside double quotes, and starts a new
|
||||
* single-quoted run.
|
||||
*
|
||||
* A newline or carriage return in str is treated as fatal: an error is
|
||||
* written to stderr and the process exits with ERR_BAD_CONFIG. Note that
|
||||
* the opening quote (and any characters before the offending one) will
|
||||
* already have been appended to buf at that point.
|
||||
*
|
||||
* Adapted from: src/fe_utils/string_utils.c
|
||||
*/
|
||||
void
|
||||
appendShellString(PQExpBuffer buf, const char *str)
|
||||
{
|
||||
const char *p;
|
||||
|
||||
appendPQExpBufferChar(buf, '\'');
|
||||
for (p = str; *p; p++)
|
||||
{
|
||||
if (*p == '\n' || *p == '\r')
|
||||
{
|
||||
fprintf(stderr,
|
||||
_("shell command argument contains a newline or carriage return: \"%s\"\n"),
|
||||
str);
|
||||
exit(ERR_BAD_CONFIG);
|
||||
}
|
||||
|
||||
if (*p == '\'')
|
||||
appendPQExpBufferStr(buf, "'\"'\"'"); /* end the single-quoted run, add a double-quoted single quote, then reopen */
|
||||
else
|
||||
appendPQExpBufferChar(buf, *p);
|
||||
}
|
||||
|
||||
appendPQExpBufferChar(buf, '\'');
}
|
||||
|
||||
29
compat.h
Normal file
29
compat.h
Normal file
@@ -0,0 +1,29 @@
|
||||
/*
|
||||
* compat.h
|
||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||
*
|
||||
* This program is free software: you can redistribute it and/or modify
|
||||
* it under the terms of the GNU General Public License as published by
|
||||
* the Free Software Foundation, either version 3 of the License, or
|
||||
* (at your option) any later version.
|
||||
*
|
||||
* This program is distributed in the hope that it will be useful,
|
||||
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||
* GNU General Public License for more details.
|
||||
*
|
||||
* You should have received a copy of the GNU General Public License
|
||||
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||
*
|
||||
*/
|
||||
|
||||
#ifndef _COMPAT_H_
|
||||
#define _COMPAT_H_
|
||||
|
||||
/* NOTE(review): PQExpBuffer is not declared by this header; presumably the including file pulls it in first - confirm */
/* Append str to buf as a libpq connection string value, quoting it if required */
extern void
|
||||
appendConnStrVal(PQExpBuffer buf, const char *str);
|
||||
|
||||
/* Append str to buf as a single-quoted shell argument */
extern void
|
||||
appendShellString(PQExpBuffer buf, const char *str);
|
||||
|
||||
#endif
|
||||
329
config.c
329
config.c
@@ -1,7 +1,7 @@
|
||||
/*
|
||||
* config.c - Functions to parse the config file
|
||||
*
|
||||
* Copyright (C) 2ndQuadrant, 2010-2016
|
||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||
*
|
||||
* This program is free software: you can redistribute it and/or modify
|
||||
* it under the terms of the GNU General Public License as published by
|
||||
@@ -10,11 +10,11 @@
|
||||
*
|
||||
* This program is distributed in the hope that it will be useful,
|
||||
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||
* GNU General Public License for more details.
|
||||
*
|
||||
* You should have received a copy of the GNU General Public License
|
||||
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||
*
|
||||
*/
|
||||
|
||||
@@ -55,8 +55,8 @@ progname(void)
|
||||
*
|
||||
* Returns true if a configuration file could be parsed, otherwise false.
|
||||
*
|
||||
* Any configuration options changed in this function must also be changed in
|
||||
* reload_config()
|
||||
* Any *repmgrd-specific* configuration options added/changed in this function must also be
|
||||
* added/changed in reload_config()
|
||||
*
|
||||
* NOTE: this function is called before the logger is set up, so we need
|
||||
* to handle the verbose option ourselves; also the default log level is NOTICE,
|
||||
@@ -99,9 +99,9 @@ load_config(const char *config_file, bool verbose, t_configuration_options *opti
|
||||
/*
|
||||
* If no configuration file was provided, attempt to find a default file
|
||||
* in this order:
|
||||
* - current directory
|
||||
* - /etc/repmgr.conf
|
||||
* - default sysconfdir
|
||||
* - current directory
|
||||
* - /etc/repmgr.conf
|
||||
* - default sysconfdir
|
||||
*
|
||||
* here we just check for the existence of the file; parse_config()
|
||||
* will handle read errors etc.
|
||||
@@ -181,6 +181,23 @@ load_config(const char *config_file, bool verbose, t_configuration_options *opti
|
||||
}
|
||||
|
||||
|
||||
/*
|
||||
* parse_config()
|
||||
*
|
||||
* Wrapper around _parse_config(): parses the configuration into *options,
|
||||
* collecting any problems in a function-local static error list.
|
||||
*
|
||||
* If at least one error was recorded, the list is handed to
|
||||
* exit_with_errors() (presumably this reports the errors and terminates
|
||||
* the program - confirm against its definition). Otherwise returns true;
|
||||
* no code path in this function returns false.
|
||||
*
|
||||
* Because the error list is static, it is not reset between calls.
|
||||
*/
bool
|
||||
parse_config(t_configuration_options *options)
|
||||
{
|
||||
/* Collate configuration file errors here for friendlier reporting */
|
||||
static ItemList config_errors = { NULL, NULL };
|
||||
|
||||
_parse_config(options, &config_errors);
|
||||
|
||||
if (config_errors.head != NULL)
|
||||
{
|
||||
exit_with_errors(&config_errors);
|
||||
}
|
||||
|
||||
return true;
|
||||
}
|
||||
|
||||
|
||||
/*
|
||||
* Parse configuration file; if any errors are encountered,
|
||||
* list them and exit.
|
||||
@@ -188,8 +205,8 @@ load_config(const char *config_file, bool verbose, t_configuration_options *opti
|
||||
* Ensure any default values set here are synced with repmgr.conf.sample
|
||||
* and any other documentation.
|
||||
*/
|
||||
bool
|
||||
parse_config(t_configuration_options *options)
|
||||
void
|
||||
_parse_config(t_configuration_options *options, ItemList *error_list)
|
||||
{
|
||||
FILE *fp;
|
||||
char *s,
|
||||
@@ -201,9 +218,6 @@ parse_config(t_configuration_options *options)
|
||||
PQconninfoOption *conninfo_options;
|
||||
char *conninfo_errmsg = NULL;
|
||||
|
||||
/* Collate configuration file errors here for friendlier reporting */
|
||||
static ItemList config_errors = { NULL, NULL };
|
||||
|
||||
bool node_found = false;
|
||||
|
||||
/* Initialize configuration options with sensible defaults
|
||||
@@ -211,7 +225,7 @@ parse_config(t_configuration_options *options)
|
||||
* to be initialised here
|
||||
*/
|
||||
memset(options->cluster_name, 0, sizeof(options->cluster_name));
|
||||
options->node = -1;
|
||||
options->node = UNKNOWN_NODE_ID;
|
||||
options->upstream_node = NO_UPSTREAM_NODE;
|
||||
options->use_replication_slots = 0;
|
||||
memset(options->conninfo, 0, sizeof(options->conninfo));
|
||||
@@ -262,7 +276,7 @@ parse_config(t_configuration_options *options)
|
||||
{
|
||||
log_verbose(LOG_NOTICE, _("no configuration file provided and no default file found - "
|
||||
"continuing with default values\n"));
|
||||
return true;
|
||||
return;
|
||||
}
|
||||
|
||||
fp = fopen(config_file_path, "r");
|
||||
@@ -307,11 +321,11 @@ parse_config(t_configuration_options *options)
|
||||
strncpy(options->cluster_name, value, MAXLEN);
|
||||
else if (strcmp(name, "node") == 0)
|
||||
{
|
||||
options->node = repmgr_atoi(value, "node", &config_errors, false);
|
||||
options->node = repmgr_atoi(value, "node", error_list, false);
|
||||
node_found = true;
|
||||
}
|
||||
else if (strcmp(name, "upstream_node") == 0)
|
||||
options->upstream_node = repmgr_atoi(value, "upstream_node", &config_errors, false);
|
||||
options->upstream_node = repmgr_atoi(value, "upstream_node", error_list, false);
|
||||
else if (strcmp(name, "conninfo") == 0)
|
||||
strncpy(options->conninfo, value, MAXLEN);
|
||||
else if (strcmp(name, "barman_server") == 0)
|
||||
@@ -342,11 +356,11 @@ parse_config(t_configuration_options *options)
|
||||
}
|
||||
else
|
||||
{
|
||||
item_list_append(&config_errors,_("value for 'failover' must be 'automatic' or 'manual'\n"));
|
||||
item_list_append(error_list, _("value for 'failover' must be 'automatic' or 'manual'\n"));
|
||||
}
|
||||
}
|
||||
else if (strcmp(name, "priority") == 0)
|
||||
options->priority = repmgr_atoi(value, "priority", &config_errors, true);
|
||||
options->priority = repmgr_atoi(value, "priority", error_list, true);
|
||||
else if (strcmp(name, "node_name") == 0)
|
||||
strncpy(options->node_name, value, MAXLEN);
|
||||
else if (strcmp(name, "promote_command") == 0)
|
||||
@@ -364,17 +378,17 @@ parse_config(t_configuration_options *options)
|
||||
else if (strcmp(name, "service_promote_command") == 0)
|
||||
strncpy(options->service_promote_command, value, MAXLEN);
|
||||
else if (strcmp(name, "master_response_timeout") == 0)
|
||||
options->master_response_timeout = repmgr_atoi(value, "master_response_timeout", &config_errors, false);
|
||||
options->master_response_timeout = repmgr_atoi(value, "master_response_timeout", error_list, false);
|
||||
/*
|
||||
* 'primary_response_timeout' as synonym for 'master_response_timeout' -
|
||||
* we'll switch terminology in a future release (3.1?)
|
||||
*/
|
||||
else if (strcmp(name, "primary_response_timeout") == 0)
|
||||
options->master_response_timeout = repmgr_atoi(value, "primary_response_timeout", &config_errors, false);
|
||||
options->master_response_timeout = repmgr_atoi(value, "primary_response_timeout", error_list, false);
|
||||
else if (strcmp(name, "reconnect_attempts") == 0)
|
||||
options->reconnect_attempts = repmgr_atoi(value, "reconnect_attempts", &config_errors, false);
|
||||
options->reconnect_attempts = repmgr_atoi(value, "reconnect_attempts", error_list, false);
|
||||
else if (strcmp(name, "reconnect_interval") == 0)
|
||||
options->reconnect_interval = repmgr_atoi(value, "reconnect_interval", &config_errors, false);
|
||||
options->reconnect_interval = repmgr_atoi(value, "reconnect_interval", error_list, false);
|
||||
else if (strcmp(name, "pg_bindir") == 0)
|
||||
strncpy(options->pg_bindir, value, MAXLEN);
|
||||
else if (strcmp(name, "pg_ctl_options") == 0)
|
||||
@@ -384,14 +398,14 @@ parse_config(t_configuration_options *options)
|
||||
else if (strcmp(name, "logfile") == 0)
|
||||
strncpy(options->logfile, value, MAXLEN);
|
||||
else if (strcmp(name, "monitor_interval_secs") == 0)
|
||||
options->monitor_interval_secs = repmgr_atoi(value, "monitor_interval_secs", &config_errors, false);
|
||||
options->monitor_interval_secs = repmgr_atoi(value, "monitor_interval_secs", error_list, false);
|
||||
else if (strcmp(name, "retry_promote_interval_secs") == 0)
|
||||
options->retry_promote_interval_secs = repmgr_atoi(value, "retry_promote_interval_secs", &config_errors, false);
|
||||
options->retry_promote_interval_secs = repmgr_atoi(value, "retry_promote_interval_secs", error_list, false);
|
||||
else if (strcmp(name, "witness_repl_nodes_sync_interval_secs") == 0)
|
||||
options->witness_repl_nodes_sync_interval_secs = repmgr_atoi(value, "witness_repl_nodes_sync_interval_secs", &config_errors, false);
|
||||
options->witness_repl_nodes_sync_interval_secs = repmgr_atoi(value, "witness_repl_nodes_sync_interval_secs", error_list, false);
|
||||
else if (strcmp(name, "use_replication_slots") == 0)
|
||||
/* XXX we should have a dedicated boolean argument format */
|
||||
options->use_replication_slots = repmgr_atoi(value, "use_replication_slots", &config_errors, false);
|
||||
options->use_replication_slots = repmgr_atoi(value, "use_replication_slots", error_list, false);
|
||||
else if (strcmp(name, "event_notification_command") == 0)
|
||||
strncpy(options->event_notification_command, value, MAXLEN);
|
||||
else if (strcmp(name, "event_notifications") == 0)
|
||||
@@ -419,7 +433,7 @@ parse_config(t_configuration_options *options)
|
||||
_("no value provided for parameter \"%s\""),
|
||||
name);
|
||||
|
||||
item_list_append(&config_errors, error_message_buf);
|
||||
item_list_append(error_list, error_message_buf);
|
||||
}
|
||||
}
|
||||
|
||||
@@ -428,11 +442,15 @@ parse_config(t_configuration_options *options)
|
||||
|
||||
if (node_found == false)
|
||||
{
|
||||
item_list_append(&config_errors, _("\"node\": parameter was not found"));
|
||||
item_list_append(error_list, _("\"node\": parameter was not found"));
|
||||
}
|
||||
else if (options->node == 0)
|
||||
{
|
||||
item_list_append(&config_errors, _("\"node\": must be greater than zero"));
|
||||
item_list_append(error_list, _("\"node\": must be greater than zero"));
|
||||
}
|
||||
else if (options->node < 0)
|
||||
{
|
||||
item_list_append(error_list, _("\"node\": must be a positive signed 32 bit integer, i.e. 2147483647 or less"));
|
||||
}
|
||||
|
||||
if (strlen(options->conninfo))
|
||||
@@ -452,18 +470,11 @@ parse_config(t_configuration_options *options)
|
||||
_("\"conninfo\": %s"),
|
||||
conninfo_errmsg);
|
||||
|
||||
item_list_append(&config_errors, error_message_buf);
|
||||
item_list_append(error_list, error_message_buf);
|
||||
}
|
||||
|
||||
PQconninfoFree(conninfo_options);
|
||||
}
|
||||
|
||||
if (config_errors.head != NULL)
|
||||
{
|
||||
exit_with_errors(&config_errors);
|
||||
}
|
||||
|
||||
return true;
|
||||
}
|
||||
|
||||
|
||||
@@ -553,70 +564,85 @@ parse_line(char *buf, char *name, char *value)
|
||||
trim(value);
|
||||
}
|
||||
|
||||
|
||||
/*
|
||||
* reload_config()
|
||||
*
|
||||
* This is only called by repmgrd after receiving a SIGHUP or when a monitoring
|
||||
* loop is started up; it therefore only needs to reload options required
|
||||
* by repmgrd, which are as follows:
|
||||
*
|
||||
* changeable options:
|
||||
* - failover
|
||||
* - follow_command
|
||||
* - logfacility
|
||||
* - logfile
|
||||
* - loglevel
|
||||
* - master_response_timeout
|
||||
* - monitor_interval_secs
|
||||
* - priority
|
||||
* - promote_command
|
||||
* - reconnect_attempts
|
||||
* - reconnect_interval
|
||||
* - retry_promote_interval_secs
|
||||
* - witness_repl_nodes_sync_interval_secs
|
||||
*
|
||||
* non-changeable options:
|
||||
* - cluster_name
|
||||
* - conninfo
|
||||
* - node
|
||||
* - node_name
|
||||
*
|
||||
* extract with something like:
|
||||
* grep local_options\\. repmgrd.c | perl -n -e '/local_options\.([\w_]+)/ && print qq|$1\n|;' | sort | uniq
|
||||
|
||||
*/
|
||||
bool
|
||||
reload_config(t_configuration_options *orig_options)
|
||||
{
|
||||
PGconn *conn;
|
||||
t_configuration_options new_options;
|
||||
t_configuration_options new_options = T_CONFIGURATION_OPTIONS_INITIALIZER;
|
||||
bool config_changed = false;
|
||||
bool log_config_changed = false;
|
||||
|
||||
static ItemList config_errors = { NULL, NULL };
|
||||
|
||||
/*
|
||||
* Re-read the configuration file: repmgr.conf
|
||||
*/
|
||||
log_info(_("reloading configuration file and updating repmgr tables\n"));
|
||||
log_info(_("reloading configuration file\n"));
|
||||
|
||||
parse_config(&new_options);
|
||||
if (new_options.node == -1)
|
||||
_parse_config(&new_options, &config_errors);
|
||||
|
||||
if (config_errors.head != NULL)
|
||||
{
|
||||
/* XXX dump errors to log */
|
||||
log_warning(_("unable to parse new configuration, retaining current configuration\n"));
|
||||
return false;
|
||||
}
|
||||
|
||||
/* The following options cannot be changed */
|
||||
if (strcmp(new_options.cluster_name, orig_options->cluster_name) != 0)
|
||||
{
|
||||
log_warning(_("unable to change cluster name, retaining current configuration\n"));
|
||||
log_warning(_("cluster_name cannot be changed, retaining current configuration\n"));
|
||||
return false;
|
||||
}
|
||||
|
||||
if (new_options.node != orig_options->node)
|
||||
{
|
||||
log_warning(_("unable to change node ID, retaining current configuration\n"));
|
||||
log_warning(_("node ID cannot be changed, retaining current configuration\n"));
|
||||
return false;
|
||||
}
|
||||
|
||||
if (strcmp(new_options.node_name, orig_options->node_name) != 0)
|
||||
{
|
||||
log_warning(_("unable to change standby name, keeping current configuration\n"));
|
||||
return false;
|
||||
}
|
||||
|
||||
if (new_options.failover != MANUAL_FAILOVER && new_options.failover != AUTOMATIC_FAILOVER)
|
||||
{
|
||||
log_warning(_("new value for 'failover' must be 'automatic' or 'manual'\n"));
|
||||
return false;
|
||||
}
|
||||
|
||||
if (new_options.master_response_timeout <= 0)
|
||||
{
|
||||
log_warning(_("new value for 'master_response_timeout' must be greater than zero\n"));
|
||||
return false;
|
||||
}
|
||||
|
||||
if (new_options.reconnect_attempts < 0)
|
||||
{
|
||||
log_warning(_("new value for 'reconnect_attempts' must be zero or greater\n"));
|
||||
return false;
|
||||
}
|
||||
|
||||
if (new_options.reconnect_interval < 0)
|
||||
{
|
||||
log_warning(_("new value for 'reconnect_interval' must be zero or greater\n"));
|
||||
log_warning(_("node_name cannot be changed, keeping current configuration\n"));
|
||||
return false;
|
||||
}
|
||||
|
||||
if (strcmp(orig_options->conninfo, new_options.conninfo) != 0)
|
||||
{
|
||||
/* Test conninfo string */
|
||||
/* Test conninfo string works*/
|
||||
conn = establish_db_connection(new_options.conninfo, false);
|
||||
if (!conn || (PQstatus(conn) != CONNECTION_OK))
|
||||
{
|
||||
@@ -633,34 +659,6 @@ reload_config(t_configuration_options *orig_options)
|
||||
* to manage them
|
||||
*/
|
||||
|
||||
/* cluster_name */
|
||||
if (strcmp(orig_options->cluster_name, new_options.cluster_name) != 0)
|
||||
{
|
||||
strcpy(orig_options->cluster_name, new_options.cluster_name);
|
||||
config_changed = true;
|
||||
}
|
||||
|
||||
/* conninfo */
|
||||
if (strcmp(orig_options->conninfo, new_options.conninfo) != 0)
|
||||
{
|
||||
strcpy(orig_options->conninfo, new_options.conninfo);
|
||||
config_changed = true;
|
||||
}
|
||||
|
||||
/* barman_server */
|
||||
if (strcmp(orig_options->barman_server, new_options.barman_server) != 0)
|
||||
{
|
||||
strcpy(orig_options->barman_server, new_options.barman_server);
|
||||
config_changed = true;
|
||||
}
|
||||
|
||||
/* node */
|
||||
if (orig_options->node != new_options.node)
|
||||
{
|
||||
orig_options->node = new_options.node;
|
||||
config_changed = true;
|
||||
}
|
||||
|
||||
/* failover */
|
||||
if (orig_options->failover != new_options.failover)
|
||||
{
|
||||
@@ -668,27 +666,6 @@ reload_config(t_configuration_options *orig_options)
|
||||
config_changed = true;
|
||||
}
|
||||
|
||||
/* priority */
|
||||
if (orig_options->priority != new_options.priority)
|
||||
{
|
||||
orig_options->priority = new_options.priority;
|
||||
config_changed = true;
|
||||
}
|
||||
|
||||
/* node_name */
|
||||
if (strcmp(orig_options->node_name, new_options.node_name) != 0)
|
||||
{
|
||||
strcpy(orig_options->node_name, new_options.node_name);
|
||||
config_changed = true;
|
||||
}
|
||||
|
||||
/* promote_command */
|
||||
if (strcmp(orig_options->promote_command, new_options.promote_command) != 0)
|
||||
{
|
||||
strcpy(orig_options->promote_command, new_options.promote_command);
|
||||
config_changed = true;
|
||||
}
|
||||
|
||||
/* follow_command */
|
||||
if (strcmp(orig_options->follow_command, new_options.follow_command) != 0)
|
||||
{
|
||||
@@ -696,30 +673,6 @@ reload_config(t_configuration_options *orig_options)
|
||||
config_changed = true;
|
||||
}
|
||||
|
||||
/*
|
||||
* XXX These ones can change with a simple SIGHUP?
|
||||
*
|
||||
* strcpy (orig_options->loglevel, new_options.loglevel); strcpy
|
||||
* (orig_options->logfacility, new_options.logfacility);
|
||||
*
|
||||
* logger_shutdown(); XXX do we have progname here ? logger_init(progname,
|
||||
* orig_options.loglevel, orig_options.logfacility);
|
||||
*/
|
||||
|
||||
/* rsync_options */
|
||||
if (strcmp(orig_options->rsync_options, new_options.rsync_options) != 0)
|
||||
{
|
||||
strcpy(orig_options->rsync_options, new_options.rsync_options);
|
||||
config_changed = true;
|
||||
}
|
||||
|
||||
/* ssh_options */
|
||||
if (strcmp(orig_options->ssh_options, new_options.ssh_options) != 0)
|
||||
{
|
||||
strcpy(orig_options->ssh_options, new_options.ssh_options);
|
||||
config_changed = true;
|
||||
}
|
||||
|
||||
/* master_response_timeout */
|
||||
if (orig_options->master_response_timeout != new_options.master_response_timeout)
|
||||
{
|
||||
@@ -727,6 +680,27 @@ reload_config(t_configuration_options *orig_options)
|
||||
config_changed = true;
|
||||
}
|
||||
|
||||
/* monitor_interval_secs */
|
||||
if (orig_options->monitor_interval_secs != new_options.monitor_interval_secs)
|
||||
{
|
||||
orig_options->monitor_interval_secs = new_options.monitor_interval_secs;
|
||||
config_changed = true;
|
||||
}
|
||||
|
||||
/* priority */
|
||||
if (orig_options->priority != new_options.priority)
|
||||
{
|
||||
orig_options->priority = new_options.priority;
|
||||
config_changed = true;
|
||||
}
|
||||
|
||||
/* promote_command */
|
||||
if (strcmp(orig_options->promote_command, new_options.promote_command) != 0)
|
||||
{
|
||||
strcpy(orig_options->promote_command, new_options.promote_command);
|
||||
config_changed = true;
|
||||
}
|
||||
|
||||
/* reconnect_attempts */
|
||||
if (orig_options->reconnect_attempts != new_options.reconnect_attempts)
|
||||
{
|
||||
@@ -741,27 +715,6 @@ reload_config(t_configuration_options *orig_options)
|
||||
config_changed = true;
|
||||
}
|
||||
|
||||
/* pg_ctl_options */
|
||||
if (strcmp(orig_options->pg_ctl_options, new_options.pg_ctl_options) != 0)
|
||||
{
|
||||
strcpy(orig_options->pg_ctl_options, new_options.pg_ctl_options);
|
||||
config_changed = true;
|
||||
}
|
||||
|
||||
/* pg_basebackup_options */
|
||||
if (strcmp(orig_options->pg_basebackup_options, new_options.pg_basebackup_options) != 0)
|
||||
{
|
||||
strcpy(orig_options->pg_basebackup_options, new_options.pg_basebackup_options);
|
||||
config_changed = true;
|
||||
}
|
||||
|
||||
/* monitor_interval_secs */
|
||||
if (orig_options->monitor_interval_secs != new_options.monitor_interval_secs)
|
||||
{
|
||||
orig_options->monitor_interval_secs = new_options.monitor_interval_secs;
|
||||
config_changed = true;
|
||||
}
|
||||
|
||||
/* retry_promote_interval_secs */
|
||||
if (orig_options->retry_promote_interval_secs != new_options.retry_promote_interval_secs)
|
||||
{
|
||||
@@ -769,20 +722,54 @@ reload_config(t_configuration_options *orig_options)
|
||||
config_changed = true;
|
||||
}
|
||||
|
||||
/* use_replication_slots */
|
||||
if (orig_options->use_replication_slots != new_options.use_replication_slots)
|
||||
|
||||
/* witness_repl_nodes_sync_interval_secs */
|
||||
if (orig_options->witness_repl_nodes_sync_interval_secs != new_options.witness_repl_nodes_sync_interval_secs)
|
||||
{
|
||||
orig_options->use_replication_slots = new_options.use_replication_slots;
|
||||
orig_options->witness_repl_nodes_sync_interval_secs = new_options.witness_repl_nodes_sync_interval_secs;
|
||||
config_changed = true;
|
||||
}
|
||||
|
||||
/*
|
||||
* Handle changes to logging configuration
|
||||
*/
|
||||
if (strcmp(orig_options->logfacility, new_options.logfacility) != 0)
|
||||
{
|
||||
strcpy(orig_options->logfacility, new_options.logfacility);
|
||||
log_config_changed = true;
|
||||
}
|
||||
|
||||
if (strcmp(orig_options->logfile, new_options.logfile) != 0)
|
||||
{
|
||||
strcpy(orig_options->logfile, new_options.logfile);
|
||||
log_config_changed = true;
|
||||
}
|
||||
|
||||
|
||||
if (strcmp(orig_options->loglevel, new_options.loglevel) != 0)
|
||||
{
|
||||
strcpy(orig_options->loglevel, new_options.loglevel);
|
||||
log_config_changed = true;
|
||||
}
|
||||
|
||||
if (log_config_changed == true)
|
||||
{
|
||||
log_notice(_("restarting logging with changed parameters\n"));
|
||||
logger_shutdown();
|
||||
logger_init(orig_options, progname());
|
||||
}
|
||||
|
||||
if (config_changed == true)
|
||||
{
|
||||
log_debug(_("reload_config(): configuration has changed\n"));
|
||||
log_notice(_("configuration file reloaded with changed parameters\n"));
|
||||
}
|
||||
else
|
||||
/*
|
||||
* if logging configuration changed, don't say the configuration didn't
|
||||
* change, as it clearly has.
|
||||
*/
|
||||
else if (log_config_changed == false)
|
||||
{
|
||||
log_debug(_("reload_config(): configuration has not changed\n"));
|
||||
log_info(_("configuration has not changed\n"));
|
||||
}
|
||||
|
||||
return config_changed;
|
||||
@@ -956,7 +943,7 @@ static void
|
||||
parse_event_notifications_list(t_configuration_options *options, const char *arg)
|
||||
{
|
||||
const char *arg_ptr;
|
||||
char event_type_buf[MAXLEN] = "";
|
||||
char event_type_buf[MAXLEN] = "";
|
||||
char *dst_ptr = event_type_buf;
|
||||
|
||||
|
||||
|
||||
9
config.h
9
config.h
@@ -1,7 +1,7 @@
|
||||
/*
|
||||
* config.h
|
||||
*
|
||||
* Copyright (c) 2ndQuadrant, 2010-2016
|
||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||
*
|
||||
* This program is free software: you can redistribute it and/or modify
|
||||
* it under the terms of the GNU General Public License as published by
|
||||
@@ -97,7 +97,7 @@ typedef struct
|
||||
* The following will initialize the structure with a minimal set of options;
|
||||
* actual defaults are set in parse_config() before parsing the configuration file
|
||||
*/
|
||||
#define T_CONFIGURATION_OPTIONS_INITIALIZER { "", -1, NO_UPSTREAM_NODE, "", "", "", MANUAL_FAILOVER, -1, "", "", "", "", "", "", "", "", "", "", "", "", -1, -1, -1, "", "", "", "", "", 0, 0, 0, 0, "", { NULL, NULL }, { NULL, NULL } }
|
||||
#define T_CONFIGURATION_OPTIONS_INITIALIZER { "", UNKNOWN_NODE_ID, NO_UPSTREAM_NODE, "", "", "", MANUAL_FAILOVER, -1, "", "", "", "", "", "", "", "", "", "", "", "", -1, -1, -1, "", "", "", "", "", 0, 0, 0, 0, "", { NULL, NULL }, { NULL, NULL } }
|
||||
|
||||
typedef struct ItemListCell
|
||||
{
|
||||
@@ -131,8 +131,11 @@ void set_progname(const char *argv0);
|
||||
const char * progname(void);
|
||||
|
||||
bool load_config(const char *config_file, bool verbose, t_configuration_options *options, char *argv0);
|
||||
bool reload_config(t_configuration_options *orig_options);
|
||||
|
||||
void _parse_config(t_configuration_options *options, ItemList *error_list);
|
||||
bool parse_config(t_configuration_options *options);
|
||||
bool reload_config(t_configuration_options *orig_options);
|
||||
|
||||
void parse_line(char *buff, char *name, char *value);
|
||||
char *trim(char *s);
|
||||
void item_list_append(ItemList *item_list, char *error_message);
|
||||
|
||||
199
dbutils.c
199
dbutils.c
@@ -1,7 +1,7 @@
|
||||
/*
|
||||
* dbutils.c - Database connection/management functions
|
||||
*
|
||||
* Copyright (C) 2ndQuadrant, 2010-2016
|
||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||
*
|
||||
* This program is free software: you can redistribute it and/or modify
|
||||
* it under the terms of the GNU General Public License as published by
|
||||
@@ -33,6 +33,15 @@ char repmgr_schema[MAXLEN] = "";
|
||||
char repmgr_schema_quoted[MAXLEN] = "";
|
||||
|
||||
static int _get_node_record(PGconn *conn, char *cluster, char *sqlquery, t_node_info *node_info);
|
||||
static bool _set_config(PGconn *conn, const char *config_param, const char *sqlquery);
|
||||
|
||||
/*
|
||||
* _establish_db_connection()
|
||||
*
|
||||
* Connect to a database using a conninfo string.
|
||||
*
|
||||
* NOTE: *do not* use this for replication connections; use establish_db_connection_by_params() instead.
|
||||
*/
|
||||
|
||||
PGconn *
|
||||
_establish_db_connection(const char *conninfo, const bool exit_on_error, const bool log_notice, const bool verbose_only)
|
||||
@@ -77,6 +86,19 @@ _establish_db_connection(const char *conninfo, const bool exit_on_error, const b
|
||||
}
|
||||
}
|
||||
|
||||
/*
|
||||
* set "synchronous_commit" to "local" in case synchronous replication is in use
|
||||
*/
|
||||
|
||||
else if (set_config(conn, "synchronous_commit", "local") == false)
|
||||
{
|
||||
if (exit_on_error)
|
||||
{
|
||||
PQfinish(conn);
|
||||
exit(ERR_DB_CON);
|
||||
}
|
||||
}
|
||||
|
||||
return conn;
|
||||
}
|
||||
|
||||
@@ -116,8 +138,12 @@ PGconn *
|
||||
establish_db_connection_by_params(const char *keywords[], const char *values[],
|
||||
const bool exit_on_error)
|
||||
{
|
||||
/* Make a connection to the database */
|
||||
PGconn *conn = PQconnectdbParams(keywords, values, true);
|
||||
PGconn *conn;
|
||||
bool replication_connection = false;
|
||||
int i;
|
||||
|
||||
/* Connect to the database using the provided parameters */
|
||||
conn = PQconnectdbParams(keywords, values, true);
|
||||
|
||||
/* Check to see that the backend connection was successfully made */
|
||||
if ((PQstatus(conn) != CONNECTION_OK))
|
||||
@@ -130,6 +156,28 @@ establish_db_connection_by_params(const char *keywords[], const char *values[],
|
||||
exit(ERR_DB_CON);
|
||||
}
|
||||
}
|
||||
else
|
||||
{
|
||||
/*
|
||||
* set "synchronous_commit" to "local" in case synchronous replication is in
|
||||
* use (provided this is not a replication connection)
|
||||
*/
|
||||
|
||||
for (i = 0; keywords[i]; i++)
|
||||
{
|
||||
if (strcmp(keywords[i], "replication") == 0)
|
||||
replication_connection = true;
|
||||
}
|
||||
|
||||
if (replication_connection == false && set_config(conn, "synchronous_commit", "local") == false)
|
||||
{
|
||||
if (exit_on_error)
|
||||
{
|
||||
PQfinish(conn);
|
||||
exit(ERR_DB_CON);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
return conn;
|
||||
}
|
||||
@@ -279,7 +327,6 @@ is_pgup(PGconn *conn, int timeout)
|
||||
/* Check the connection status twice in case it changes after reset */
|
||||
bool twice = false;
|
||||
|
||||
/* Check the connection status twice in case it changes after reset */
|
||||
for (;;)
|
||||
{
|
||||
if (PQstatus(conn) != CONNECTION_OK)
|
||||
@@ -1151,19 +1198,12 @@ stop_backup(PGconn *conn, char *last_wal_segment)
|
||||
}
|
||||
|
||||
|
||||
|
||||
bool
|
||||
set_config_bool(PGconn *conn, const char *config_param, bool state)
|
||||
_set_config(PGconn *conn, const char *config_param, const char *sqlquery)
|
||||
{
|
||||
char sqlquery[QUERY_STR_LEN];
|
||||
PGresult *res;
|
||||
|
||||
sqlquery_snprintf(sqlquery,
|
||||
"SET %s TO %s",
|
||||
config_param,
|
||||
state ? "TRUE" : "FALSE");
|
||||
|
||||
log_verbose(LOG_DEBUG, "set_config_bool():\n%s\n", sqlquery);
|
||||
|
||||
res = PQexec(conn, sqlquery);
|
||||
|
||||
if (PQresultStatus(res) != PGRES_COMMAND_OK)
|
||||
@@ -1178,6 +1218,36 @@ set_config_bool(PGconn *conn, const char *config_param, bool state)
|
||||
return true;
|
||||
}
|
||||
|
||||
bool
|
||||
set_config(PGconn *conn, const char *config_param, const char *config_value)
|
||||
{
|
||||
char sqlquery[QUERY_STR_LEN];
|
||||
|
||||
sqlquery_snprintf(sqlquery,
|
||||
"SET %s TO '%s'",
|
||||
config_param,
|
||||
config_value);
|
||||
|
||||
log_verbose(LOG_DEBUG, "set_config():\n%s\n", sqlquery);
|
||||
|
||||
return _set_config(conn, config_param, sqlquery);
|
||||
}
|
||||
|
||||
bool
|
||||
set_config_bool(PGconn *conn, const char *config_param, bool state)
|
||||
{
|
||||
char sqlquery[QUERY_STR_LEN];
|
||||
|
||||
sqlquery_snprintf(sqlquery,
|
||||
"SET %s TO %s",
|
||||
config_param,
|
||||
state ? "TRUE" : "FALSE");
|
||||
|
||||
log_verbose(LOG_DEBUG, "set_config_bool():\n%s\n", sqlquery);
|
||||
|
||||
return _set_config(conn, config_param, sqlquery);
|
||||
}
|
||||
|
||||
|
||||
/*
|
||||
* witness_copy_node_records()
|
||||
@@ -1437,10 +1507,11 @@ create_event_record(PGconn *conn, t_configuration_options *options, int node_id,
|
||||
bool success = true;
|
||||
struct tm ts;
|
||||
|
||||
/* Only attempt to write a record if a connection handle was provided.
|
||||
Also check that the repmgr schema has been properly intialised - if
|
||||
not it means no configuration file was provided, which can happen with
|
||||
e.g. `repmgr standby clone`, and we won't know which schema to write to.
|
||||
/*
|
||||
* Only attempt to write a record if a connection handle was provided.
|
||||
* Also check that the repmgr schema has been properly initialised - if
|
||||
* not it means no configuration file was provided, which can happen with
|
||||
* e.g. `repmgr standby clone`, and we won't know which schema to write to.
|
||||
*/
|
||||
if (conn != NULL && strcmp(repmgr_schema, DEFAULT_REPMGR_SCHEMA_PREFIX) != 0)
|
||||
{
|
||||
@@ -1629,6 +1700,89 @@ create_event_record(PGconn *conn, t_configuration_options *options, int node_id,
|
||||
}
|
||||
|
||||
|
||||
bool
|
||||
update_node_record(PGconn *conn, char *action, int node, char *type, int upstream_node, char *cluster_name, char *node_name, char *conninfo, int priority, char *slot_name, bool active)
|
||||
{
|
||||
char sqlquery[QUERY_STR_LEN];
|
||||
char upstream_node_id[MAXLEN];
|
||||
char slot_name_buf[MAXLEN];
|
||||
PGresult *res;
|
||||
|
||||
/* XXX this segment copied from create_node_record() */
|
||||
if (upstream_node == NO_UPSTREAM_NODE)
|
||||
{
|
||||
/*
|
||||
* No explicit upstream node id provided for standby - attempt to
|
||||
* get primary node id
|
||||
*/
|
||||
if (strcmp(type, "standby") == 0)
|
||||
{
|
||||
int primary_node_id = get_master_node_id(conn, cluster_name);
|
||||
maxlen_snprintf(upstream_node_id, "%i", primary_node_id);
|
||||
}
|
||||
else
|
||||
{
|
||||
maxlen_snprintf(upstream_node_id, "%s", "NULL");
|
||||
}
|
||||
}
|
||||
else
|
||||
{
|
||||
maxlen_snprintf(upstream_node_id, "%i", upstream_node);
|
||||
}
|
||||
|
||||
if (slot_name != NULL && slot_name[0])
|
||||
{
|
||||
maxlen_snprintf(slot_name_buf, "'%s'", slot_name);
|
||||
}
|
||||
else
|
||||
{
|
||||
maxlen_snprintf(slot_name_buf, "%s", "NULL");
|
||||
}
|
||||
|
||||
/* XXX convert to placeholder query */
|
||||
sqlquery_snprintf(sqlquery,
|
||||
"UPDATE %s.repl_nodes SET "
|
||||
" type = '%s', "
|
||||
" upstream_node_id = %s, "
|
||||
" cluster = '%s', "
|
||||
" name = '%s', "
|
||||
" conninfo = '%s', "
|
||||
" slot_name = %s, "
|
||||
" priority = %i, "
|
||||
" active = %s "
|
||||
" WHERE id = %i ",
|
||||
get_repmgr_schema_quoted(conn),
|
||||
type,
|
||||
upstream_node_id,
|
||||
cluster_name,
|
||||
node_name,
|
||||
conninfo,
|
||||
slot_name_buf,
|
||||
priority,
|
||||
active == true ? "TRUE" : "FALSE",
|
||||
node);
|
||||
|
||||
log_verbose(LOG_DEBUG, "update_node_record(): %s\n", sqlquery);
|
||||
|
||||
if (action != NULL)
|
||||
{
|
||||
log_verbose(LOG_DEBUG, "update_node_record(): action is \"%s\"\n", action);
|
||||
}
|
||||
|
||||
res = PQexec(conn, sqlquery);
|
||||
if (!res || PQresultStatus(res) != PGRES_COMMAND_OK)
|
||||
{
|
||||
log_err(_("Unable to update node record\n%s\n"),
|
||||
PQerrorMessage(conn));
|
||||
PQclear(res);
|
||||
return false;
|
||||
}
|
||||
|
||||
PQclear(res);
|
||||
|
||||
return true;
|
||||
}
|
||||
|
||||
/*
|
||||
* Update node record following change of status
|
||||
* (e.g. inactive primary converted to standby)
|
||||
@@ -1789,7 +1943,16 @@ _get_node_record(PGconn *conn, char *cluster, char *sqlquery, t_node_info *node_
|
||||
|
||||
node_info->node_id = atoi(PQgetvalue(res, 0, 0));
|
||||
node_info->type = parse_node_type(PQgetvalue(res, 0, 1));
|
||||
node_info->upstream_node_id = atoi(PQgetvalue(res, 0, 2));
|
||||
|
||||
if (PQgetisnull(res, 0, 2))
|
||||
{
|
||||
node_info->upstream_node_id = NO_UPSTREAM_NODE;
|
||||
}
|
||||
else
|
||||
{
|
||||
node_info->upstream_node_id = atoi(PQgetvalue(res, 0, 2));
|
||||
}
|
||||
|
||||
strncpy(node_info->name, PQgetvalue(res, 0, 3), MAXLEN);
|
||||
strncpy(node_info->conninfo_str, PQgetvalue(res, 0, 4), MAXLEN);
|
||||
strncpy(node_info->slot_name, PQgetvalue(res, 0, 5), MAXLEN);
|
||||
|
||||
@@ -1,7 +1,7 @@
|
||||
/*
|
||||
* dbutils.h
|
||||
*
|
||||
* Copyright (c) 2ndQuadrant, 2010-2016
|
||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||
*
|
||||
* This program is free software: you can redistribute it and/or modify
|
||||
* it under the terms of the GNU General Public License as published by
|
||||
@@ -124,12 +124,14 @@ int get_slot_record(PGconn *conn, char *slot_name, t_replication_slot *record)
|
||||
bool drop_replication_slot(PGconn *conn, char *slot_name);
|
||||
bool start_backup(PGconn *conn, char *first_wal_segment, bool fast_checkpoint);
|
||||
bool stop_backup(PGconn *conn, char *last_wal_segment);
|
||||
bool set_config(PGconn *conn, const char *config_param, const char *config_value);
|
||||
bool set_config_bool(PGconn *conn, const char *config_param, bool state);
|
||||
bool witness_copy_node_records(PGconn *masterconn, PGconn *witnessconn, char *cluster_name);
|
||||
bool create_node_record(PGconn *conn, char *action, int node, char *type, int upstream_node, char *cluster_name, char *node_name, char *conninfo, int priority, char *slot_name, bool active);
|
||||
bool delete_node_record(PGconn *conn, int node, char *action);
|
||||
int get_node_record(PGconn *conn, char *cluster, int node_id, t_node_info *node_info);
|
||||
int get_node_record_by_name(PGconn *conn, char *cluster, const char *node_name, t_node_info *node_info);
|
||||
bool update_node_record(PGconn *conn, char *action, int node, char *type, int upstream_node, char *cluster_name, char *node_name, char *conninfo, int priority, char *slot_name, bool active);
|
||||
bool update_node_record_status(PGconn *conn, char *cluster_name, int this_node_id, char *type, int upstream_node_id, bool active);
|
||||
bool update_node_record_set_upstream(PGconn *conn, char *cluster_name, int this_node_id, int new_upstream_node_id);
|
||||
bool create_event_record(PGconn *conn, t_configuration_options *options, int node_id, char *event, bool successful, char *details);
|
||||
|
||||
2
dirmod.c
2
dirmod.c
@@ -3,7 +3,7 @@
|
||||
* dirmod.c
|
||||
* directory handling functions
|
||||
*
|
||||
* Copyright (C) 2ndQuadrant, 2010-2016
|
||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||
*
|
||||
* Portions Copyright (c) 1996-2013, PostgreSQL Global Development Group
|
||||
* Portions Copyright (c) 1994, Regents of the University of California
|
||||
|
||||
2
dirmod.h
2
dirmod.h
@@ -1,6 +1,6 @@
|
||||
/*
|
||||
* dirmod.h
|
||||
* Copyright (c) 2ndQuadrant, 2010-2016
|
||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||
*
|
||||
* This program is free software: you can redistribute it and/or modify
|
||||
* it under the terms of the GNU General Public License as published by
|
||||
|
||||
75
docs/repmgrd-failover-mechanism.md
Normal file
75
docs/repmgrd-failover-mechanism.md
Normal file
@@ -0,0 +1,75 @@
|
||||
repmgrd's failover algorithm
|
||||
============================
|
||||
|
||||
When implementing automatic failover, there are two factors which are critical in
|
||||
ensuring the desired result is achieved:
|
||||
|
||||
- has the master node genuinely failed?
|
||||
- which is the best node to promote to the new master?
|
||||
|
||||
This document outlines repmgrd's decision-making process during automatic failover
|
||||
for standbys directly connected to the master node.
|
||||
|
||||
|
||||
Master node failure detection
|
||||
-----------------------------
|
||||
|
||||
If a `repmgrd` instance running on a PostgreSQL standby node is unable to connect to
|
||||
the master node, this doesn't necessarily mean that the master is down and a
|
||||
failover is required. Factors such as network connectivity issues could mean that
|
||||
even though the standby node is isolated, the replication cluster as a whole
|
||||
is functioning correctly, and promoting the standby without further verification
|
||||
could result in a "split-brain" situation.
|
||||
|
||||
In the event that `repmgrd` is unable to connect to the master node, it will attempt
|
||||
to reconnect to the master server several times (as defined by the `reconnect_attempts`
|
||||
parameter in `repmgr.conf`), with reconnection attempts occurring at the interval
|
||||
specified by `reconnect_interval`. This happens to verify that the master is definitively
|
||||
not accessible (e.g. that connection was not lost due to a brief network glitch).
|
||||
|
||||
Appropriate values for these settings will depend very much on the replication
|
||||
cluster environment. There will necessarily be a trade-off between the time it
|
||||
takes to assume the master is not reachable, and the reliability of that conclusion.
|
||||
A standby in a different physical location to the master will probably need a longer
|
||||
check interval to rule out possible network issues, whereas one located in the same
|
||||
rack with a direct connection between servers could perform the check very quickly.
|
||||
|
||||
Note that it's possible the master comes back online after this point is reached,
|
||||
but before a new master has been selected; in this case it will be noticed
|
||||
during the selection of a new master and no actual failover will take place.
|
||||
|
||||
Promotion candidate selection
|
||||
-----------------------------
|
||||
|
||||
Once `repmgrd` has decided the master is definitively unreachable, the following checks
|
||||
will be carried out:
|
||||
|
||||
* attempts to connect to all other nodes in the cluster (including the witness
|
||||
node, if defined) to establish the state of the cluster, including their
|
||||
current LSN
|
||||
|
||||
* If less than half of the nodes are visible (from the viewpoint
|
||||
of this node), `repmgrd` will not take any further action. This is to ensure that
|
||||
e.g. if a replication cluster is spread over multiple data centres, a split-brain
|
||||
situation does not occur if there is a network failure between data centres. Note
|
||||
that if nodes are split evenly between data centres, a witness server can be
|
||||
used to establish the "majority" data centre.
|
||||
|
||||
* `repmgrd` polls all visible servers and waits for each node to return a valid LSN;
|
||||
it updates the LSN previously stored for this node if it has increased since
|
||||
the initial check
|
||||
|
||||
* once all LSNs have been retrieved, `repmgrd` will check for the highest LSN; if
|
||||
its own node has the highest LSN, it will attempt to promote itself (using the
|
||||
command defined in `promote_command` in `repmgr.conf`). Note that if using
|
||||
`repmgr standby promote` as the promotion command, and the original master becomes available
|
||||
before the promotion takes effect, `repmgr` will return an error and no promotion
|
||||
will take place, and `repmgrd` will resume monitoring as usual.
|
||||
|
||||
* if the node is not the promotion candidate, `repmgrd` will execute the
|
||||
`follow_command` defined in `repmgr.conf`. If using `repmgr standby follow` here,
|
||||
`repmgr` will attempt to detect the new master node and attach to that.
|
||||
|
||||
|
||||
|
||||
|
||||
152
docs/repmgrd-node-fencing.md
Normal file
152
docs/repmgrd-node-fencing.md
Normal file
@@ -0,0 +1,152 @@
|
||||
Fencing a failed master node with repmgrd and pgbouncer
|
||||
=======================================================
|
||||
|
||||
With automatic failover, it's essential to ensure that a failed master
|
||||
remains inaccessible to your application, even if it comes back online
|
||||
again, to avoid a split-brain situation.
|
||||
|
||||
By using `pgbouncer` together with `repmgrd`, it's possible to combine
|
||||
automatic failover with a process to isolate the failed master from
|
||||
your application and ensure that all connections which should go to
|
||||
the master are directed there smoothly without having to reconfigure
|
||||
your application. (Note that as a connection pooler, `pgbouncer` can
|
||||
benefit your application in other ways, but those are beyond the scope
|
||||
of this document).
|
||||
|
||||
* * *
|
||||
|
||||
> *WARNING*: automatic failover is tricky to get right. This document
|
||||
> demonstrates one possible implementation method, however you should
|
||||
> carefully configure and test any setup to suit the needs of your own
|
||||
> replication cluster/application.
|
||||
|
||||
* * *
|
||||
|
||||
In a failover situation, `repmgrd` promotes a standby to master by executing
|
||||
the command defined in `promote_command`. Normally this would be something like:
|
||||
|
||||
repmgr standby promote -f /etc/repmgr.conf
|
||||
|
||||
By wrapping this in a custom script which adjusts the `pgbouncer` configuration
|
||||
on all nodes, it's possible to fence the failed master and redirect write
|
||||
connections to the new master.
|
||||
|
||||
The script consists of three sections:
|
||||
|
||||
* commands to pause `pgbouncer` on all nodes
|
||||
* the promotion command itself
|
||||
* commands to reconfigure and restart `pgbouncer` on all nodes
|
||||
|
||||
Note that it requires password-less SSH access between all nodes to be able to
|
||||
update the `pgbouncer` configuration files.
|
||||
|
||||
For the purposes of this demonstration, we'll assume there are 3 nodes (master
|
||||
and two standbys), with `pgbouncer` listening on port 6432 handling connections
|
||||
to a database called `appdb`. The `postgres` system user must have write
|
||||
access to the `pgbouncer` configuration files on all nodes. We'll assume
|
||||
there's a main `pgbouncer` configuration file, `/etc/pgbouncer.ini`, which uses
|
||||
the `%include` directive (available from PgBouncer 1.6) to include a separate
|
||||
configuration file, `/etc/pgbouncer.database.ini`, which will be modified by
|
||||
`repmgr`.
|
||||
|
||||
`/etc/pgbouncer.ini` should look something like this:
|
||||
|
||||
[pgbouncer]
|
||||
|
||||
logfile = /var/log/pgbouncer/pgbouncer.log
|
||||
pidfile = /var/run/pgbouncer/pgbouncer.pid
|
||||
|
||||
listen_addr = *
|
||||
listen_port = 6432
|
||||
unix_socket_dir = /tmp
|
||||
|
||||
auth_type = trust
|
||||
auth_file = /etc/pgbouncer.auth
|
||||
|
||||
admin_users = postgres
|
||||
stats_users = postgres
|
||||
|
||||
pool_mode = transaction
|
||||
|
||||
max_client_conn = 100
|
||||
default_pool_size = 20
|
||||
min_pool_size = 5
|
||||
reserve_pool_size = 5
|
||||
reserve_pool_timeout = 3
|
||||
|
||||
log_connections = 1
|
||||
log_disconnections = 1
|
||||
log_pooler_errors = 1
|
||||
|
||||
%include /etc/pgbouncer.database.ini
|
||||
|
||||
The actual script is as follows; adjust the configurable items as appropriate:
|
||||
|
||||
`/var/lib/postgres/repmgr/promote.sh`
|
||||
|
||||
|
||||
#!/usr/bin/env bash
|
||||
set -u
|
||||
set -e
|
||||
|
||||
# Configurable items
|
||||
PGBOUNCER_HOSTS="node1 node2 node3"
|
||||
PGBOUNCER_DATABASE_INI="/etc/pgbouncer.database.ini"
|
||||
PGBOUNCER_DATABASE="appdb"
|
||||
PGBOUNCER_PORT=6432
|
||||
|
||||
REPMGR_DB="repmgr"
|
||||
REPMGR_USER="repmgr"
|
||||
REPMGR_SCHEMA="repmgr_test"
|
||||
|
||||
# 1. Pause running pgbouncer instances
|
||||
for HOST in $PGBOUNCER_HOSTS
|
||||
do
|
||||
psql -t -c "pause" -h $HOST -p $PGBOUNCER_PORT -U postgres pgbouncer
|
||||
done
|
||||
|
||||
# 2. Promote this node from standby to master
|
||||
|
||||
repmgr standby promote -f /etc/repmgr.conf
|
||||
|
||||
# 3. Reconfigure pgbouncer instances
|
||||
|
||||
PGBOUNCER_DATABASE_INI_NEW="/tmp/pgbouncer.database.ini"
|
||||
|
||||
for HOST in $PGBOUNCER_HOSTS
|
||||
do
|
||||
# Recreate the pgbouncer config file
|
||||
echo -e "[databases]\n" > $PGBOUNCER_DATABASE_INI_NEW
|
||||
|
||||
psql -d $REPMGR_DB -U $REPMGR_USER -t -A \
|
||||
-c "SELECT '${PGBOUNCER_DATABASE}-rw= ' || conninfo || ' application_name=pgbouncer_${HOST}' \
|
||||
FROM ${REPMGR_SCHEMA}.repl_nodes \
|
||||
WHERE active = TRUE AND type='master'" >> $PGBOUNCER_DATABASE_INI_NEW
|
||||
|
||||
psql -d $REPMGR_DB -U $REPMGR_USER -t -A \
|
||||
-c "SELECT '${PGBOUNCER_DATABASE}-ro= ' || conninfo || ' application_name=pgbouncer_${HOST}' \
|
||||
FROM $REPMGR_SCHEMA.repl_nodes \
|
||||
WHERE node_name='${HOST}'" >> $PGBOUNCER_DATABASE_INI_NEW
|
||||
|
||||
rsync $PGBOUNCER_DATABASE_INI_NEW $HOST:$PGBOUNCER_DATABASE_INI
|
||||
|
||||
psql -tc "reload" -h $HOST -p $PGBOUNCER_PORT -U postgres pgbouncer
|
||||
psql -tc "resume" -h $HOST -p $PGBOUNCER_PORT -U postgres pgbouncer
|
||||
|
||||
done
|
||||
|
||||
# Clean up generated file
|
||||
rm $PGBOUNCER_DATABASE_INI_NEW
|
||||
|
||||
echo "Reconfiguration of pgbouncer complete"
|
||||
|
||||
Script and template file should be installed on each node where
|
||||
`repmgrd` is running.
|
||||
|
||||
Finally, set `promote_command` in `repmgr.conf` on each node to
|
||||
point to the custom promote script:
|
||||
|
||||
promote_command=/var/lib/postgres/repmgr/promote.sh
|
||||
|
||||
and reload/restart any running `repmgrd` instances for the changes to take
|
||||
effect.
|
||||
@@ -1,6 +1,6 @@
|
||||
/*
|
||||
* errcode.h
|
||||
* Copyright (C) 2ndQuadrant, 2010-2016
|
||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||
*
|
||||
* This program is free software: you can redistribute it and/or modify
|
||||
* it under the terms of the GNU General Public License as published by
|
||||
|
||||
44
log.c
44
log.c
@@ -1,6 +1,6 @@
|
||||
/*
|
||||
* log.c - Logging methods
|
||||
* Copyright (C) 2ndQuadrant, 2010-2016
|
||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||
*
|
||||
* This module is a set of methods for logging (currently only syslog)
|
||||
*
|
||||
@@ -48,6 +48,11 @@ int log_level = LOG_NOTICE;
|
||||
int last_log_level = LOG_NOTICE;
|
||||
int verbose_logging = false;
|
||||
int terse_logging = false;
|
||||
/*
|
||||
* Global variable to be set by the main application to ensure any log output
|
||||
* emitted before logger_init is called, is output in the correct format
|
||||
*/
|
||||
int logger_output_mode = OM_DAEMON;
|
||||
|
||||
extern void
|
||||
stderr_log_with_level(const char *level_name, int level, const char *fmt, ...)
|
||||
@@ -62,9 +67,7 @@ stderr_log_with_level(const char *level_name, int level, const char *fmt, ...)
|
||||
static void
|
||||
_stderr_log_with_level(const char *level_name, int level, const char *fmt, va_list ap)
|
||||
{
|
||||
time_t t;
|
||||
struct tm *tm;
|
||||
char buff[100];
|
||||
char buf[100];
|
||||
|
||||
/*
|
||||
* Store the requested level so that if there's a subsequent
|
||||
@@ -74,10 +77,21 @@ _stderr_log_with_level(const char *level_name, int level, const char *fmt, va_li
|
||||
|
||||
if (log_level >= level)
|
||||
{
|
||||
time(&t);
|
||||
tm = localtime(&t);
|
||||
strftime(buff, 100, "[%Y-%m-%d %H:%M:%S]", tm);
|
||||
fprintf(stderr, "%s [%s] ", buff, level_name);
|
||||
|
||||
/* Format log line prefix with timestamp if in daemon mode */
|
||||
if (logger_output_mode == OM_DAEMON)
|
||||
{
|
||||
time_t t;
|
||||
struct tm *tm;
|
||||
time(&t);
|
||||
tm = localtime(&t);
|
||||
strftime(buf, 100, "[%Y-%m-%d %H:%M:%S]", tm);
|
||||
fprintf(stderr, "%s [%s] ", buf, level_name);
|
||||
}
|
||||
else
|
||||
{
|
||||
fprintf(stderr, "%s: ", level_name);
|
||||
}
|
||||
|
||||
vfprintf(stderr, fmt, ap);
|
||||
|
||||
@@ -176,6 +190,13 @@ logger_init(t_configuration_options *opts, const char *ident)
|
||||
stderr_log_warning(_("Invalid log level \"%s\" (available values: DEBUG, INFO, NOTICE, WARNING, ERR, ALERT, CRIT or EMERG)\n"), level);
|
||||
}
|
||||
|
||||
/*
|
||||
* STDERR only logging requested - finish here without setting up any further
|
||||
* logging facility.
|
||||
*/
|
||||
if (logger_output_mode == OM_COMMAND_LINE)
|
||||
return true;
|
||||
|
||||
if (facility && *facility)
|
||||
{
|
||||
|
||||
@@ -236,9 +257,10 @@ logger_init(t_configuration_options *opts, const char *ident)
|
||||
stderr_log_notice(_("Redirecting logging output to '%s'\n"), opts->logfile);
|
||||
fd = freopen(opts->logfile, "a", stderr);
|
||||
|
||||
/* It's possible freopen() may still fail due to e.g. a race condition;
|
||||
as it's not feasible to restore stderr after a failed freopen(),
|
||||
we'll write to stdout as a last resort.
|
||||
/*
|
||||
* It's possible freopen() may still fail due to e.g. a race condition;
|
||||
* as it's not feasible to restore stderr after a failed freopen(),
|
||||
* we'll write to stdout as a last resort.
|
||||
*/
|
||||
if (fd == NULL)
|
||||
{
|
||||
|
||||
6
log.h
6
log.h
@@ -1,6 +1,6 @@
|
||||
/*
|
||||
* log.h
|
||||
* Copyright (c) 2ndQuadrant, 2010-2016
|
||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||
*
|
||||
* This program is free software: you can redistribute it and/or modify
|
||||
* it under the terms of the GNU General Public License as published by
|
||||
@@ -25,6 +25,9 @@
|
||||
#define REPMGR_SYSLOG 1
|
||||
#define REPMGR_STDERR 2
|
||||
|
||||
#define OM_COMMAND_LINE 1
|
||||
#define OM_DAEMON 2
|
||||
|
||||
extern void
|
||||
stderr_log_with_level(const char *level_name, int level, const char *fmt,...)
|
||||
__attribute__((format(PG_PRINTF_ATTRIBUTE, 3, 4)));
|
||||
@@ -132,5 +135,6 @@ extern int log_type;
|
||||
extern int log_level;
|
||||
extern int verbose_logging;
|
||||
extern int terse_logging;
|
||||
extern int logger_output_mode;
|
||||
|
||||
#endif /* _REPMGR_LOG_H_ */
|
||||
|
||||
@@ -66,6 +66,12 @@
|
||||
# (default: NOTICE)
|
||||
#loglevel=NOTICE
|
||||
|
||||
# Note that logging facility settings will only apply to `repmgrd` by default;
|
||||
# `repmgr` will always write to STDERR unless the switch `--log-to-file` is
|
||||
# supplied, in which case it will log to the same destination as `repmgrd`.
|
||||
# This is mainly intended for those cases when `repmgr` is executed directly
|
||||
# by `repmgrd`.
|
||||
|
||||
# Logging facility: possible values are STDERR or - for Syslog integration - one of LOCAL0, LOCAL1, ..., LOCAL7, USER
|
||||
# (default: STDERR)
|
||||
#logfacility=STDERR
|
||||
@@ -137,8 +143,15 @@
|
||||
# external command arguments. Values shown are examples.
|
||||
|
||||
#pg_ctl_options='-s'
|
||||
#pg_basebackup_options='--xlog-method=s'
|
||||
#pg_basebackup_options='--label=repmgr_backup'
|
||||
|
||||
# This is the host name of the barman server, which is used for connecting via ssh
|
||||
# to the barman server (passwordless ssh keys should be in place)
|
||||
#barman_server='backup_server'
|
||||
# If you are placing the barman.conf file in a non-standard path, or using
|
||||
# a name other than barman.conf, use this parameter to specify the path and
|
||||
# name of the barman configuration file.
|
||||
#barman_config='/path/to/barman.conf'
|
||||
|
||||
# Standby clone settings
|
||||
# ----------------------
|
||||
@@ -160,9 +173,11 @@
|
||||
# These settings are only applied when repmgrd is running. Values shown
|
||||
# are defaults.
|
||||
|
||||
# Number of seconds to wait for a response from the primary server before
|
||||
# deciding it has failed.
|
||||
# monitoring interval in seconds; default is 2
|
||||
#monitor_interval_secs=2
|
||||
|
||||
# Maximum number of seconds to wait for a response from the primary server
|
||||
# before deciding it has failed.
|
||||
#master_response_timeout=60
|
||||
|
||||
# Number of attempts at what interval (in seconds) to try and
|
||||
@@ -187,9 +202,6 @@
|
||||
#promote_command='repmgr standby promote -f /path/to/repmgr.conf'
|
||||
#follow_command='repmgr standby follow -f /path/to/repmgr.conf -W'
|
||||
|
||||
# monitoring interval in seconds; default is 2
|
||||
#monitor_interval_secs=2
|
||||
|
||||
# change wait time for primary; before we bail out and exit when the primary
|
||||
# disappears, we wait 'reconnect_attempts' * 'retry_promote_interval_secs'
|
||||
# seconds; by default this would be half an hour, as 'retry_promote_interval_secs'
|
||||
|
||||
118
repmgr.h
118
repmgr.h
@@ -1,6 +1,6 @@
|
||||
/*
|
||||
* repmgr.h
|
||||
* Copyright (c) 2ndQuadrant, 2010-2016
|
||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||
*
|
||||
* This program is free software: you can redistribute it and/or modify
|
||||
* it under the terms of the GNU General Public License as published by
|
||||
@@ -62,11 +62,16 @@
|
||||
#define OPT_NO_UPSTREAM_CONNECTION 11
|
||||
#define OPT_REGISTER_WAIT 12
|
||||
#define OPT_CLUSTER 13
|
||||
#define OPT_LOG_TO_FILE 14
|
||||
#define OPT_UPSTREAM_CONNINFO 15
|
||||
#define OPT_NO_CONNINFO_PASSWORD 16
|
||||
#define OPT_REPLICATION_USER 17
|
||||
|
||||
/* deprecated command line options */
|
||||
#define OPT_INITDB_NO_PWPROMPT 999
|
||||
#define OPT_IGNORE_EXTERNAL_CONFIG_FILES 998
|
||||
#define OPT_INITDB_NO_PWPROMPT 998
|
||||
#define OPT_IGNORE_EXTERNAL_CONFIG_FILES 999
|
||||
|
||||
/* values for --copy-external-config-files */
|
||||
#define CONFIG_FILE_SAMEPATH 1
|
||||
#define CONFIG_FILE_PGDATA 2
|
||||
|
||||
@@ -74,53 +79,102 @@
|
||||
/* Run time options type */
|
||||
typedef struct
|
||||
{
|
||||
/* general repmgr options */
|
||||
char config_file[MAXPGPATH];
|
||||
bool verbose;
|
||||
bool terse;
|
||||
bool force;
|
||||
char pg_bindir[MAXLEN]; /* overrides setting in repmgr.conf */
|
||||
|
||||
/* logging parameters */
|
||||
char loglevel[MAXLEN]; /* overrides setting in repmgr.conf */
|
||||
bool log_to_file;
|
||||
|
||||
/* connection parameters */
|
||||
char dbname[MAXLEN];
|
||||
char host[MAXLEN];
|
||||
char username[MAXLEN];
|
||||
char dest_dir[MAXPGPATH];
|
||||
char config_file[MAXPGPATH];
|
||||
char remote_user[MAXLEN];
|
||||
char superuser[MAXLEN];
|
||||
char masterport[MAXLEN];
|
||||
bool conninfo_provided;
|
||||
bool connection_param_provided;
|
||||
bool host_param_provided;
|
||||
|
||||
/* standby clone parameters */
|
||||
bool wal_keep_segments_used;
|
||||
char wal_keep_segments[MAXLEN];
|
||||
bool verbose;
|
||||
bool terse;
|
||||
bool force;
|
||||
bool wait_for_master;
|
||||
bool ignore_rsync_warn;
|
||||
bool witness_pwprompt;
|
||||
bool rsync_only;
|
||||
bool fast_checkpoint;
|
||||
bool csv_mode;
|
||||
bool without_barman;
|
||||
bool no_upstream_connection;
|
||||
bool no_conninfo_password;
|
||||
bool copy_external_config_files;
|
||||
int copy_external_config_files_destination;
|
||||
bool wait_register_sync;
|
||||
int wait_register_sync_seconds;
|
||||
char masterport[MAXLEN];
|
||||
/*
|
||||
* configuration file parameters which can be overridden on the
|
||||
* command line
|
||||
*/
|
||||
char loglevel[MAXLEN];
|
||||
|
||||
/* parameter used by STANDBY SWITCHOVER */
|
||||
char remote_config_file[MAXLEN];
|
||||
char pg_rewind[MAXPGPATH];
|
||||
char pg_ctl_mode[MAXLEN];
|
||||
/* parameter used by STANDBY {ARCHIVE_CONFIG | RESTORE_CONFIG} */
|
||||
char config_archive_dir[MAXLEN];
|
||||
/* parameter used by CLUSTER CLEANUP */
|
||||
int keep_history;
|
||||
/* parameter used by {STANDBY|WITNESS} UNREGISTER */
|
||||
int node;
|
||||
|
||||
char pg_bindir[MAXLEN];
|
||||
char upstream_conninfo[MAXLEN];
|
||||
char replication_user[MAXLEN];
|
||||
|
||||
char recovery_min_apply_delay[MAXLEN];
|
||||
|
||||
/* standby register parameters */
|
||||
bool wait_register_sync;
|
||||
int wait_register_sync_seconds;
|
||||
|
||||
/* witness create parameters */
|
||||
bool witness_pwprompt;
|
||||
|
||||
/* standby follow parameters */
|
||||
bool wait_for_master;
|
||||
|
||||
/* cluster {show|matrix|crosscheck} parameters */
|
||||
bool csv_mode;
|
||||
|
||||
/* cluster cleanup parameters */
|
||||
int keep_history;
|
||||
|
||||
/* standby switchover parameters */
|
||||
char remote_config_file[MAXLEN];
|
||||
bool pg_rewind_supplied;
|
||||
char pg_rewind[MAXPGPATH];
|
||||
char pg_ctl_mode[MAXLEN];
|
||||
|
||||
/* standby {archive_config | restore_config} parameters */
|
||||
char config_archive_dir[MAXLEN];
|
||||
|
||||
/* {standby|witness} unregister parameters */
|
||||
int node;
|
||||
|
||||
} t_runtime_options;
|
||||
|
||||
#define T_RUNTIME_OPTIONS_INITIALIZER { "", "", "", "", "", "", "", DEFAULT_WAL_KEEP_SEGMENTS, false, false, false, false, false, false, false, false, false, false, false, false, CONFIG_FILE_SAMEPATH, false, 0, "", "", "", "", "fast", "", 0, UNKNOWN_NODE_ID, "", ""}
|
||||
#define T_RUNTIME_OPTIONS_INITIALIZER { \
|
||||
/* general repmgr options */ \
|
||||
"", false, false, false, "", \
|
||||
/* logging parameters */ \
|
||||
"", false, \
|
||||
/* connection parameters */ \
|
||||
"", "", "", "", "", "", "", \
|
||||
false, false, false, \
|
||||
/* standby clone parameters */ \
|
||||
false, DEFAULT_WAL_KEEP_SEGMENTS, false, false, false, false, false, false, \
|
||||
false, CONFIG_FILE_SAMEPATH, "", "", "", \
|
||||
/* standby register parameters */ \
|
||||
false, 0, \
|
||||
/* witness create parameters */ \
|
||||
false, \
|
||||
/* standby follow parameters */ \
|
||||
false, \
|
||||
/* cluster {show|matrix|crosscheck} parameters */ \
|
||||
false, \
|
||||
/* cluster cleanup parameters */ \
|
||||
0, \
|
||||
/* standby switchover parameters */ \
|
||||
"", false, "", "fast", \
|
||||
/* standby {archive_config | restore_config} parameters */ \
|
||||
"", \
|
||||
/* {standby|witness} unregister parameters */ \
|
||||
UNKNOWN_NODE_ID }
|
||||
|
||||
struct BackupLabel
|
||||
{
|
||||
|
||||
@@ -1,7 +1,7 @@
|
||||
/*
|
||||
* repmgr.sql
|
||||
*
|
||||
* Copyright (C) 2ndQuadrant, 2010-2016
|
||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||
*
|
||||
*/
|
||||
|
||||
|
||||
75
repmgrd.c
75
repmgrd.c
@@ -1,7 +1,7 @@
|
||||
/*
|
||||
* repmgrd.c - Replication manager daemon
|
||||
*
|
||||
* Copyright (C) 2ndQuadrant, 2010-2016
|
||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||
*
|
||||
* This module connects to the nodes of a replication cluster and monitors
|
||||
* how far they are from master
|
||||
@@ -207,6 +207,13 @@ main(int argc, char **argv)
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
/*
|
||||
* Tell the logger we're a daemon - this will ensure any output logged
|
||||
* before the logger is initialized will be formatted correctly
|
||||
*/
|
||||
logger_output_mode = OM_DAEMON;
|
||||
|
||||
/*
|
||||
* Parse the configuration file, if provided. If no configuration file
|
||||
* was provided, or one was but was incomplete, parse_config() will
|
||||
@@ -247,6 +254,7 @@ main(int argc, char **argv)
|
||||
}
|
||||
|
||||
logger_init(&local_options, progname());
|
||||
|
||||
if (verbose)
|
||||
logger_set_verbose();
|
||||
|
||||
@@ -647,15 +655,15 @@ witness_monitor(void)
|
||||
}
|
||||
else
|
||||
{
|
||||
log_debug(_("new master found with node ID: %i\n"), master_options.node);
|
||||
log_info(_("new master found with node ID: %i\n"), master_options.node);
|
||||
connection_ok = true;
|
||||
|
||||
/*
|
||||
* Update the repl_nodes table from the new master to reflect the changed
|
||||
* node configuration
|
||||
*
|
||||
* XXX it would be neat to be able to handle this with e.g. table-based
|
||||
* logical replication
|
||||
* It would be neat to be able to handle this with e.g. table-based
|
||||
* logical replication if available in core
|
||||
*/
|
||||
witness_copy_node_records(master_conn, my_local_conn, local_options.cluster_name);
|
||||
|
||||
@@ -774,7 +782,6 @@ standby_monitor(void)
|
||||
PGconn *upstream_conn;
|
||||
char upstream_conninfo[MAXCONNINFO];
|
||||
int upstream_node_id;
|
||||
t_node_info upstream_node;
|
||||
|
||||
int active_master_id;
|
||||
const char *upstream_node_type = NULL;
|
||||
@@ -956,6 +963,8 @@ standby_monitor(void)
|
||||
* Failover handling is handled differently depending on whether
|
||||
* the failed node is the master or a cascading standby
|
||||
*/
|
||||
t_node_info upstream_node;
|
||||
|
||||
upstream_node = get_node_info(my_local_conn, local_options.cluster_name, upstream_node_id);
|
||||
|
||||
if (upstream_node.type == MASTER)
|
||||
@@ -1013,8 +1022,8 @@ standby_monitor(void)
|
||||
*
|
||||
* We should log a message so the user knows of the situation at hand.
|
||||
*
|
||||
* XXX check if the original master is still active and display a
|
||||
* warning
|
||||
* XXX check if the original master is still active and display a warning
|
||||
* XXX add event notification
|
||||
*/
|
||||
log_err(_("It seems this server was promoted manually (not by repmgr) so you might by in the presence of a split-brain.\n"));
|
||||
log_err(_("Check your cluster and manually fix any anomaly.\n"));
|
||||
@@ -1059,9 +1068,6 @@ standby_monitor(void)
|
||||
* from the upstream node to write monitoring information
|
||||
*/
|
||||
|
||||
/* XXX not used? */
|
||||
upstream_node = get_node_info(my_local_conn, local_options.cluster_name, upstream_node_id);
|
||||
|
||||
sprintf(sqlquery,
|
||||
"SELECT id "
|
||||
" FROM %s.repl_nodes "
|
||||
@@ -1181,10 +1187,22 @@ standby_monitor(void)
|
||||
PQclear(res);
|
||||
|
||||
lsn_master_current_xlog_location = lsn_to_xlogrecptr(last_wal_primary_location, NULL);
|
||||
lsn_last_xlog_replay_location = lsn_to_xlogrecptr(last_xlog_replay_location, NULL);
|
||||
lsn_last_xlog_receive_location = lsn_to_xlogrecptr(last_xlog_receive_location, NULL);
|
||||
lsn_last_xlog_replay_location = lsn_to_xlogrecptr(last_xlog_replay_location, NULL);
|
||||
|
||||
if (lsn_last_xlog_receive_location >= lsn_last_xlog_replay_location)
|
||||
{
|
||||
apply_lag = (long long unsigned int)lsn_last_xlog_receive_location - lsn_last_xlog_replay_location;
|
||||
}
|
||||
else
|
||||
{
|
||||
/* This should never happen, but in case it does set apply lag to zero */
|
||||
log_warning("Standby receive (%s) location appears less than standby replay location (%s)\n",
|
||||
last_xlog_receive_location,
|
||||
last_xlog_replay_location);
|
||||
apply_lag = 0;
|
||||
}
|
||||
|
||||
apply_lag = (long long unsigned int)lsn_last_xlog_receive_location - lsn_last_xlog_replay_location;
|
||||
|
||||
/* Calculate replication lag */
|
||||
if (lsn_master_current_xlog_location >= lsn_last_xlog_receive_location)
|
||||
@@ -1193,7 +1211,7 @@ standby_monitor(void)
|
||||
}
|
||||
else
|
||||
{
|
||||
/* This should never happen, but in case it does set lag to zero */
|
||||
/* This should never happen, but in case it does set replication lag to zero */
|
||||
log_warning("Master xlog (%s) location appears less than standby receive location (%s)\n",
|
||||
last_wal_primary_location,
|
||||
last_xlog_receive_location);
|
||||
@@ -1513,7 +1531,6 @@ do_master_failover(void)
|
||||
*/
|
||||
if (PQstatus(node_conn) != CONNECTION_OK)
|
||||
{
|
||||
/* XXX */
|
||||
log_info(_("At this point, it could be some race conditions "
|
||||
"that are acceptable, assume the node is restarting "
|
||||
"and starting failover procedure\n"));
|
||||
@@ -2086,18 +2103,21 @@ check_connection(PGconn **conn, const char *type, const char *conninfo)
|
||||
/*
|
||||
* set_local_node_status()
|
||||
*
|
||||
* If failure of the local node is detected, attempt to connect
|
||||
* to the current master server (as stored in the global variable
|
||||
* `master_conn`) and update its record to failed.
|
||||
* Attempt to connect to the current master server (as stored in the global
|
||||
* variable `master_conn`) and set the local node's status to the result
|
||||
* of `is_standby(my_local_conn)`. Normally this will be used to mark
|
||||
* a node as failed, but in some circumstances we may be marking it
|
||||
* as recovered.
|
||||
*/
|
||||
|
||||
static bool
|
||||
set_local_node_status(void)
|
||||
{
|
||||
PGresult *res;
|
||||
PGresult *res;
|
||||
char sqlquery[QUERY_STR_LEN];
|
||||
int active_master_node_id = NODE_NOT_FOUND;
|
||||
int active_master_node_id = NODE_NOT_FOUND;
|
||||
char master_conninfo[MAXLEN];
|
||||
bool local_node_status;
|
||||
|
||||
if (!check_connection(&master_conn, "master", NULL))
|
||||
{
|
||||
@@ -2156,24 +2176,29 @@ set_local_node_status(void)
|
||||
|
||||
/*
|
||||
* Attempt to set the active record to the correct value.
|
||||
* First
|
||||
*/
|
||||
|
||||
local_node_status = (is_standby(my_local_conn) == 1);
|
||||
|
||||
if (!update_node_record_status(master_conn,
|
||||
local_options.cluster_name,
|
||||
node_info.node_id,
|
||||
"standby",
|
||||
node_info.upstream_node_id,
|
||||
is_standby(my_local_conn)==1))
|
||||
local_node_status))
|
||||
{
|
||||
log_err(_("unable to set local node %i as inactive on master: %s\n"),
|
||||
log_err(_("unable to set local node %i as %s on master: %s\n"),
|
||||
node_info.node_id,
|
||||
local_node_status == false ? "inactive" : "active",
|
||||
PQerrorMessage(master_conn));
|
||||
|
||||
return false;
|
||||
}
|
||||
|
||||
log_notice(_("marking this node (%i) as inactive on master\n"), node_info.node_id);
|
||||
log_notice(_("marking this node (%i) as %s on master\n"),
|
||||
node_info.node_id,
|
||||
local_node_status == false ? "inactive" : "active");
|
||||
|
||||
return true;
|
||||
}
|
||||
|
||||
@@ -2314,13 +2339,13 @@ lsn_to_xlogrecptr(char *lsn, bool *format_ok)
|
||||
if (format_ok != NULL)
|
||||
*format_ok = true;
|
||||
|
||||
return (((XLogRecPtr) xlogid * 16 * 1024 * 1024 * 255) + xrecoff);
|
||||
return (XLogRecPtr) ((uint64) xlogid) << 32 | (uint64) xrecoff;
|
||||
}
|
||||
|
||||
void
|
||||
usage(void)
|
||||
{
|
||||
log_err(_("%s: Replicator manager daemon \n"), progname());
|
||||
log_err(_("%s: replication management daemon for PostgreSQL\n"), progname());
|
||||
log_err(_("Try \"%s --help\" for more information.\n"), progname());
|
||||
}
|
||||
|
||||
|
||||
@@ -1,7 +1,7 @@
|
||||
#
|
||||
# Makefile
|
||||
#
|
||||
# Copyright (c) 2ndQuadrant, 2010-2016
|
||||
# Copyright (c) 2ndQuadrant, 2010-2017
|
||||
#
|
||||
|
||||
MODULE_big = repmgr_funcs
|
||||
|
||||
@@ -1,6 +1,6 @@
|
||||
/*
|
||||
* repmgr_function.sql
|
||||
* Copyright (c) 2ndQuadrant, 2010-2016
|
||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||
*
|
||||
*/
|
||||
|
||||
|
||||
@@ -1,6 +1,6 @@
|
||||
/*
|
||||
* uninstall_repmgr_funcs.sql
|
||||
* Copyright (c) 2ndQuadrant, 2010-2016
|
||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||
*
|
||||
*/
|
||||
|
||||
|
||||
33
strutil.c
33
strutil.c
@@ -1,7 +1,7 @@
|
||||
/*
|
||||
* strutil.c
|
||||
*
|
||||
* Copyright (C) 2ndQuadrant, 2010-2016
|
||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||
*
|
||||
* This program is free software: you can redistribute it and/or modify
|
||||
* it under the terms of the GNU General Public License as published by
|
||||
@@ -90,31 +90,18 @@ maxlen_snprintf(char *str, const char *format,...)
|
||||
|
||||
|
||||
/*
|
||||
* Adapted from: src/fe_utils/string_utils.c
|
||||
*
|
||||
* Function not publicly available before PostgreSQL 9.6.
|
||||
* Escape a string for use as a parameter in recovery.conf
|
||||
* Caller must free returned value
|
||||
*/
|
||||
void
|
||||
appendShellString(PQExpBuffer buf, const char *str)
|
||||
char *
|
||||
escape_recovery_conf_value(const char *src)
|
||||
{
|
||||
const char *p;
|
||||
char *result = escape_single_quotes_ascii(src);
|
||||
|
||||
appendPQExpBufferChar(buf, '\'');
|
||||
for (p = str; *p; p++)
|
||||
if (!result)
|
||||
{
|
||||
if (*p == '\n' || *p == '\r')
|
||||
{
|
||||
fprintf(stderr,
|
||||
_("shell command argument contains a newline or carriage return: \"%s\"\n"),
|
||||
str);
|
||||
exit(ERR_BAD_CONFIG);
|
||||
}
|
||||
|
||||
if (*p == '\'')
|
||||
appendPQExpBufferStr(buf, "'\"'\"'");
|
||||
else
|
||||
appendPQExpBufferChar(buf, *p);
|
||||
fprintf(stderr, _("%s: out of memory\n"), progname());
|
||||
exit(ERR_INTERNAL);
|
||||
}
|
||||
|
||||
appendPQExpBufferChar(buf, '\'');
|
||||
return result;
|
||||
}
|
||||
|
||||
@@ -1,6 +1,6 @@
|
||||
/*
|
||||
* strutil.h
|
||||
* Copyright (C) 2ndQuadrant, 2010-2016
|
||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||
*
|
||||
*
|
||||
* This program is free software: you can redistribute it and/or modify
|
||||
@@ -49,6 +49,6 @@ extern int
|
||||
maxlen_snprintf(char *str, const char *format,...)
|
||||
__attribute__((format(PG_PRINTF_ATTRIBUTE, 2, 3)));
|
||||
|
||||
extern void
|
||||
appendShellString(PQExpBuffer buf, const char *str);
|
||||
extern char *
|
||||
escape_recovery_conf_value(const char *src);
|
||||
#endif /* _STRUTIL_H_ */
|
||||
|
||||
@@ -1,7 +1,7 @@
|
||||
/*
|
||||
* uninstall_repmgr.sql
|
||||
*
|
||||
* Copyright (C) 2ndQuadrant, 2010-2016
|
||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||
*
|
||||
*/
|
||||
|
||||
|
||||
Reference in New Issue
Block a user