mirror of
https://github.com/EnterpriseDB/repmgr.git
synced 2026-03-23 15:16:29 +00:00
Compare commits
488 Commits
REL4_0_STA
...
v4.2.0
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
0cafeb3828 | ||
|
|
79e79bd5f2 | ||
|
|
a4e21fd8fe | ||
|
|
e826f72312 | ||
|
|
1e8b3313ee | ||
|
|
b5772d88dd | ||
|
|
22614573b9 | ||
|
|
77c9092794 | ||
|
|
15bbe04a6f | ||
|
|
0842560a88 | ||
|
|
8bec4946bc | ||
|
|
3ab22f9442 | ||
|
|
3a9c36a36c | ||
|
|
2ded8987ac | ||
|
|
6311f3f30a | ||
|
|
12ec6c7abc | ||
|
|
b2348c9a70 | ||
|
|
7b26180ebb | ||
|
|
d70a5250ab | ||
|
|
024accfbba | ||
|
|
55c967fd14 | ||
|
|
c1edb896df | ||
|
|
fd66d93937 | ||
|
|
40e94635b2 | ||
|
|
9ad41bfb0f | ||
|
|
35c156ce7e | ||
|
|
85f27ff559 | ||
|
|
ad03885b72 | ||
|
|
3e38759c02 | ||
|
|
15a5d2ee9d | ||
|
|
61c91df332 | ||
|
|
b346914d4d | ||
|
|
ac40ef0e43 | ||
|
|
eebf07549f | ||
|
|
a40fd60cb5 | ||
|
|
bd24848ce9 | ||
|
|
7ab81e10de | ||
|
|
455a0bd93f | ||
|
|
11d25e2aef | ||
|
|
b14fbbdc72 | ||
|
|
2491b8ae52 | ||
|
|
fce3c02760 | ||
|
|
1f8f6f3a39 | ||
|
|
401f903456 | ||
|
|
688337dec3 | ||
|
|
b660cb9fe4 | ||
|
|
5d8d9db21d | ||
|
|
9439467958 | ||
|
|
38e3aae053 | ||
|
|
80bef0eb28 | ||
|
|
bea4b03cc2 | ||
|
|
97905b02ae | ||
|
|
b0a2ee2259 | ||
|
|
bb4fdcda98 | ||
|
|
7b33faa09b | ||
|
|
5de2b1ee13 | ||
|
|
f184b1e68a | ||
|
|
bd2f6db1e1 | ||
|
|
1693ec0e90 | ||
|
|
17e75f6b31 | ||
|
|
3b8586d82a | ||
|
|
6acec3e041 | ||
|
|
1d830bf0e2 | ||
|
|
3f99ee8ede | ||
|
|
b5f640d04d | ||
|
|
92a62a958e | ||
|
|
a4a956593c | ||
|
|
ceeb6d7130 | ||
|
|
9681708b1a | ||
|
|
3573950425 | ||
|
|
c1586e39b7 | ||
|
|
7745844078 | ||
|
|
e1e59e85d7 | ||
|
|
6fc79470fc | ||
|
|
b7d576863d | ||
|
|
c1338df5e3 | ||
|
|
221fb63e92 | ||
|
|
987823861f | ||
|
|
7a6eb6321b | ||
|
|
f4df6696ba | ||
|
|
bc584d84f6 | ||
|
|
76f5bcf3cd | ||
|
|
b1aab930af | ||
|
|
58994365ff | ||
|
|
c3949b2aea | ||
|
|
6ba49de44e | ||
|
|
b61f853a69 | ||
|
|
f2bc898761 | ||
|
|
7bcf87b8ed | ||
|
|
6983547325 | ||
|
|
34c4f4c3f8 | ||
|
|
f8667c1aac | ||
|
|
08ab6290c1 | ||
|
|
97cafd8c54 | ||
|
|
78b969f208 | ||
|
|
3f558416f3 | ||
|
|
410fa5e54d | ||
|
|
44a224ad92 | ||
|
|
33dedf4e96 | ||
|
|
4f4d20c30b | ||
|
|
69cb87322d | ||
|
|
4351836520 | ||
|
|
a87f18682c | ||
|
|
1a630d079e | ||
|
|
d2929f6426 | ||
|
|
f3f002bea5 | ||
|
|
93471b8d68 | ||
|
|
46e0a9a8db | ||
|
|
3620fa79e8 | ||
|
|
c236405251 | ||
|
|
527a5f7fee | ||
|
|
937cffd54c | ||
|
|
2b1e12591a | ||
|
|
7ecfb333b9 | ||
|
|
8f13a66aaa | ||
|
|
ef35d071bf | ||
|
|
b87f9dabb4 | ||
|
|
7decc7975f | ||
|
|
a5cfc244bc | ||
|
|
673bde2b7f | ||
|
|
81de200561 | ||
|
|
cb46fb6410 | ||
|
|
bd58e4128c | ||
|
|
63242e2277 | ||
|
|
69782cf703 | ||
|
|
5acb3e6790 | ||
|
|
6dfcaa357e | ||
|
|
8acc50e752 | ||
|
|
56919ea499 | ||
|
|
b3f64987cb | ||
|
|
388ac2f392 | ||
|
|
8b059bc9b0 | ||
|
|
cfa7155784 | ||
|
|
47644b55ed | ||
|
|
17f30ec364 | ||
|
|
c6b8d78bad | ||
|
|
ae60caacdd | ||
|
|
92d0e6809b | ||
|
|
4c7c681a14 | ||
|
|
29de052dd8 | ||
|
|
ebf2a3a7cc | ||
|
|
37311e15a3 | ||
|
|
a194cf56b3 | ||
|
|
c4f9205f17 | ||
|
|
6d09ebcfb5 | ||
|
|
319a29583d | ||
|
|
a5d47fd478 | ||
|
|
190104c7db | ||
|
|
ff16d3b3bb | ||
|
|
802755fd60 | ||
|
|
d00c0c67d0 | ||
|
|
8d636690bd | ||
|
|
b2081dca52 | ||
|
|
080a29c33b | ||
|
|
dd7a4068d2 | ||
|
|
fcf237fe31 | ||
|
|
4d70a667fb | ||
|
|
c5ba72c2c5 | ||
|
|
0f97a98f28 | ||
|
|
269e3242c8 | ||
|
|
b0ed87832b | ||
|
|
836d2125fe | ||
|
|
bf0d67c60a | ||
|
|
e1d807188d | ||
|
|
108c3a36fb | ||
|
|
8377704596 | ||
|
|
4f642f8332 | ||
|
|
029ba46470 | ||
|
|
098f8eaf2a | ||
|
|
d60bd232f0 | ||
|
|
eca1943026 | ||
|
|
bcab4bc391 | ||
|
|
bb320a64f5 | ||
|
|
3b0cde2846 | ||
|
|
00704913a6 | ||
|
|
efc388065e | ||
|
|
e12fbb7b4d | ||
|
|
0108fb2e72 | ||
|
|
e408351697 | ||
|
|
f904cd2573 | ||
|
|
95fe7ea621 | ||
|
|
a50ac039da | ||
|
|
535fba43d3 | ||
|
|
043a6c5bea | ||
|
|
8da26f1c6c | ||
|
|
7861392450 | ||
|
|
b297e40d77 | ||
|
|
7613b1769c | ||
|
|
b1b49748a7 | ||
|
|
276239422b | ||
|
|
49418e096e | ||
|
|
6c518f1403 | ||
|
|
b365765bc8 | ||
|
|
bd63948937 | ||
|
|
69c1f147ea | ||
|
|
ce8d3cf0b0 | ||
|
|
14134f8e70 | ||
|
|
be8448ddcb | ||
|
|
a2ff1536ad | ||
|
|
9c0c1b663e | ||
|
|
2d43feb34b | ||
|
|
6f315c1b3c | ||
|
|
635bdccb2c | ||
|
|
16048a879e | ||
|
|
eac80ae9c1 | ||
|
|
887b845aa0 | ||
|
|
8320179f34 | ||
|
|
7822aa784f | ||
|
|
4455ded935 | ||
|
|
fd0b850f41 | ||
|
|
d9ac1d6fd0 | ||
|
|
11e4d9fd05 | ||
|
|
4b54106f48 | ||
|
|
f3941ceab0 | ||
|
|
93f80c413e | ||
|
|
09b8a86605 | ||
|
|
6b3d54a5f3 | ||
|
|
85ab2d94b7 | ||
|
|
cda952f1e4 | ||
|
|
99ad57f88a | ||
|
|
ad0671ead2 | ||
|
|
1bbb2ef213 | ||
|
|
62c29aab32 | ||
|
|
b9dc94f28f | ||
|
|
e8ba213174 | ||
|
|
0dcddbb062 | ||
|
|
b4dab86c3b | ||
|
|
644a56a645 | ||
|
|
4876a9fde3 | ||
|
|
ec998bf9c5 | ||
|
|
e36b180de8 | ||
|
|
a2068768ab | ||
|
|
bde9fea48c | ||
|
|
cdaf84c329 | ||
|
|
c4cd0c46da | ||
|
|
3b00dc912a | ||
|
|
1a80de1290 | ||
|
|
26b565dff2 | ||
|
|
96811ccc01 | ||
|
|
73982859f6 | ||
|
|
afb7ca886c | ||
|
|
df11ad894f | ||
|
|
614b4ae84b | ||
|
|
1e1b4b1a65 | ||
|
|
cf64f9e95c | ||
|
|
dfdebd6c08 | ||
|
|
63a11f8926 | ||
|
|
a3f371b8c0 | ||
|
|
938692c169 | ||
|
|
ad24b04c35 | ||
|
|
3ccf1cf182 | ||
|
|
5e4bdb5a1b | ||
|
|
50321bb95d | ||
|
|
253c215c12 | ||
|
|
22c40ae62d | ||
|
|
239a548e9d | ||
|
|
231ef5563e | ||
|
|
e1413fa8ea | ||
|
|
7111483b65 | ||
|
|
1558497ae4 | ||
|
|
9c5e76401f | ||
|
|
a403da67bc | ||
|
|
71b13f5307 | ||
|
|
1c5561d114 | ||
|
|
c0b607ef41 | ||
|
|
462fdca4b4 | ||
|
|
0e55a60660 | ||
|
|
93deab3e96 | ||
|
|
81c69e3677 | ||
|
|
0219f4c91f | ||
|
|
85a4adc99c | ||
|
|
208d7d418e | ||
|
|
7cb6e5af8d | ||
|
|
d2a2df13d5 | ||
|
|
358e001218 | ||
|
|
d7702b3444 | ||
|
|
a8286030c0 | ||
|
|
ff0ba3e19a | ||
|
|
6f5cce7e6f | ||
|
|
509f7a8255 | ||
|
|
e8cdf72ecd | ||
|
|
2a99dfa15b | ||
|
|
bad034f7ee | ||
|
|
cdb504d700 | ||
|
|
0af2077bed | ||
|
|
dea87b7285 | ||
|
|
d6b13f3428 | ||
|
|
5808d8190e | ||
|
|
d2a5cc23cc | ||
|
|
9981ede1af | ||
|
|
40ccae57a3 | ||
|
|
3c2b8e5792 | ||
|
|
354231284e | ||
|
|
dbbfcb6a63 | ||
|
|
bc766a48ed | ||
|
|
55441f2729 | ||
|
|
e38a9ec7e1 | ||
|
|
c1356b9e0d | ||
|
|
383a17fba1 | ||
|
|
29cb153643 | ||
|
|
15625183c1 | ||
|
|
b6a1b75d22 | ||
|
|
c644ddde51 | ||
|
|
ee98a3a58e | ||
|
|
22b3a74fa0 | ||
|
|
98af51da03 | ||
|
|
e5eff3f6d5 | ||
|
|
728a256a93 | ||
|
|
f5f02ae0ee | ||
|
|
64d85587de | ||
|
|
6b7f6089ba | ||
|
|
5719a0dfd3 | ||
|
|
927bf038a0 | ||
|
|
76a93af15c | ||
|
|
ee2df36a76 | ||
|
|
571e6b2783 | ||
|
|
76cc11b786 | ||
|
|
56710f4819 | ||
|
|
f9528efdb8 | ||
|
|
658ec20e37 | ||
|
|
e6aa831782 | ||
|
|
9b56f157dc | ||
|
|
05f872effe | ||
|
|
ae691688be | ||
|
|
57f1e939c5 | ||
|
|
48b5deebf3 | ||
|
|
1868453953 | ||
|
|
dd45189fa8 | ||
|
|
a79c4fae88 | ||
|
|
657ed83921 | ||
|
|
4fb085f52d | ||
|
|
d0bb5b1565 | ||
|
|
ee64f3a745 | ||
|
|
6c81e54f76 | ||
|
|
65bf203a89 | ||
|
|
b4dbee517f | ||
|
|
e23d28a22d | ||
|
|
811d2a45bd | ||
|
|
92f4710ee2 | ||
|
|
044d8a1098 | ||
|
|
b38f45120c | ||
|
|
db3a046393 | ||
|
|
ec068e38a2 | ||
|
|
3a382e826e | ||
|
|
3dcf57a333 | ||
|
|
f658c8d3d8 | ||
|
|
375a96a5c8 | ||
|
|
b4d6724405 | ||
|
|
8fd0c4ad83 | ||
|
|
7ccae6c2b1 | ||
|
|
61d46172b9 | ||
|
|
810471b2f2 | ||
|
|
5bd8cf958a | ||
|
|
5a45997db5 | ||
|
|
f1f5100007 | ||
|
|
1c8ad4d89b | ||
|
|
842a610e84 | ||
|
|
fcb7e7a29b | ||
|
|
26e404b1f3 | ||
|
|
625d032435 | ||
|
|
3d07d65966 | ||
|
|
b705127a34 | ||
|
|
832b38c5cb | ||
|
|
3739a7b84d | ||
|
|
841f03aeba | ||
|
|
cad12b1fb7 | ||
|
|
d31cc80d26 | ||
|
|
625187a61e | ||
|
|
e64d965c6a | ||
|
|
5d8ec136e6 | ||
|
|
9951a8e106 | ||
|
|
26a9e848fd | ||
|
|
ba0b0a497f | ||
|
|
09dc43a61c | ||
|
|
b349f82571 | ||
|
|
adbb627850 | ||
|
|
c47f976bde | ||
|
|
7c8cd7a482 | ||
|
|
edce8addbd | ||
|
|
b0f6202448 | ||
|
|
985b13b6d3 | ||
|
|
69e64a9464 | ||
|
|
f58954b3be | ||
|
|
3761d17752 | ||
|
|
8c121da8a1 | ||
|
|
6e9e4543e8 | ||
|
|
c94f1b7338 | ||
|
|
f78c169c3d | ||
|
|
f2db9f3ea4 | ||
|
|
9944324c3a | ||
|
|
836f32bdbc | ||
|
|
cebbc73c38 | ||
|
|
472d703d2e | ||
|
|
de34e4e89b | ||
|
|
3a8ee126f3 | ||
|
|
da93dd1f57 | ||
|
|
295c18f6ff | ||
|
|
81beec54aa | ||
|
|
2e42226f68 | ||
|
|
de10d7984a | ||
|
|
404aab4041 | ||
|
|
8c422d6084 | ||
|
|
8b78b7292d | ||
|
|
4cebba32e2 | ||
|
|
c9f12cfbe0 | ||
|
|
5b4c92392c | ||
|
|
e2b94adec3 | ||
|
|
3164bfa043 | ||
|
|
08b443dce0 | ||
|
|
9165d27f9f | ||
|
|
b8b991398a | ||
|
|
a9a17f206e | ||
|
|
9d432546bf | ||
|
|
3c557ebd8e | ||
|
|
4efeb52cba | ||
|
|
60422c66f9 | ||
|
|
b63872afbb | ||
|
|
a31980b590 | ||
|
|
e07a3c7976 | ||
|
|
9d9a1be062 | ||
|
|
8208b3f844 | ||
|
|
ecb8297b1f | ||
|
|
1553596f84 | ||
|
|
022d9c58c2 | ||
|
|
a6cc4d80f0 | ||
|
|
7fffe3ed96 | ||
|
|
9b93a595f5 | ||
|
|
c34e08b802 | ||
|
|
eb14bb58c6 | ||
|
|
aa28069d8b | ||
|
|
a1e272f64c | ||
|
|
9908a9c662 | ||
|
|
aa089820ab | ||
|
|
0230bafae1 | ||
|
|
de577adc67 | ||
|
|
fed17d49e3 | ||
|
|
d80763f974 | ||
|
|
331e982bdb | ||
|
|
4ca7e6a6bf | ||
|
|
6ac6e0733a | ||
|
|
79d21b516b | ||
|
|
7232187f4d | ||
|
|
fe98270b3f | ||
|
|
5a3e20fc38 | ||
|
|
4ef2b111da | ||
|
|
97471626b4 | ||
|
|
4bd236b64c | ||
|
|
615dd2ecf4 | ||
|
|
1c1887f9cc | ||
|
|
d3f11a640d | ||
|
|
2341da7a06 | ||
|
|
2c468d64fb | ||
|
|
9d9b74d740 | ||
|
|
a90d4419a6 | ||
|
|
68756c79f3 | ||
|
|
8ad081e7b5 | ||
|
|
6b76704817 | ||
|
|
c03c509e73 | ||
|
|
d9db4f6c45 | ||
|
|
c89d59fe96 | ||
|
|
02b6d3748b | ||
|
|
7c3abe28b9 | ||
|
|
a39b8ccc2d | ||
|
|
5638d4ab89 | ||
|
|
37bdad290c | ||
|
|
8911434da5 | ||
|
|
8a2bbcebfd | ||
|
|
61f01f8305 | ||
|
|
a35d77b7f0 | ||
|
|
40ea1abbb4 | ||
|
|
785bfe9837 | ||
|
|
31cd54bcff | ||
|
|
35c8bb4e75 | ||
|
|
6b9ac22029 | ||
|
|
7bf3c78f57 | ||
|
|
34ee16899e | ||
|
|
0938685ae7 | ||
|
|
b400436fba | ||
|
|
2745c92fc8 | ||
|
|
34c0131b2d | ||
|
|
c9abfdcc04 | ||
|
|
a878d7aaea | ||
|
|
93aa7cea1a | ||
|
|
f00e6296e9 | ||
|
|
91354a71cc | ||
|
|
c78cb6e1d6 | ||
|
|
71430a9f65 | ||
|
|
3e93f847fd |
2
.gitignore
vendored
2
.gitignore
vendored
@@ -39,6 +39,8 @@ lib*.pc
|
|||||||
|
|
||||||
# test output
|
# test output
|
||||||
/results/
|
/results/
|
||||||
|
/regression.diffs
|
||||||
|
/regression.out
|
||||||
|
|
||||||
/doc/Makefile
|
/doc/Makefile
|
||||||
|
|
||||||
|
|||||||
@@ -2,7 +2,7 @@ License and Contributions
|
|||||||
=========================
|
=========================
|
||||||
|
|
||||||
`repmgr` is licensed under the GPL v3. All of its code and documentation is
|
`repmgr` is licensed under the GPL v3. All of its code and documentation is
|
||||||
Copyright 2010-2017, 2ndQuadrant Limited. See the files COPYRIGHT and LICENSE for
|
Copyright 2010-2018, 2ndQuadrant Limited. See the files COPYRIGHT and LICENSE for
|
||||||
details.
|
details.
|
||||||
|
|
||||||
The development of repmgr has primarily been sponsored by 2ndQuadrant customers.
|
The development of repmgr has primarily been sponsored by 2ndQuadrant customers.
|
||||||
|
|||||||
@@ -1,4 +1,4 @@
|
|||||||
Copyright (c) 2010-2017, 2ndQuadrant Limited
|
Copyright (c) 2010-2018, 2ndQuadrant Limited
|
||||||
All rights reserved.
|
All rights reserved.
|
||||||
|
|
||||||
This program is free software: you can redistribute it and/or modify
|
This program is free software: you can redistribute it and/or modify
|
||||||
@@ -12,5 +12,5 @@ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|||||||
GNU General Public License for more details.
|
GNU General Public License for more details.
|
||||||
|
|
||||||
You should have received a copy of the GNU General Public License
|
You should have received a copy of the GNU General Public License
|
||||||
along with this program. If not, see http://www.gnu.org/licenses/
|
along with this program. If not, see https://www.gnu.org/licenses/
|
||||||
to obtain one.
|
to obtain one.
|
||||||
|
|||||||
8
FAQ.md
Normal file
8
FAQ.md
Normal file
@@ -0,0 +1,8 @@
|
|||||||
|
FAQ - Frequently Asked Questions about repmgr
|
||||||
|
=============================================
|
||||||
|
|
||||||
|
The repmgr 4 FAQ is located here: [repmgr FAQ (Frequently Asked Questions)](https://repmgr.org/docs/4.0/appendix-faq.html "repmgr FAQ")
|
||||||
|
|
||||||
|
The repmgr 3.x FAQ can be found here:
|
||||||
|
|
||||||
|
https://github.com/2ndQuadrant/repmgr/blob/REL3_3_STABLE/FAQ.md
|
||||||
171
HISTORY
171
HISTORY
@@ -1,6 +1,171 @@
|
|||||||
4.0 2017-10-04
|
4.2.0 2018-??-??
|
||||||
Complete rewrite with many changes; see file "doc/upgrading-from-repmgr3.md"
|
repmgr: add parameter "shutdown_check_timeout" for use by "standby switchover";
|
||||||
for details.
|
GitHub #504 (Ian)
|
||||||
|
repmgr: add "--node-id" option to "repmgr cluster cleanup"; GitHub #493 (Ian)
|
||||||
|
repmgr: report unreachable nodes when running "repmgr cluster (matrix|crosscheck);
|
||||||
|
GitHub #246 (Ian)
|
||||||
|
repmgr: add configuration file parameter "repmgr_bindir"; GitHub #246 (Ian)
|
||||||
|
repmgr: fix "Missing replication slots" label in "node check"; GitHub #507 (Ian)
|
||||||
|
repmgrd: fix parsing of -d/--daemonize option (Ian)
|
||||||
|
repmgrd: support "pausing" of repmgrd (Ian)
|
||||||
|
|
||||||
|
4.1.1 2018-09-05
|
||||||
|
logging: explicitly log the text of failed queries as ERRORs to
|
||||||
|
assist logfile analysis; GitHub #498
|
||||||
|
repmgr: truncate version string, if necessary; GitHub #490 (Ian)
|
||||||
|
repmgr: improve messages emitted during "standby promote" (Ian)
|
||||||
|
repmgr: "standby clone" - don't copy external config files in --dry-run
|
||||||
|
mode; GitHub #491 (Ian)
|
||||||
|
repmgr: add "cluster_cleanup" event; GitHub #492 (Ian)
|
||||||
|
repmgr: (standby switchover) improve detection of free walsenders;
|
||||||
|
GitHub #495 (Ian)
|
||||||
|
repmgr: (node rejoin) improve replication slot handling; GitHub #499 (Ian)
|
||||||
|
repmgrd: ensure that sending SIGHUP always results in the log file
|
||||||
|
being reopened; GitHub #485 (Ian)
|
||||||
|
repmgrd: report version number *after* logger initialisation; GitHub #487 (Ian)
|
||||||
|
repmgrd: fix startup on witness node when local data is stale; GitHub #488/#489 (Ian)
|
||||||
|
repmgrd: improve cascaded standby failover handling; GitHub #480 (Ian)
|
||||||
|
repmgrd: improve reconnection handling (Ian)
|
||||||
|
|
||||||
|
4.1.0 2018-07-31
|
||||||
|
repmgr: change default log_level to INFO, add documentation; GitHub #470 (Ian)
|
||||||
|
repmgr: add "--missing-slots" check to "repmgr node check" (Ian)
|
||||||
|
repmgr: improve command line error handling; GitHub #464 (Ian)
|
||||||
|
repmgr: fix "standby register --wait-sync" when no timeout provided (Ian)
|
||||||
|
repmgr: "cluster show" returns non-zero value if an issue encountered;
|
||||||
|
GitHub #456 (Ian)
|
||||||
|
repmgr: "node check" and "node status" returns non-zero value if an issue
|
||||||
|
encountered (Ian)
|
||||||
|
repmgr: add CSV output mode to "cluster event"; GitHub #471 (Ian)
|
||||||
|
repmgr: add -q/--quiet option to suppress non-error output; GitHub #468 (Ian)
|
||||||
|
repmgr: "node status" returns non-zero value if an issue encountered (Ian)
|
||||||
|
repmgr: enable "recovery_min_apply_delay" to be 0; GitHub #448 (Ian)
|
||||||
|
repmgr: "cluster cleanup" - add missing help options; GitHub #461/#462 (gclough)
|
||||||
|
repmgr: ensure witness node follows new primary after switchover;
|
||||||
|
GitHub #453 (Ian)
|
||||||
|
repmgr: fix witness node handling in "node check"/"node status";
|
||||||
|
GitHub #451 (Ian)
|
||||||
|
repmgr: fix "primary_slot_name" when using "standby clone" with --recovery-conf-only;
|
||||||
|
GitHub #474 (Ian)
|
||||||
|
repmgr: don't perform a switchover if an exclusive backup is running;
|
||||||
|
GitHub #476 (Martín)
|
||||||
|
repmgr: enable "witness unregister" to be run on any node; GitHub #472 (Ian)
|
||||||
|
repmgrd: create a PID file by default; GitHub #457 (Ian)
|
||||||
|
repmgrd: daemonize process by default; GitHub #458 (Ian)
|
||||||
|
|
||||||
|
4.0.6 2018-06-14
|
||||||
|
repmgr: (witness register) prevent registration of a witness server with the
|
||||||
|
same name as an existing node (Ian)
|
||||||
|
repmgr: (standby follow) check node has actually connected to new primary
|
||||||
|
before reporting success; GitHub #444 (Ian)
|
||||||
|
repmgr: (standby clone) improve handling of external configuration file copying,
|
||||||
|
including consideration in --dry-run check; GitHub #443 (Ian)
|
||||||
|
repmgr: (standby clone) don't require presence of "user" parameter in
|
||||||
|
conninfo string; GitHub #437 (Ian)
|
||||||
|
repmgr: (standby clone) improve documentation of --recovery-conf-only
|
||||||
|
mode; GitHub #438 (Ian)
|
||||||
|
repmgr: (node rejoin) fix bug when parsing --config-files parameter;
|
||||||
|
GitHub #442 (Ian)
|
||||||
|
repmgr: when using --dry-run, force log level to INFO to ensure output
|
||||||
|
will always be displayed; GitHub #441 (Ian)
|
||||||
|
repmgr: (cluster matrix/crosscheck) return non-zero exit code if node
|
||||||
|
connection issues detected; GitHub #447 (Ian)
|
||||||
|
repmgrd: ensure local node is counted as quorum member; GitHub #439 (Ian)
|
||||||
|
|
||||||
|
4.0.5 2018-05-02
|
||||||
|
repmgr: poll demoted primary after restart as a standby during a
|
||||||
|
switchover operation; GitHub #408 (Ian)
|
||||||
|
repmgr: add configuration parameter "config_directory"; GitHub #424 (Ian)
|
||||||
|
repmgr: add "dbname=replication" to all replication connection strings;
|
||||||
|
GitHub #421 (Ian)
|
||||||
|
repmgr: add sanity check if --upstream-node-id not supplied when executing
|
||||||
|
"standby register"; GitHub #395 (Ian)
|
||||||
|
repmgr: enable provision of "archive_cleanup_command" in recovery.conf;
|
||||||
|
GitHub #416 (Ian)
|
||||||
|
repmgr: actively check for node to rejoin cluster; GitHub #415 (Ian)
|
||||||
|
repmgr: enable pg_rewind to be used with PostgreSQL 9.3/9.4; GitHub #413 (Ian)
|
||||||
|
repmgr: fix minimum accepted value for "degraded_monitoring_timeout";
|
||||||
|
GitHub #411 (Ian)
|
||||||
|
repmgr: fix superuser password handling; GitHub #400 (Ian)
|
||||||
|
repmgr: fix parsing of "archive_ready_critical" configuration file
|
||||||
|
parameter; GitHub #426 (Ian)
|
||||||
|
repmgr: fix display of conninfo parsing error messages (Ian)
|
||||||
|
repmgr: fix "repmgr cluster crosscheck" output; GitHub #389 (Ian)
|
||||||
|
repmgrd: prevent standby connection handle from going stale (Ian)
|
||||||
|
repmgrd: fix memory leaks in witness code; GitHub #402 (AndrzejNowicki, Martín)
|
||||||
|
repmgrd: handle "pg_ctl promote" timeout; GitHub #425 (Ian)
|
||||||
|
repmgrd: handle failover situation with only two nodes in the primary
|
||||||
|
location, and at least one node in another location; GitHub #407 (Ian)
|
||||||
|
repmgrd: set "connect_timeout=2" when pinging a server (Ian)
|
||||||
|
|
||||||
|
4.0.4 2018-03-09
|
||||||
|
repmgr: add "standby clone --recovery-conf-only" option; GitHub #382 (Ian)
|
||||||
|
repmgr: make "standby promote" timeout values configurable; GitHub #387 (Ian)
|
||||||
|
repmgr: improve replication slot warnings generated by "node status";
|
||||||
|
GitHub #385 (Ian)
|
||||||
|
repmgr: remove restriction on replication slots when cloning from
|
||||||
|
a Barman server; GitHub #379 (Ian)
|
||||||
|
repmgr: ensure "node rejoin" honours "--dry-run" option; GitHub #383 (Ian)
|
||||||
|
repmgr: fix --superuser handling when cloning a standby; GitHub #380 (Ian)
|
||||||
|
repmgr: update various help options; GitHub #391, #392 (hasegeli)
|
||||||
|
repmgrd: add event "repmgrd_shutdown"; GitHub #393 (Ian)
|
||||||
|
repmgrd: improve detection of status change from primary to standby (Ian)
|
||||||
|
repmgrd: improve log output in various situations (Ian)
|
||||||
|
repmgrd: improve reconnection to the local node after a failover (Ian)
|
||||||
|
repmgrd: ensure witness server connects to new primary after a failover (Ian)
|
||||||
|
|
||||||
|
4.0.3 2018-02-15
|
||||||
|
repmgr: improve switchover handling when "pg_ctl" used to control the
|
||||||
|
server and logging output is not explicitly redirected (Ian)
|
||||||
|
repmgr: improve switchover log messages and exit code when old primary could
|
||||||
|
not be shut down cleanly (Ian)
|
||||||
|
repmgr: check demotion candidate can make a replication connection to the
|
||||||
|
promotion candidate before executing a switchover; GitHub #370 (Ian)
|
||||||
|
repmgr: add check for sufficient walsenders/replication slots before executing
|
||||||
|
a switchover; GitHub #371 (Ian)
|
||||||
|
repmgr: add --dry-run mode to "repmgr standby follow"; GitHub #368 (Ian)
|
||||||
|
repmgr: provide information about the primary node for "standby_register" and
|
||||||
|
"standby_follow" event notifications; GitHub #375 (Ian)
|
||||||
|
repmgr: add "standby_register_sync" event notification; GitHub #374 (Ian)
|
||||||
|
repmgr: output any connection error messages in "cluster show"'s list of
|
||||||
|
warnings; GitHub #369 (Ian)
|
||||||
|
repmgr: ensure an inactive data directory can be deleted; GitHub #366 (Ian)
|
||||||
|
repmgr: fix upstream node display in "repmgr node status"; GitHub #363 (fanf2)
|
||||||
|
repmgr: improve/clarify documentation and update --help output for
|
||||||
|
"primary unregister"; GitHub #373 (Ian)
|
||||||
|
repmgr: allow replication slots when Barman is configured; GitHub #379 (Ian)
|
||||||
|
repmgr: fix parsing of "pg_basebackup_options"; GitHub #376 (Ian)
|
||||||
|
repmgr: ensure "pg_subtrans" directory is created when cloning a standby in
|
||||||
|
Barman mode (Ian)
|
||||||
|
repmgr: fix primary node check in "witness register"; GitHub #377 (Ian)
|
||||||
|
|
||||||
|
4.0.2 2018-01-18
|
||||||
|
repmgr: add missing -W option to getopt_long() invocation; GitHub #350 (Ian)
|
||||||
|
repmgr: automatically create slot name if missing; GitHub #343 (Ian)
|
||||||
|
repmgr: fixes to parsing output of remote repmgr invocations; GitHub #349 (Ian)
|
||||||
|
repmgr: BDR support - create missing connection replication set
|
||||||
|
if required; GitHub #347 (Ian)
|
||||||
|
repmgr: handle missing node record in "repmgr node rejoin"; GitHub #358 (Ian)
|
||||||
|
repmgr: enable documentation to be build as single HTML file; GitHub #353 (fanf2)
|
||||||
|
repmgr: recognize "--terse" option for "repmgr cluster event"; GitHub #360 (Ian)
|
||||||
|
repmgr: add "--wait-start" option for "repmgr standby register"; GitHub #356 (Ian)
|
||||||
|
repmgr: add "%p" event notification parameter for "repmgr standby switchover"
|
||||||
|
containing the node ID of the demoted primary (Ian)
|
||||||
|
docs: various fixes and updates (Ian, Daymel, Martín, ams)
|
||||||
|
|
||||||
|
4.0.1 2017-12-13
|
||||||
|
repmgr: ensure "repmgr node check --action=" returns appropriate return
|
||||||
|
code; GitHub #340 (Ian)
|
||||||
|
repmgr: add missing schema qualification in get_all_node_records_with_upstream()
|
||||||
|
query GitHub #341 (Martín)
|
||||||
|
repmgr: initialise "voting_term" table in application, not extension SQL;
|
||||||
|
GitHub #344 (Ian)
|
||||||
|
repmgr: delete any replication slots copied by pg_rewind; GitHub #334 (Ian)
|
||||||
|
repmgr: fix configuration file sanity check; GitHub #342 (Ian)
|
||||||
|
|
||||||
|
4.0.0 2017-11-21
|
||||||
|
Complete rewrite with many changes; for details see the repmgr 4.0.0 release
|
||||||
|
notes at: https://repmgr.org/docs/4.0/release-4.0.0.html
|
||||||
|
|
||||||
3.3.2 2017-06-01
|
3.3.2 2017-06-01
|
||||||
Add support for PostgreSQL 10 (Ian)
|
Add support for PostgreSQL 10 (Ian)
|
||||||
|
|||||||
20
Makefile.in
20
Makefile.in
@@ -11,7 +11,11 @@ EXTENSION = repmgr
|
|||||||
|
|
||||||
DATA = \
|
DATA = \
|
||||||
repmgr--unpackaged--4.0.sql \
|
repmgr--unpackaged--4.0.sql \
|
||||||
repmgr--4.0.sql
|
repmgr--4.0.sql \
|
||||||
|
repmgr--4.0--4.1.sql \
|
||||||
|
repmgr--4.1.sql \
|
||||||
|
repmgr--4.1--4.2.sql \
|
||||||
|
repmgr--4.2.sql
|
||||||
|
|
||||||
REGRESS = repmgr_extension
|
REGRESS = repmgr_extension
|
||||||
|
|
||||||
@@ -26,20 +30,26 @@ all: \
|
|||||||
PG_CPPFLAGS = -std=gnu89 -I$(includedir_internal) -I$(libpq_srcdir) -Wall -Wmissing-prototypes -Wmissing-declarations $(EXTRA_CFLAGS)
|
PG_CPPFLAGS = -std=gnu89 -I$(includedir_internal) -I$(libpq_srcdir) -Wall -Wmissing-prototypes -Wmissing-declarations $(EXTRA_CFLAGS)
|
||||||
SHLIB_LINK = $(libpq)
|
SHLIB_LINK = $(libpq)
|
||||||
|
|
||||||
HEADERS = $(wildcard *.h)
|
|
||||||
|
|
||||||
OBJS = \
|
OBJS = \
|
||||||
repmgr.o
|
repmgr.o
|
||||||
|
|
||||||
include Makefile.global
|
include Makefile.global
|
||||||
|
|
||||||
|
ifeq ($(vpath_build),yes)
|
||||||
|
HEADERS = $(wildcard *.h)
|
||||||
|
else
|
||||||
|
HEADERS_built = $(wildcard *.h)
|
||||||
|
endif
|
||||||
|
|
||||||
$(info Building against PostgreSQL $(MAJORVERSION))
|
$(info Building against PostgreSQL $(MAJORVERSION))
|
||||||
|
|
||||||
REPMGR_CLIENT_OBJS = repmgr-client.o \
|
REPMGR_CLIENT_OBJS = repmgr-client.o \
|
||||||
repmgr-action-primary.o repmgr-action-standby.o repmgr-action-bdr.o repmgr-action-cluster.o repmgr-action-node.o \
|
repmgr-action-primary.o repmgr-action-standby.o repmgr-action-witness.o \
|
||||||
|
repmgr-action-bdr.o repmgr-action-cluster.o repmgr-action-node.o repmgr-action-daemon.o \
|
||||||
configfile.o log.o strutil.o controldata.o dirutil.o compat.o dbutils.o
|
configfile.o log.o strutil.o controldata.o dirutil.o compat.o dbutils.o
|
||||||
REPMGRD_OBJS = repmgrd.o repmgrd-physical.o repmgrd-bdr.o configfile.o log.o dbutils.o strutil.o controldata.o
|
REPMGRD_OBJS = repmgrd.o repmgrd-physical.o repmgrd-bdr.o configfile.o log.o dbutils.o strutil.o controldata.o compat.o
|
||||||
DATE=$(shell date "+%Y-%m-%d")
|
DATE=$(shell date "+%Y-%m-%d")
|
||||||
|
|
||||||
repmgr_version.h: repmgr_version.h.in
|
repmgr_version.h: repmgr_version.h.in
|
||||||
@@ -77,9 +87,11 @@ additional-clean:
|
|||||||
rm -f repmgr-client.o
|
rm -f repmgr-client.o
|
||||||
rm -f repmgr-action-primary.o
|
rm -f repmgr-action-primary.o
|
||||||
rm -f repmgr-action-standby.o
|
rm -f repmgr-action-standby.o
|
||||||
|
rm -f repmgr-action-witness.o
|
||||||
rm -f repmgr-action-bdr.o
|
rm -f repmgr-action-bdr.o
|
||||||
rm -f repmgr-action-node.o
|
rm -f repmgr-action-node.o
|
||||||
rm -f repmgr-action-cluster.o
|
rm -f repmgr-action-cluster.o
|
||||||
|
rm -f repmgr-action-daemon.o
|
||||||
rm -f repmgrd.o
|
rm -f repmgrd.o
|
||||||
rm -f repmgrd-physical.o
|
rm -f repmgrd-physical.o
|
||||||
rm -f repmgrd-bdr.o
|
rm -f repmgrd-bdr.o
|
||||||
|
|||||||
20
TODO.md
Normal file
20
TODO.md
Normal file
@@ -0,0 +1,20 @@
|
|||||||
|
TODO
|
||||||
|
====
|
||||||
|
|
||||||
|
This file contains a list of improvements which are desireable and/or have
|
||||||
|
been requested, and which we aim to address/implement when time and resources
|
||||||
|
permit.
|
||||||
|
|
||||||
|
It is *not* a roadmap and there's no guarantee of any item being implemented
|
||||||
|
within any given timeframe.
|
||||||
|
|
||||||
|
|
||||||
|
Enable suspension of repmgrd failover
|
||||||
|
-------------------------------------
|
||||||
|
|
||||||
|
When performing maintenance, e.g. a switchover, it's necessary to stop all
|
||||||
|
repmgrd nodes to prevent unintended failover; this is obviously inconvenient.
|
||||||
|
We'll need to implement some way of notifying each repmgrd to suspend automatic
|
||||||
|
failover until further notice.
|
||||||
|
|
||||||
|
Requested in GitHub #410 ( https://github.com/2ndQuadrant/repmgr/issues/410 )
|
||||||
2
compat.c
2
compat.c
@@ -6,7 +6,7 @@
|
|||||||
* supported PostgreSQL versions. They're unlikely to change but
|
* supported PostgreSQL versions. They're unlikely to change but
|
||||||
* it would be worth keeping an eye on them for any fixes/improvements.
|
* it would be worth keeping an eye on them for any fixes/improvements.
|
||||||
*
|
*
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
* Copyright (c) 2ndQuadrant, 2010-2018
|
||||||
*
|
*
|
||||||
* Portions Copyright (c) 1996-2013, PostgreSQL Global Development Group
|
* Portions Copyright (c) 1996-2013, PostgreSQL Global Development Group
|
||||||
* Portions Copyright (c) 1994, Regents of the University of California
|
* Portions Copyright (c) 1994, Regents of the University of California
|
||||||
|
|||||||
2
compat.h
2
compat.h
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* compat.h
|
* compat.h
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
* Copyright (c) 2ndQuadrant, 2010-2018
|
||||||
*
|
*
|
||||||
* Portions Copyright (c) 1996-2013, PostgreSQL Global Development Group
|
* Portions Copyright (c) 1996-2013, PostgreSQL Global Development Group
|
||||||
* Portions Copyright (c) 1994, Regents of the University of California
|
* Portions Copyright (c) 1994, Regents of the University of California
|
||||||
|
|||||||
@@ -1,4 +1,2 @@
|
|||||||
/* config.h.in. Generated from configure.in by autoheader. */
|
/* config.h.in. Generated from configure.in by autoheader. */
|
||||||
|
|
||||||
/* Only build repmgr for BDR */
|
|
||||||
#undef BDR_ONLY
|
|
||||||
|
|||||||
416
configfile.c
416
configfile.c
@@ -1,7 +1,7 @@
|
|||||||
/*
|
/*
|
||||||
* config.c - parse repmgr.conf and other configuration-related functionality
|
* config.c - parse repmgr.conf and other configuration-related functionality
|
||||||
*
|
*
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
* Copyright (c) 2ndQuadrant, 2010-2018
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -28,10 +28,8 @@ char config_file_path[MAXPGPATH] = "";
|
|||||||
static bool config_file_provided = false;
|
static bool config_file_provided = false;
|
||||||
bool config_file_found = false;
|
bool config_file_found = false;
|
||||||
|
|
||||||
|
static void parse_config(t_configuration_options *options, bool terse);
|
||||||
static void _parse_config(t_configuration_options *options, ItemList *error_list, ItemList *warning_list);
|
static void _parse_config(t_configuration_options *options, ItemList *error_list, ItemList *warning_list);
|
||||||
static bool parse_bool(const char *s,
|
|
||||||
const char *config_item,
|
|
||||||
ItemList *error_list);
|
|
||||||
|
|
||||||
static void _parse_line(char *buf, char *name, char *value);
|
static void _parse_line(char *buf, char *name, char *value);
|
||||||
static void parse_event_notifications_list(t_configuration_options *options, const char *arg);
|
static void parse_event_notifications_list(t_configuration_options *options, const char *arg);
|
||||||
@@ -73,6 +71,56 @@ load_config(const char *config_file, bool verbose, bool terse, t_configuration_o
|
|||||||
strncpy(config_file_path, config_file, MAXPGPATH);
|
strncpy(config_file_path, config_file, MAXPGPATH);
|
||||||
canonicalize_path(config_file_path);
|
canonicalize_path(config_file_path);
|
||||||
|
|
||||||
|
/* relative path supplied - convert to absolute path */
|
||||||
|
if (config_file_path[0] != '/')
|
||||||
|
{
|
||||||
|
PQExpBufferData fullpath;
|
||||||
|
char *pwd = NULL;
|
||||||
|
|
||||||
|
initPQExpBuffer(&fullpath);
|
||||||
|
|
||||||
|
/*
|
||||||
|
* we'll attempt to use $PWD to derive the effective path; getcwd()
|
||||||
|
* will likely resolve symlinks, which may result in a path which
|
||||||
|
* isn't permanent (e.g. if filesystem mountpoints change).
|
||||||
|
*/
|
||||||
|
pwd = getenv("PWD");
|
||||||
|
|
||||||
|
if (pwd != NULL)
|
||||||
|
{
|
||||||
|
appendPQExpBufferStr(&fullpath, pwd);
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
/* $PWD not available - fall back to getcwd() */
|
||||||
|
char cwd[MAXPGPATH] = "";
|
||||||
|
|
||||||
|
if (getcwd(cwd, MAXPGPATH) == NULL)
|
||||||
|
{
|
||||||
|
log_error(_("unable to execute getcwd()"));
|
||||||
|
log_detail("%s", strerror(errno));
|
||||||
|
|
||||||
|
termPQExpBuffer(&fullpath);
|
||||||
|
exit(ERR_BAD_CONFIG);
|
||||||
|
}
|
||||||
|
|
||||||
|
appendPQExpBufferStr(&fullpath, cwd);
|
||||||
|
}
|
||||||
|
|
||||||
|
appendPQExpBuffer(&fullpath,
|
||||||
|
"/%s", config_file_path);
|
||||||
|
|
||||||
|
log_debug("relative configuration file converted to:\n \"%s\"",
|
||||||
|
fullpath.data);
|
||||||
|
|
||||||
|
strncpy(config_file_path, fullpath.data, MAXPGPATH);
|
||||||
|
|
||||||
|
termPQExpBuffer(&fullpath);
|
||||||
|
|
||||||
|
canonicalize_path(config_file_path);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
if (stat(config_file_path, &stat_config) != 0)
|
if (stat(config_file_path, &stat_config) != 0)
|
||||||
{
|
{
|
||||||
log_error(_("provided configuration file \"%s\" not found: %s"),
|
log_error(_("provided configuration file \"%s\" not found: %s"),
|
||||||
@@ -81,6 +129,7 @@ load_config(const char *config_file, bool verbose, bool terse, t_configuration_o
|
|||||||
exit(ERR_BAD_CONFIG);
|
exit(ERR_BAD_CONFIG);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
if (verbose == true)
|
if (verbose == true)
|
||||||
{
|
{
|
||||||
log_notice(_("using provided configuration file \"%s\""), config_file);
|
log_notice(_("using provided configuration file \"%s\""), config_file);
|
||||||
@@ -187,7 +236,7 @@ end_search:
|
|||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
void
|
static void
|
||||||
parse_config(t_configuration_options *options, bool terse)
|
parse_config(t_configuration_options *options, bool terse)
|
||||||
{
|
{
|
||||||
/* Collate configuration file errors here for friendlier reporting */
|
/* Collate configuration file errors here for friendlier reporting */
|
||||||
@@ -234,7 +283,9 @@ _parse_config(t_configuration_options *options, ItemList *error_list, ItemList *
|
|||||||
memset(options->node_name, 0, sizeof(options->node_name));
|
memset(options->node_name, 0, sizeof(options->node_name));
|
||||||
memset(options->conninfo, 0, sizeof(options->conninfo));
|
memset(options->conninfo, 0, sizeof(options->conninfo));
|
||||||
memset(options->data_directory, 0, sizeof(options->data_directory));
|
memset(options->data_directory, 0, sizeof(options->data_directory));
|
||||||
|
memset(options->config_directory, 0, sizeof(options->data_directory));
|
||||||
memset(options->pg_bindir, 0, sizeof(options->pg_bindir));
|
memset(options->pg_bindir, 0, sizeof(options->pg_bindir));
|
||||||
|
memset(options->repmgr_bindir, 0, sizeof(options->repmgr_bindir));
|
||||||
options->replication_type = REPLICATION_TYPE_PHYSICAL;
|
options->replication_type = REPLICATION_TYPE_PHYSICAL;
|
||||||
|
|
||||||
/*-------------
|
/*-------------
|
||||||
@@ -249,7 +300,7 @@ _parse_config(t_configuration_options *options, ItemList *error_list, ItemList *
|
|||||||
options->log_status_interval = DEFAULT_LOG_STATUS_INTERVAL;
|
options->log_status_interval = DEFAULT_LOG_STATUS_INTERVAL;
|
||||||
|
|
||||||
/*-----------------------
|
/*-----------------------
|
||||||
* standby action settings
|
* standby clone settings
|
||||||
*------------------------
|
*------------------------
|
||||||
*/
|
*/
|
||||||
options->use_replication_slots = false;
|
options->use_replication_slots = false;
|
||||||
@@ -260,7 +311,30 @@ _parse_config(t_configuration_options *options, ItemList *error_list, ItemList *
|
|||||||
options->tablespace_mapping.tail = NULL;
|
options->tablespace_mapping.tail = NULL;
|
||||||
memset(options->recovery_min_apply_delay, 0, sizeof(options->recovery_min_apply_delay));
|
memset(options->recovery_min_apply_delay, 0, sizeof(options->recovery_min_apply_delay));
|
||||||
options->recovery_min_apply_delay_provided = false;
|
options->recovery_min_apply_delay_provided = false;
|
||||||
|
memset(options->archive_cleanup_command, 0, sizeof(options->archive_cleanup_command));
|
||||||
options->use_primary_conninfo_password = false;
|
options->use_primary_conninfo_password = false;
|
||||||
|
memset(options->passfile, 0, sizeof(options->passfile));
|
||||||
|
|
||||||
|
/*-------------------------
|
||||||
|
* standby promote settings
|
||||||
|
*-------------------------
|
||||||
|
*/
|
||||||
|
options->promote_check_timeout = DEFAULT_PROMOTE_CHECK_TIMEOUT;
|
||||||
|
options->promote_check_interval = DEFAULT_PROMOTE_CHECK_INTERVAL;
|
||||||
|
|
||||||
|
/*------------------------
|
||||||
|
* standby follow settings
|
||||||
|
*------------------------
|
||||||
|
*/
|
||||||
|
options->primary_follow_timeout = DEFAULT_PRIMARY_FOLLOW_TIMEOUT;
|
||||||
|
options->standby_follow_timeout = DEFAULT_STANDBY_FOLLOW_TIMEOUT;
|
||||||
|
|
||||||
|
/*------------------------
|
||||||
|
* standby switchover settings
|
||||||
|
*------------------------
|
||||||
|
*/
|
||||||
|
options->shutdown_check_timeout = DEFAULT_SHUTDOWN_CHECK_TIMEOUT;
|
||||||
|
options->standby_reconnect_timeout = DEFAULT_STANDBY_RECONNECT_TIMEOUT;
|
||||||
|
|
||||||
/*-----------------
|
/*-----------------
|
||||||
* repmgrd settings
|
* repmgrd settings
|
||||||
@@ -281,7 +355,14 @@ _parse_config(t_configuration_options *options, ItemList *error_list, ItemList *
|
|||||||
options->degraded_monitoring_timeout = -1;
|
options->degraded_monitoring_timeout = -1;
|
||||||
options->async_query_timeout = DEFAULT_ASYNC_QUERY_TIMEOUT;
|
options->async_query_timeout = DEFAULT_ASYNC_QUERY_TIMEOUT;
|
||||||
options->primary_notification_timeout = DEFAULT_PRIMARY_NOTIFICATION_TIMEOUT;
|
options->primary_notification_timeout = DEFAULT_PRIMARY_NOTIFICATION_TIMEOUT;
|
||||||
options->primary_follow_timeout = DEFAULT_PRIMARY_FOLLOW_TIMEOUT;
|
options->repmgrd_standby_startup_timeout = -1; /* defaults to "standby_reconnect_timeout" if not set */
|
||||||
|
memset(options->repmgrd_pid_file, 0, sizeof(options->repmgrd_pid_file));
|
||||||
|
|
||||||
|
/*-------------
|
||||||
|
* witness settings
|
||||||
|
*-------------
|
||||||
|
*/
|
||||||
|
options->witness_sync_interval = DEFAULT_WITNESS_SYNC_INTERVAL;
|
||||||
|
|
||||||
/*-------------
|
/*-------------
|
||||||
* BDR settings
|
* BDR settings
|
||||||
@@ -394,6 +475,9 @@ _parse_config(t_configuration_options *options, ItemList *error_list, ItemList *
|
|||||||
strncpy(options->conninfo, value, MAXLEN);
|
strncpy(options->conninfo, value, MAXLEN);
|
||||||
else if (strcmp(name, "data_directory") == 0)
|
else if (strcmp(name, "data_directory") == 0)
|
||||||
strncpy(options->data_directory, value, MAXPGPATH);
|
strncpy(options->data_directory, value, MAXPGPATH);
|
||||||
|
else if (strcmp(name, "config_directory") == 0)
|
||||||
|
strncpy(options->config_directory, value, MAXPGPATH);
|
||||||
|
|
||||||
else if (strcmp(name, "replication_user") == 0)
|
else if (strcmp(name, "replication_user") == 0)
|
||||||
{
|
{
|
||||||
if (strlen(value) < NAMEDATALEN)
|
if (strlen(value) < NAMEDATALEN)
|
||||||
@@ -404,6 +488,8 @@ _parse_config(t_configuration_options *options, ItemList *error_list, ItemList *
|
|||||||
}
|
}
|
||||||
else if (strcmp(name, "pg_bindir") == 0)
|
else if (strcmp(name, "pg_bindir") == 0)
|
||||||
strncpy(options->pg_bindir, value, MAXPGPATH);
|
strncpy(options->pg_bindir, value, MAXPGPATH);
|
||||||
|
else if (strcmp(name, "repmgr_bindir") == 0)
|
||||||
|
strncpy(options->repmgr_bindir, value, MAXPGPATH);
|
||||||
|
|
||||||
else if (strcmp(name, "replication_type") == 0)
|
else if (strcmp(name, "replication_type") == 0)
|
||||||
{
|
{
|
||||||
@@ -439,13 +525,40 @@ _parse_config(t_configuration_options *options, ItemList *error_list, ItemList *
|
|||||||
parse_time_unit_parameter(name, value, options->recovery_min_apply_delay, error_list);
|
parse_time_unit_parameter(name, value, options->recovery_min_apply_delay, error_list);
|
||||||
options->recovery_min_apply_delay_provided = true;
|
options->recovery_min_apply_delay_provided = true;
|
||||||
}
|
}
|
||||||
|
else if (strcmp(name, "archive_cleanup_command") == 0)
|
||||||
|
strncpy(options->archive_cleanup_command, value, MAXLEN);
|
||||||
else if (strcmp(name, "use_primary_conninfo_password") == 0)
|
else if (strcmp(name, "use_primary_conninfo_password") == 0)
|
||||||
options->use_primary_conninfo_password = parse_bool(value, name, error_list);
|
options->use_primary_conninfo_password = parse_bool(value, name, error_list);
|
||||||
|
else if (strcmp(name, "passfile") == 0)
|
||||||
|
strncpy(options->passfile, value, sizeof(options->passfile));
|
||||||
|
|
||||||
|
/* standby promote settings */
|
||||||
|
else if (strcmp(name, "promote_check_timeout") == 0)
|
||||||
|
options->promote_check_timeout = repmgr_atoi(value, name, error_list, 1);
|
||||||
|
|
||||||
|
else if (strcmp(name, "promote_check_interval") == 0)
|
||||||
|
options->promote_check_interval = repmgr_atoi(value, name, error_list, 1);
|
||||||
|
|
||||||
|
/* standby follow settings */
|
||||||
|
else if (strcmp(name, "primary_follow_timeout") == 0)
|
||||||
|
options->primary_follow_timeout = repmgr_atoi(value, name, error_list, 0);
|
||||||
|
else if (strcmp(name, "standby_follow_timeout") == 0)
|
||||||
|
options->standby_follow_timeout = repmgr_atoi(value, name, error_list, 0);
|
||||||
|
|
||||||
|
/* standby switchover settings */
|
||||||
|
else if (strcmp(name, "shutdown_check_timeout") == 0)
|
||||||
|
options->shutdown_check_timeout = repmgr_atoi(value, name, error_list, 0);
|
||||||
|
else if (strcmp(name, "standby_reconnect_timeout") == 0)
|
||||||
|
options->standby_reconnect_timeout = repmgr_atoi(value, name, error_list, 0);
|
||||||
|
|
||||||
|
/* node rejoin settings */
|
||||||
|
else if (strcmp(name, "node_rejoin_timeout") == 0)
|
||||||
|
options->node_rejoin_timeout = repmgr_atoi(value, name, error_list, 0);
|
||||||
|
|
||||||
/* node check settings */
|
/* node check settings */
|
||||||
else if (strcmp(name, "archive_ready_warning") == 0)
|
else if (strcmp(name, "archive_ready_warning") == 0)
|
||||||
options->archive_ready_warning = repmgr_atoi(value, name, error_list, 1);
|
options->archive_ready_warning = repmgr_atoi(value, name, error_list, 1);
|
||||||
else if (strcmp(name, "archive_ready_critcial") == 0)
|
else if (strcmp(name, "archive_ready_critical") == 0)
|
||||||
options->archive_ready_critical = repmgr_atoi(value, name, error_list, 1);
|
options->archive_ready_critical = repmgr_atoi(value, name, error_list, 1);
|
||||||
else if (strcmp(name, "replication_lag_warning") == 0)
|
else if (strcmp(name, "replication_lag_warning") == 0)
|
||||||
options->replication_lag_warning = repmgr_atoi(value, name, error_list, 1);
|
options->replication_lag_warning = repmgr_atoi(value, name, error_list, 1);
|
||||||
@@ -486,13 +599,19 @@ _parse_config(t_configuration_options *options, ItemList *error_list, ItemList *
|
|||||||
else if (strcmp(name, "monitoring_history") == 0)
|
else if (strcmp(name, "monitoring_history") == 0)
|
||||||
options->monitoring_history = parse_bool(value, name, error_list);
|
options->monitoring_history = parse_bool(value, name, error_list);
|
||||||
else if (strcmp(name, "degraded_monitoring_timeout") == 0)
|
else if (strcmp(name, "degraded_monitoring_timeout") == 0)
|
||||||
options->degraded_monitoring_timeout = repmgr_atoi(value, name, error_list, 1);
|
options->degraded_monitoring_timeout = repmgr_atoi(value, name, error_list, -1);
|
||||||
else if (strcmp(name, "async_query_timeout") == 0)
|
else if (strcmp(name, "async_query_timeout") == 0)
|
||||||
options->async_query_timeout = repmgr_atoi(value, name, error_list, 0);
|
options->async_query_timeout = repmgr_atoi(value, name, error_list, 0);
|
||||||
else if (strcmp(name, "primary_notification_timeout") == 0)
|
else if (strcmp(name, "primary_notification_timeout") == 0)
|
||||||
options->primary_notification_timeout = repmgr_atoi(value, name, error_list, 0);
|
options->primary_notification_timeout = repmgr_atoi(value, name, error_list, 0);
|
||||||
else if (strcmp(name, "primary_follow_timeout") == 0)
|
else if (strcmp(name, "repmgrd_standby_startup_timeout") == 0)
|
||||||
options->primary_follow_timeout = repmgr_atoi(value, name, error_list, 0);
|
options->repmgrd_standby_startup_timeout = repmgr_atoi(value, name, error_list, 0);
|
||||||
|
else if (strcmp(name, "repmgrd_pid_file") == 0)
|
||||||
|
strncpy(options->repmgrd_pid_file, value, MAXPGPATH);
|
||||||
|
|
||||||
|
/* witness settings */
|
||||||
|
else if (strcmp(name, "witness_sync_interval") == 0)
|
||||||
|
options->witness_sync_interval = repmgr_atoi(value, name, error_list, 1);
|
||||||
|
|
||||||
/* BDR settings */
|
/* BDR settings */
|
||||||
else if (strcmp(name, "bdr_local_monitoring_only") == 0)
|
else if (strcmp(name, "bdr_local_monitoring_only") == 0)
|
||||||
@@ -604,7 +723,7 @@ _parse_config(t_configuration_options *options, ItemList *error_list, ItemList *
|
|||||||
* Raise an error if a known parameter is provided with an empty
|
* Raise an error if a known parameter is provided with an empty
|
||||||
* value. Currently there's no reason why empty parameters are needed;
|
* value. Currently there's no reason why empty parameters are needed;
|
||||||
* if we want to accept those, we'd need to add stricter default
|
* if we want to accept those, we'd need to add stricter default
|
||||||
* checking, as currently e.g. an empty `node` value will be converted
|
* checking, as currently e.g. an empty `node_id` value will be converted
|
||||||
* to '0'.
|
* to '0'.
|
||||||
*/
|
*/
|
||||||
if (known_parameter == true && !strlen(value))
|
if (known_parameter == true && !strlen(value))
|
||||||
@@ -670,6 +789,17 @@ _parse_config(t_configuration_options *options, ItemList *error_list, ItemList *
|
|||||||
PQconninfoFree(conninfo_options);
|
PQconninfoFree(conninfo_options);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/* set values for parameters which default to other parameters */
|
||||||
|
|
||||||
|
/*
|
||||||
|
* From 4.1, "repmgrd_standby_startup_timeout" replaces "standby_reconnect_timeout"
|
||||||
|
* in repmgrd; fall back to "standby_reconnect_timeout" if no value explicitly provided
|
||||||
|
*/
|
||||||
|
if (options->repmgrd_standby_startup_timeout == -1)
|
||||||
|
{
|
||||||
|
options->repmgrd_standby_startup_timeout = options->standby_reconnect_timeout;
|
||||||
|
}
|
||||||
|
|
||||||
/* add warning about changed "barman_" parameter meanings */
|
/* add warning about changed "barman_" parameter meanings */
|
||||||
if ((options->barman_host[0] == '\0' && options->barman_server[0] != '\0') ||
|
if ((options->barman_host[0] == '\0' && options->barman_server[0] != '\0') ||
|
||||||
(options->barman_host[0] != '\0' && options->barman_server[0] == '\0'))
|
(options->barman_host[0] != '\0' && options->barman_server[0] == '\0'))
|
||||||
@@ -677,7 +807,7 @@ _parse_config(t_configuration_options *options, ItemList *error_list, ItemList *
|
|||||||
item_list_append(error_list,
|
item_list_append(error_list,
|
||||||
_("use \"barman_host\" for the hostname of the Barman server"));
|
_("use \"barman_host\" for the hostname of the Barman server"));
|
||||||
item_list_append(error_list,
|
item_list_append(error_list,
|
||||||
_("use \"barman_server\" for the name of the [server] section in the Barman configururation file"));
|
_("use \"barman_server\" for the name of the [server] section in the Barman configuration file"));
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -694,6 +824,12 @@ _parse_config(t_configuration_options *options, ItemList *error_list, ItemList *
|
|||||||
item_list_append(error_list,
|
item_list_append(error_list,
|
||||||
_("\replication_lag_critical\" must be greater than \"replication_lag_warning\""));
|
_("\replication_lag_critical\" must be greater than \"replication_lag_warning\""));
|
||||||
}
|
}
|
||||||
|
|
||||||
|
if (options->standby_reconnect_timeout < options->node_rejoin_timeout)
|
||||||
|
{
|
||||||
|
item_list_append(error_list,
|
||||||
|
_("\"standby_reconnect_timeout\" must be equal to or greater than \"node_rejoin_timeout\""));
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
@@ -858,12 +994,11 @@ parse_time_unit_parameter(const char *name, const char *value, char *dest, ItemL
|
|||||||
char *ptr = NULL;
|
char *ptr = NULL;
|
||||||
int targ = strtol(value, &ptr, 10);
|
int targ = strtol(value, &ptr, 10);
|
||||||
|
|
||||||
if (targ < 1)
|
if (targ < 0)
|
||||||
{
|
{
|
||||||
if (errors != NULL)
|
if (errors != NULL)
|
||||||
{
|
{
|
||||||
item_list_append_format(
|
item_list_append_format(errors,
|
||||||
errors,
|
|
||||||
_("invalid value provided for \"%s\""),
|
_("invalid value provided for \"%s\""),
|
||||||
name);
|
name);
|
||||||
}
|
}
|
||||||
@@ -917,13 +1052,16 @@ parse_time_unit_parameter(const char *name, const char *value, char *dest, ItemL
|
|||||||
* - promote_delay
|
* - promote_delay
|
||||||
* - reconnect_attempts
|
* - reconnect_attempts
|
||||||
* - reconnect_interval
|
* - reconnect_interval
|
||||||
|
* - repmgrd_standby_startup_timeout
|
||||||
* - retry_promote_interval_secs
|
* - retry_promote_interval_secs
|
||||||
*
|
*
|
||||||
* non-changeable options
|
* non-changeable options (repmgrd references these from the "repmgr.nodes"
|
||||||
|
* table, not the configuration file)
|
||||||
*
|
*
|
||||||
* - node_id
|
* - node_id
|
||||||
* - node_name
|
* - node_name
|
||||||
* - data_directory
|
* - data_directory
|
||||||
|
* - location
|
||||||
* - priority
|
* - priority
|
||||||
* - replication_type
|
* - replication_type
|
||||||
*
|
*
|
||||||
@@ -932,7 +1070,7 @@ parse_time_unit_parameter(const char *name, const char *value, char *dest, ItemL
|
|||||||
|
|
||||||
*/
|
*/
|
||||||
bool
|
bool
|
||||||
reload_config(t_configuration_options *orig_options)
|
reload_config(t_configuration_options *orig_options, t_server_type server_type)
|
||||||
{
|
{
|
||||||
PGconn *conn;
|
PGconn *conn;
|
||||||
t_configuration_options new_options = T_CONFIGURATION_OPTIONS_INITIALIZER;
|
t_configuration_options new_options = T_CONFIGURATION_OPTIONS_INITIALIZER;
|
||||||
@@ -942,17 +1080,50 @@ reload_config(t_configuration_options *orig_options)
|
|||||||
static ItemList config_errors = {NULL, NULL};
|
static ItemList config_errors = {NULL, NULL};
|
||||||
static ItemList config_warnings = {NULL, NULL};
|
static ItemList config_warnings = {NULL, NULL};
|
||||||
|
|
||||||
|
PQExpBufferData errors;
|
||||||
|
|
||||||
log_info(_("reloading configuration file"));
|
log_info(_("reloading configuration file"));
|
||||||
|
|
||||||
_parse_config(&new_options, &config_errors, &config_warnings);
|
_parse_config(&new_options, &config_errors, &config_warnings);
|
||||||
|
|
||||||
|
|
||||||
|
if (server_type == PRIMARY || server_type == STANDBY)
|
||||||
|
{
|
||||||
|
if (new_options.promote_command[0] == '\0')
|
||||||
|
{
|
||||||
|
item_list_append(&config_errors, _("\"promote_command\": required parameter was not found"));
|
||||||
|
}
|
||||||
|
|
||||||
|
if (new_options.follow_command[0] == '\0')
|
||||||
|
{
|
||||||
|
item_list_append(&config_errors, _("\"follow_command\": required parameter was not found"));
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
if (config_errors.head != NULL)
|
if (config_errors.head != NULL)
|
||||||
{
|
{
|
||||||
/* XXX dump errors to log */
|
ItemListCell *cell = NULL;
|
||||||
|
|
||||||
log_warning(_("unable to parse new configuration, retaining current configuration"));
|
log_warning(_("unable to parse new configuration, retaining current configuration"));
|
||||||
|
|
||||||
|
initPQExpBuffer(&errors);
|
||||||
|
|
||||||
|
appendPQExpBufferStr(&errors,
|
||||||
|
"following errors were detected:\n");
|
||||||
|
|
||||||
|
for (cell = config_errors.head; cell; cell = cell->next)
|
||||||
|
{
|
||||||
|
appendPQExpBuffer(&errors,
|
||||||
|
" %s\n", cell->string);
|
||||||
|
}
|
||||||
|
|
||||||
|
log_detail("%s", errors.data);
|
||||||
|
termPQExpBuffer(&errors);
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
/* The following options cannot be changed */
|
/* The following options cannot be changed */
|
||||||
|
|
||||||
if (new_options.node_id != orig_options->node_id)
|
if (new_options.node_id != orig_options->node_id)
|
||||||
@@ -961,7 +1132,7 @@ reload_config(t_configuration_options *orig_options)
|
|||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
|
||||||
if (strcmp(new_options.node_name, orig_options->node_name) != 0)
|
if (strncmp(new_options.node_name, orig_options->node_name, MAXLEN) != 0)
|
||||||
{
|
{
|
||||||
log_warning(_("\"node_name\" cannot be changed, keeping current configuration"));
|
log_warning(_("\"node_name\" cannot be changed, keeping current configuration"));
|
||||||
return false;
|
return false;
|
||||||
@@ -1005,7 +1176,7 @@ reload_config(t_configuration_options *orig_options)
|
|||||||
}
|
}
|
||||||
|
|
||||||
/* conninfo */
|
/* conninfo */
|
||||||
if (strcmp(orig_options->conninfo, new_options.conninfo) != 0)
|
if (strncmp(orig_options->conninfo, new_options.conninfo, MAXLEN) != 0)
|
||||||
{
|
{
|
||||||
/* Test conninfo string works */
|
/* Test conninfo string works */
|
||||||
conn = establish_db_connection(new_options.conninfo, false);
|
conn = establish_db_connection(new_options.conninfo, false);
|
||||||
@@ -1032,7 +1203,7 @@ reload_config(t_configuration_options *orig_options)
|
|||||||
}
|
}
|
||||||
|
|
||||||
/* event_notification_command */
|
/* event_notification_command */
|
||||||
if (strcmp(orig_options->event_notification_command, new_options.event_notification_command) != 0)
|
if (strncmp(orig_options->event_notification_command, new_options.event_notification_command, MAXLEN) != 0)
|
||||||
{
|
{
|
||||||
strncpy(orig_options->event_notification_command, new_options.event_notification_command, MAXLEN);
|
strncpy(orig_options->event_notification_command, new_options.event_notification_command, MAXLEN);
|
||||||
log_info(_("\"event_notification_command\" is now \"%s\""), new_options.event_notification_command);
|
log_info(_("\"event_notification_command\" is now \"%s\""), new_options.event_notification_command);
|
||||||
@@ -1041,7 +1212,7 @@ reload_config(t_configuration_options *orig_options)
|
|||||||
}
|
}
|
||||||
|
|
||||||
/* event_notifications */
|
/* event_notifications */
|
||||||
if (strcmp(orig_options->event_notifications_orig, new_options.event_notifications_orig) != 0)
|
if (strncmp(orig_options->event_notifications_orig, new_options.event_notifications_orig, MAXLEN) != 0)
|
||||||
{
|
{
|
||||||
strncpy(orig_options->event_notifications_orig, new_options.event_notifications_orig, MAXLEN);
|
strncpy(orig_options->event_notifications_orig, new_options.event_notifications_orig, MAXLEN);
|
||||||
log_info(_("\"event_notifications\" is now \"%s\""), new_options.event_notifications_orig);
|
log_info(_("\"event_notifications\" is now \"%s\""), new_options.event_notifications_orig);
|
||||||
@@ -1061,7 +1232,7 @@ reload_config(t_configuration_options *orig_options)
|
|||||||
}
|
}
|
||||||
|
|
||||||
/* follow_command */
|
/* follow_command */
|
||||||
if (strcmp(orig_options->follow_command, new_options.follow_command) != 0)
|
if (strncmp(orig_options->follow_command, new_options.follow_command, MAXLEN) != 0)
|
||||||
{
|
{
|
||||||
strncpy(orig_options->follow_command, new_options.follow_command, MAXLEN);
|
strncpy(orig_options->follow_command, new_options.follow_command, MAXLEN);
|
||||||
log_info(_("\"follow_command\" is now \"%s\""), new_options.follow_command);
|
log_info(_("\"follow_command\" is now \"%s\""), new_options.follow_command);
|
||||||
@@ -1098,7 +1269,7 @@ reload_config(t_configuration_options *orig_options)
|
|||||||
|
|
||||||
|
|
||||||
/* promote_command */
|
/* promote_command */
|
||||||
if (strcmp(orig_options->promote_command, new_options.promote_command) != 0)
|
if (strncmp(orig_options->promote_command, new_options.promote_command, MAXLEN) != 0)
|
||||||
{
|
{
|
||||||
strncpy(orig_options->promote_command, new_options.promote_command, MAXLEN);
|
strncpy(orig_options->promote_command, new_options.promote_command, MAXLEN);
|
||||||
log_info(_("\"promote_command\" is now \"%s\""), new_options.promote_command);
|
log_info(_("\"promote_command\" is now \"%s\""), new_options.promote_command);
|
||||||
@@ -1106,7 +1277,7 @@ reload_config(t_configuration_options *orig_options)
|
|||||||
config_changed = true;
|
config_changed = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
/* promote_delay */
|
/* promote_delay (for testing use only; not documented */
|
||||||
if (orig_options->promote_delay != new_options.promote_delay)
|
if (orig_options->promote_delay != new_options.promote_delay)
|
||||||
{
|
{
|
||||||
orig_options->promote_delay = new_options.promote_delay;
|
orig_options->promote_delay = new_options.promote_delay;
|
||||||
@@ -1133,23 +1304,32 @@ reload_config(t_configuration_options *orig_options)
|
|||||||
config_changed = true;
|
config_changed = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/* repmgrd_standby_startup_timeout */
|
||||||
|
if (orig_options->repmgrd_standby_startup_timeout != new_options.repmgrd_standby_startup_timeout)
|
||||||
|
{
|
||||||
|
orig_options->repmgrd_standby_startup_timeout = new_options.repmgrd_standby_startup_timeout;
|
||||||
|
log_info(_("\"repmgrd_standby_startup_timeout\" is now \"%i\""), new_options.repmgrd_standby_startup_timeout);
|
||||||
|
|
||||||
|
config_changed = true;
|
||||||
|
}
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* Handle changes to logging configuration
|
* Handle changes to logging configuration
|
||||||
*/
|
*/
|
||||||
|
|
||||||
/* log_facility */
|
/* log_facility */
|
||||||
if (strcmp(orig_options->log_facility, new_options.log_facility) != 0)
|
if (strncmp(orig_options->log_facility, new_options.log_facility, MAXLEN) != 0)
|
||||||
{
|
{
|
||||||
strcpy(orig_options->log_facility, new_options.log_facility);
|
strncpy(orig_options->log_facility, new_options.log_facility, MAXLEN);
|
||||||
log_info(_("\"log_facility\" is now \"%s\""), new_options.log_facility);
|
log_info(_("\"log_facility\" is now \"%s\""), new_options.log_facility);
|
||||||
|
|
||||||
log_config_changed = true;
|
log_config_changed = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
/* log_file */
|
/* log_file */
|
||||||
if (strcmp(orig_options->log_file, new_options.log_file) != 0)
|
if (strncmp(orig_options->log_file, new_options.log_file, MAXLEN) != 0)
|
||||||
{
|
{
|
||||||
strcpy(orig_options->log_file, new_options.log_file);
|
strncpy(orig_options->log_file, new_options.log_file, MAXLEN);
|
||||||
log_info(_("\"log_file\" is now \"%s\""), new_options.log_file);
|
log_info(_("\"log_file\" is now \"%s\""), new_options.log_file);
|
||||||
|
|
||||||
log_config_changed = true;
|
log_config_changed = true;
|
||||||
@@ -1157,9 +1337,9 @@ reload_config(t_configuration_options *orig_options)
|
|||||||
|
|
||||||
|
|
||||||
/* log_level */
|
/* log_level */
|
||||||
if (strcmp(orig_options->log_level, new_options.log_level) != 0)
|
if (strncmp(orig_options->log_level, new_options.log_level, MAXLEN) != 0)
|
||||||
{
|
{
|
||||||
strcpy(orig_options->log_level, new_options.log_level);
|
strncpy(orig_options->log_level, new_options.log_level, MAXLEN);
|
||||||
log_info(_("\"log_level\" is now \"%s\""), new_options.log_level);
|
log_info(_("\"log_level\" is now \"%s\""), new_options.log_level);
|
||||||
|
|
||||||
log_config_changed = true;
|
log_config_changed = true;
|
||||||
@@ -1225,13 +1405,23 @@ exit_with_config_file_errors(ItemList *config_errors, ItemList *config_warnings,
|
|||||||
|
|
||||||
|
|
||||||
void
|
void
|
||||||
exit_with_cli_errors(ItemList *error_list)
|
exit_with_cli_errors(ItemList *error_list, const char *repmgr_command)
|
||||||
{
|
{
|
||||||
fprintf(stderr, _("The following command line errors were encountered:\n"));
|
fprintf(stderr, _("The following command line errors were encountered:\n"));
|
||||||
|
|
||||||
print_item_list(error_list);
|
print_item_list(error_list);
|
||||||
|
|
||||||
fprintf(stderr, _("Try \"%s --help\" for more information.\n"), progname());
|
if (repmgr_command != NULL)
|
||||||
|
{
|
||||||
|
fprintf(stderr, _("Try \"%s --help\" or \"%s %s --help\" for more information.\n"),
|
||||||
|
progname(),
|
||||||
|
progname(),
|
||||||
|
repmgr_command);
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
fprintf(stderr, _("Try \"%s --help\" for more information.\n"), progname());
|
||||||
|
}
|
||||||
|
|
||||||
exit(ERR_BAD_CONFIG);
|
exit(ERR_BAD_CONFIG);
|
||||||
}
|
}
|
||||||
@@ -1336,11 +1526,14 @@ repmgr_atoi(const char *value, const char *config_item, ItemList *error_list, in
|
|||||||
*
|
*
|
||||||
* https://www.postgresql.org/docs/current/static/config-setting.html
|
* https://www.postgresql.org/docs/current/static/config-setting.html
|
||||||
*/
|
*/
|
||||||
static bool
|
bool
|
||||||
parse_bool(const char *s, const char *config_item, ItemList *error_list)
|
parse_bool(const char *s, const char *config_item, ItemList *error_list)
|
||||||
{
|
{
|
||||||
PQExpBufferData errors;
|
PQExpBufferData errors;
|
||||||
|
|
||||||
|
if (s == NULL)
|
||||||
|
return true;
|
||||||
|
|
||||||
if (strcasecmp(s, "0") == 0)
|
if (strcasecmp(s, "0") == 0)
|
||||||
return false;
|
return false;
|
||||||
|
|
||||||
@@ -1533,31 +1726,112 @@ clear_event_notification_list(t_configuration_options *options)
|
|||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
bool
|
int
|
||||||
parse_pg_basebackup_options(const char *pg_basebackup_options, t_basebackup_options *backup_options, int server_version_num, ItemList *error_list)
|
parse_output_to_argv(const char *string, char ***argv_array)
|
||||||
{
|
{
|
||||||
int options_len = 0;
|
int options_len = 0;
|
||||||
char *options_string = NULL;
|
char *options_string = NULL;
|
||||||
char *options_string_ptr = NULL;
|
char *options_string_ptr = NULL;
|
||||||
|
int c = 1,
|
||||||
|
argc_item = 1;
|
||||||
|
char *argv_item = NULL;
|
||||||
|
char **local_argv_array = NULL;
|
||||||
|
ItemListCell *cell;
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* Add parsed options to this list, then copy to an array to pass to
|
* Add parsed options to this list, then copy to an array to pass to
|
||||||
* getopt
|
* getopt
|
||||||
*/
|
*/
|
||||||
static ItemList option_argv = {NULL, NULL};
|
ItemList option_argv = {NULL, NULL};
|
||||||
|
|
||||||
char *argv_item = NULL;
|
options_len = strlen(string) + 1;
|
||||||
int c,
|
options_string = pg_malloc0(options_len);
|
||||||
argc_item = 1;
|
options_string_ptr = options_string;
|
||||||
|
|
||||||
|
/* Copy the string before operating on it with strtok() */
|
||||||
|
strncpy(options_string, string, options_len);
|
||||||
|
|
||||||
|
/* Extract arguments into a list and keep a count of the total */
|
||||||
|
while ((argv_item = strtok(options_string_ptr, " ")) != NULL)
|
||||||
|
{
|
||||||
|
item_list_append(&option_argv, trim(argv_item));
|
||||||
|
|
||||||
|
argc_item++;
|
||||||
|
|
||||||
|
if (options_string_ptr != NULL)
|
||||||
|
options_string_ptr = NULL;
|
||||||
|
}
|
||||||
|
|
||||||
|
pfree(options_string);
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Array of argument values to pass to getopt_long - this will need to
|
||||||
|
* include an empty string as the first value (normally this would be the
|
||||||
|
* program name)
|
||||||
|
*/
|
||||||
|
local_argv_array = pg_malloc0(sizeof(char *) * (argc_item + 2));
|
||||||
|
|
||||||
|
/* Insert a blank dummy program name at the start of the array */
|
||||||
|
local_argv_array[0] = pg_malloc0(1);
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Copy the previously extracted arguments from our list to the array
|
||||||
|
*/
|
||||||
|
for (cell = option_argv.head; cell; cell = cell->next)
|
||||||
|
{
|
||||||
|
int argv_len = strlen(cell->string) + 1;
|
||||||
|
|
||||||
|
local_argv_array[c] = (char *)pg_malloc0(argv_len);
|
||||||
|
|
||||||
|
strncpy(local_argv_array[c], cell->string, argv_len);
|
||||||
|
|
||||||
|
c++;
|
||||||
|
}
|
||||||
|
|
||||||
|
local_argv_array[c] = NULL;
|
||||||
|
|
||||||
|
item_list_free(&option_argv);
|
||||||
|
|
||||||
|
*argv_array = local_argv_array;
|
||||||
|
|
||||||
|
return argc_item;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
void
|
||||||
|
free_parsed_argv(char ***argv_array)
|
||||||
|
{
|
||||||
|
char **local_argv_array = *argv_array;
|
||||||
|
int i = 0;
|
||||||
|
|
||||||
|
while (local_argv_array[i] != NULL)
|
||||||
|
{
|
||||||
|
pfree((char *)local_argv_array[i]);
|
||||||
|
i++;
|
||||||
|
}
|
||||||
|
|
||||||
|
pfree((char **)local_argv_array);
|
||||||
|
*argv_array = NULL;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
bool
|
||||||
|
parse_pg_basebackup_options(const char *pg_basebackup_options, t_basebackup_options *backup_options, int server_version_num, ItemList *error_list)
|
||||||
|
{
|
||||||
|
bool backup_options_ok = true;
|
||||||
|
|
||||||
|
int c = 0,
|
||||||
|
argc_item = 0;
|
||||||
|
|
||||||
char **argv_array = NULL;
|
char **argv_array = NULL;
|
||||||
ItemListCell *cell = NULL;
|
|
||||||
|
|
||||||
int optindex = 0;
|
int optindex = 0;
|
||||||
|
|
||||||
struct option *long_options = NULL;
|
struct option *long_options = NULL;
|
||||||
|
|
||||||
bool backup_options_ok = true;
|
|
||||||
|
|
||||||
/* We're only interested in these options */
|
/* We're only interested in these options */
|
||||||
static struct option long_options_9[] =
|
static struct option long_options_9[] =
|
||||||
@@ -1583,56 +1857,12 @@ parse_pg_basebackup_options(const char *pg_basebackup_options, t_basebackup_opti
|
|||||||
if (!strlen(pg_basebackup_options))
|
if (!strlen(pg_basebackup_options))
|
||||||
return backup_options_ok;
|
return backup_options_ok;
|
||||||
|
|
||||||
options_len = strlen(pg_basebackup_options) + 1;
|
|
||||||
options_string = pg_malloc(options_len);
|
|
||||||
options_string_ptr = options_string;
|
|
||||||
|
|
||||||
if (server_version_num >= 100000)
|
if (server_version_num >= 100000)
|
||||||
long_options = long_options_10;
|
long_options = long_options_10;
|
||||||
else
|
else
|
||||||
long_options = long_options_9;
|
long_options = long_options_9;
|
||||||
|
|
||||||
/* Copy the string before operating on it with strtok() */
|
argc_item = parse_output_to_argv(pg_basebackup_options, &argv_array);
|
||||||
strncpy(options_string, pg_basebackup_options, options_len);
|
|
||||||
|
|
||||||
/* Extract arguments into a list and keep a count of the total */
|
|
||||||
while ((argv_item = strtok(options_string_ptr, " ")) != NULL)
|
|
||||||
{
|
|
||||||
item_list_append(&option_argv, argv_item);
|
|
||||||
|
|
||||||
argc_item++;
|
|
||||||
|
|
||||||
if (options_string_ptr != NULL)
|
|
||||||
options_string_ptr = NULL;
|
|
||||||
}
|
|
||||||
|
|
||||||
/*
|
|
||||||
* Array of argument values to pass to getopt_long - this will need to
|
|
||||||
* include an empty string as the first value (normally this would be the
|
|
||||||
* program name)
|
|
||||||
*/
|
|
||||||
argv_array = pg_malloc0(sizeof(char *) * (argc_item + 2));
|
|
||||||
|
|
||||||
/* Insert a blank dummy program name at the start of the array */
|
|
||||||
argv_array[0] = pg_malloc0(1);
|
|
||||||
|
|
||||||
c = 1;
|
|
||||||
|
|
||||||
/*
|
|
||||||
* Copy the previously extracted arguments from our list to the array
|
|
||||||
*/
|
|
||||||
for (cell = option_argv.head; cell; cell = cell->next)
|
|
||||||
{
|
|
||||||
int argv_len = strlen(cell->string) + 1;
|
|
||||||
|
|
||||||
argv_array[c] = pg_malloc0(argv_len);
|
|
||||||
|
|
||||||
strncpy(argv_array[c], cell->string, argv_len);
|
|
||||||
|
|
||||||
c++;
|
|
||||||
}
|
|
||||||
|
|
||||||
argv_array[c] = NULL;
|
|
||||||
|
|
||||||
/* Reset getopt's optind variable */
|
/* Reset getopt's optind variable */
|
||||||
optind = 0;
|
optind = 0;
|
||||||
@@ -1676,15 +1906,7 @@ parse_pg_basebackup_options(const char *pg_basebackup_options, t_basebackup_opti
|
|||||||
backup_options_ok = false;
|
backup_options_ok = false;
|
||||||
}
|
}
|
||||||
|
|
||||||
pfree(options_string);
|
free_parsed_argv(&argv_array);
|
||||||
|
|
||||||
{
|
|
||||||
int i;
|
|
||||||
|
|
||||||
for (i = 0; i < argc_item + 2; i++)
|
|
||||||
pfree(argv_array[i]);
|
|
||||||
}
|
|
||||||
pfree(argv_array);
|
|
||||||
|
|
||||||
return backup_options_ok;
|
return backup_options_ok;
|
||||||
}
|
}
|
||||||
|
|||||||
65
configfile.h
65
configfile.h
@@ -1,7 +1,7 @@
|
|||||||
/*
|
/*
|
||||||
* configfile.h
|
* configfile.h
|
||||||
*
|
*
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
* Copyright (c) 2ndQuadrant, 2010-2018
|
||||||
*
|
*
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
@@ -73,7 +73,9 @@ typedef struct
|
|||||||
char conninfo[MAXLEN];
|
char conninfo[MAXLEN];
|
||||||
char replication_user[NAMEDATALEN];
|
char replication_user[NAMEDATALEN];
|
||||||
char data_directory[MAXPGPATH];
|
char data_directory[MAXPGPATH];
|
||||||
|
char config_directory[MAXPGPATH];
|
||||||
char pg_bindir[MAXPGPATH];
|
char pg_bindir[MAXPGPATH];
|
||||||
|
char repmgr_bindir[MAXPGPATH];
|
||||||
int replication_type;
|
int replication_type;
|
||||||
|
|
||||||
/* log settings */
|
/* log settings */
|
||||||
@@ -82,14 +84,31 @@ typedef struct
|
|||||||
char log_file[MAXLEN];
|
char log_file[MAXLEN];
|
||||||
int log_status_interval;
|
int log_status_interval;
|
||||||
|
|
||||||
/* standby action settings */
|
/* standby clone settings */
|
||||||
bool use_replication_slots;
|
bool use_replication_slots;
|
||||||
char pg_basebackup_options[MAXLEN];
|
char pg_basebackup_options[MAXLEN];
|
||||||
char restore_command[MAXLEN];
|
char restore_command[MAXLEN];
|
||||||
TablespaceList tablespace_mapping;
|
TablespaceList tablespace_mapping;
|
||||||
char recovery_min_apply_delay[MAXLEN];
|
char recovery_min_apply_delay[MAXLEN];
|
||||||
bool recovery_min_apply_delay_provided;
|
bool recovery_min_apply_delay_provided;
|
||||||
|
char archive_cleanup_command[MAXLEN];
|
||||||
bool use_primary_conninfo_password;
|
bool use_primary_conninfo_password;
|
||||||
|
char passfile[MAXPGPATH];
|
||||||
|
|
||||||
|
/* standby promote settings */
|
||||||
|
int promote_check_timeout;
|
||||||
|
int promote_check_interval;
|
||||||
|
|
||||||
|
/* standby follow settings */
|
||||||
|
int primary_follow_timeout;
|
||||||
|
int standby_follow_timeout;
|
||||||
|
|
||||||
|
/* standby switchover settings */
|
||||||
|
int shutdown_check_timeout;
|
||||||
|
int standby_reconnect_timeout;
|
||||||
|
|
||||||
|
/* node rejoin settings */
|
||||||
|
int node_rejoin_timeout;
|
||||||
|
|
||||||
/* node check settings */
|
/* node check settings */
|
||||||
int archive_ready_warning;
|
int archive_ready_warning;
|
||||||
@@ -97,6 +116,9 @@ typedef struct
|
|||||||
int replication_lag_warning;
|
int replication_lag_warning;
|
||||||
int replication_lag_critical;
|
int replication_lag_critical;
|
||||||
|
|
||||||
|
/* witness settings */
|
||||||
|
int witness_sync_interval;
|
||||||
|
|
||||||
/* repmgrd settings */
|
/* repmgrd settings */
|
||||||
failover_mode_opt failover;
|
failover_mode_opt failover;
|
||||||
char location[MAXLEN];
|
char location[MAXLEN];
|
||||||
@@ -110,7 +132,8 @@ typedef struct
|
|||||||
int degraded_monitoring_timeout;
|
int degraded_monitoring_timeout;
|
||||||
int async_query_timeout;
|
int async_query_timeout;
|
||||||
int primary_notification_timeout;
|
int primary_notification_timeout;
|
||||||
int primary_follow_timeout;
|
int repmgrd_standby_startup_timeout;
|
||||||
|
char repmgrd_pid_file[MAXPGPATH];
|
||||||
|
|
||||||
/* BDR settings */
|
/* BDR settings */
|
||||||
bool bdr_local_monitoring_only;
|
bool bdr_local_monitoring_only;
|
||||||
@@ -149,14 +172,26 @@ typedef struct
|
|||||||
|
|
||||||
#define T_CONFIGURATION_OPTIONS_INITIALIZER { \
|
#define T_CONFIGURATION_OPTIONS_INITIALIZER { \
|
||||||
/* node information */ \
|
/* node information */ \
|
||||||
UNKNOWN_NODE_ID, "", "", "", "", "", REPLICATION_TYPE_PHYSICAL, \
|
UNKNOWN_NODE_ID, "", "", "", "", "", "", "", REPLICATION_TYPE_PHYSICAL, \
|
||||||
/* log settings */ \
|
/* log settings */ \
|
||||||
"", "", "", DEFAULT_LOG_STATUS_INTERVAL, \
|
"", "", "", DEFAULT_LOG_STATUS_INTERVAL, \
|
||||||
/* standby action settings */ \
|
/* standby clone settings */ \
|
||||||
false, "", "", { NULL, NULL }, "", false, false, \
|
false, "", "", { NULL, NULL }, "", false, "", false, "", \
|
||||||
|
/* standby promote settings */ \
|
||||||
|
DEFAULT_PROMOTE_CHECK_TIMEOUT, DEFAULT_PROMOTE_CHECK_INTERVAL, \
|
||||||
|
/* standby follow settings */ \
|
||||||
|
DEFAULT_PRIMARY_FOLLOW_TIMEOUT, \
|
||||||
|
DEFAULT_STANDBY_FOLLOW_TIMEOUT, \
|
||||||
|
/* standby switchover settings */ \
|
||||||
|
DEFAULT_SHUTDOWN_CHECK_TIMEOUT, \
|
||||||
|
DEFAULT_STANDBY_RECONNECT_TIMEOUT, \
|
||||||
|
/* node rejoin settings */ \
|
||||||
|
DEFAULT_NODE_REJOIN_TIMEOUT, \
|
||||||
/* node check settings */ \
|
/* node check settings */ \
|
||||||
DEFAULT_ARCHIVE_READY_WARNING, DEFAULT_ARCHIVE_READY_CRITICAL, \
|
DEFAULT_ARCHIVE_READY_WARNING, DEFAULT_ARCHIVE_READY_CRITICAL, \
|
||||||
DEFAULT_REPLICATION_LAG_WARNING, DEFAULT_REPLICATION_LAG_CRITICAL, \
|
DEFAULT_REPLICATION_LAG_WARNING, DEFAULT_REPLICATION_LAG_CRITICAL, \
|
||||||
|
/* witness settings */ \
|
||||||
|
DEFAULT_WITNESS_SYNC_INTERVAL, \
|
||||||
/* repmgrd settings */ \
|
/* repmgrd settings */ \
|
||||||
FAILOVER_MANUAL, DEFAULT_LOCATION, DEFAULT_PRIORITY, "", "", \
|
FAILOVER_MANUAL, DEFAULT_LOCATION, DEFAULT_PRIORITY, "", "", \
|
||||||
DEFAULT_MONITORING_INTERVAL, \
|
DEFAULT_MONITORING_INTERVAL, \
|
||||||
@@ -165,7 +200,7 @@ typedef struct
|
|||||||
false, -1, \
|
false, -1, \
|
||||||
DEFAULT_ASYNC_QUERY_TIMEOUT, \
|
DEFAULT_ASYNC_QUERY_TIMEOUT, \
|
||||||
DEFAULT_PRIMARY_NOTIFICATION_TIMEOUT, \
|
DEFAULT_PRIMARY_NOTIFICATION_TIMEOUT, \
|
||||||
DEFAULT_PRIMARY_FOLLOW_TIMEOUT, \
|
-1, "", \
|
||||||
/* BDR settings */ \
|
/* BDR settings */ \
|
||||||
false, DEFAULT_BDR_RECOVERY_TIMEOUT, \
|
false, DEFAULT_BDR_RECOVERY_TIMEOUT, \
|
||||||
/* service settings */ \
|
/* service settings */ \
|
||||||
@@ -241,30 +276,36 @@ typedef struct
|
|||||||
"", "", "", "" \
|
"", "", "", "" \
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#include "dbutils.h"
|
||||||
|
|
||||||
void set_progname(const char *argv0);
|
void set_progname(const char *argv0);
|
||||||
const char *progname(void);
|
const char *progname(void);
|
||||||
|
|
||||||
void load_config(const char *config_file, bool verbose, bool terse, t_configuration_options *options, char *argv0);
|
void load_config(const char *config_file, bool verbose, bool terse, t_configuration_options *options, char *argv0);
|
||||||
void parse_config(t_configuration_options *options, bool terse);
|
bool reload_config(t_configuration_options *orig_options, t_server_type server_type);
|
||||||
bool reload_config(t_configuration_options *orig_options);
|
|
||||||
|
|
||||||
bool parse_recovery_conf(const char *data_dir, t_recovery_conf *conf);
|
bool parse_recovery_conf(const char *data_dir, t_recovery_conf *conf);
|
||||||
|
|
||||||
|
bool parse_bool(const char *s,
|
||||||
|
const char *config_item,
|
||||||
|
ItemList *error_list);
|
||||||
|
|
||||||
int repmgr_atoi(const char *s,
|
int repmgr_atoi(const char *s,
|
||||||
const char *config_item,
|
const char *config_item,
|
||||||
ItemList *error_list,
|
ItemList *error_list,
|
||||||
int minval);
|
int minval);
|
||||||
|
|
||||||
|
|
||||||
bool parse_pg_basebackup_options(const char *pg_basebackup_options,
|
bool parse_pg_basebackup_options(const char *pg_basebackup_options,
|
||||||
t_basebackup_options *backup_options,
|
t_basebackup_options *backup_options,
|
||||||
int server_version_num,
|
int server_version_num,
|
||||||
ItemList *error_list);
|
ItemList *error_list);
|
||||||
|
|
||||||
|
int parse_output_to_argv(const char *string, char ***argv_array);
|
||||||
|
void free_parsed_argv(char ***argv_array);
|
||||||
|
|
||||||
|
|
||||||
/* called by repmgr-client and repmgrd */
|
/* called by repmgr-client and repmgrd */
|
||||||
void exit_with_cli_errors(ItemList *error_list);
|
void exit_with_cli_errors(ItemList *error_list, const char *repmgr_command);
|
||||||
void print_item_list(ItemList *item_list);
|
void print_item_list(ItemList *item_list);
|
||||||
|
|
||||||
#endif /* _REPMGR_CONFIGFILE_H_ */
|
#endif /* _REPMGR_CONFIGFILE_H_ */
|
||||||
|
|||||||
42
configure
vendored
42
configure
vendored
@@ -1,6 +1,6 @@
|
|||||||
#! /bin/sh
|
#! /bin/sh
|
||||||
# Guess values for system-dependent variables and create Makefiles.
|
# Guess values for system-dependent variables and create Makefiles.
|
||||||
# Generated by GNU Autoconf 2.69 for repmgr 4.0.
|
# Generated by GNU Autoconf 2.69 for repmgr 4.2.
|
||||||
#
|
#
|
||||||
# Report bugs to <pgsql-bugs@postgresql.org>.
|
# Report bugs to <pgsql-bugs@postgresql.org>.
|
||||||
#
|
#
|
||||||
@@ -11,7 +11,7 @@
|
|||||||
# This configure script is free software; the Free Software Foundation
|
# This configure script is free software; the Free Software Foundation
|
||||||
# gives unlimited permission to copy, distribute and modify it.
|
# gives unlimited permission to copy, distribute and modify it.
|
||||||
#
|
#
|
||||||
# Copyright (c) 2010-2017, 2ndQuadrant Ltd.
|
# Copyright (c) 2010-2018, 2ndQuadrant Ltd.
|
||||||
## -------------------- ##
|
## -------------------- ##
|
||||||
## M4sh Initialization. ##
|
## M4sh Initialization. ##
|
||||||
## -------------------- ##
|
## -------------------- ##
|
||||||
@@ -582,8 +582,8 @@ MAKEFLAGS=
|
|||||||
# Identity of this package.
|
# Identity of this package.
|
||||||
PACKAGE_NAME='repmgr'
|
PACKAGE_NAME='repmgr'
|
||||||
PACKAGE_TARNAME='repmgr'
|
PACKAGE_TARNAME='repmgr'
|
||||||
PACKAGE_VERSION='4.0'
|
PACKAGE_VERSION='4.2'
|
||||||
PACKAGE_STRING='repmgr 4.0'
|
PACKAGE_STRING='repmgr 4.2'
|
||||||
PACKAGE_BUGREPORT='pgsql-bugs@postgresql.org'
|
PACKAGE_BUGREPORT='pgsql-bugs@postgresql.org'
|
||||||
PACKAGE_URL='https://2ndquadrant.com/en/resources/repmgr/'
|
PACKAGE_URL='https://2ndquadrant.com/en/resources/repmgr/'
|
||||||
|
|
||||||
@@ -633,7 +633,6 @@ SHELL'
|
|||||||
ac_subst_files=''
|
ac_subst_files=''
|
||||||
ac_user_opts='
|
ac_user_opts='
|
||||||
enable_option_checking
|
enable_option_checking
|
||||||
with_bdr_only
|
|
||||||
'
|
'
|
||||||
ac_precious_vars='build_alias
|
ac_precious_vars='build_alias
|
||||||
host_alias
|
host_alias
|
||||||
@@ -1179,7 +1178,7 @@ if test "$ac_init_help" = "long"; then
|
|||||||
# Omit some internal or obsolete options to make the list less imposing.
|
# Omit some internal or obsolete options to make the list less imposing.
|
||||||
# This message is too long to be a string in the A/UX 3.1 sh.
|
# This message is too long to be a string in the A/UX 3.1 sh.
|
||||||
cat <<_ACEOF
|
cat <<_ACEOF
|
||||||
\`configure' configures repmgr 4.0 to adapt to many kinds of systems.
|
\`configure' configures repmgr 4.2 to adapt to many kinds of systems.
|
||||||
|
|
||||||
Usage: $0 [OPTION]... [VAR=VALUE]...
|
Usage: $0 [OPTION]... [VAR=VALUE]...
|
||||||
|
|
||||||
@@ -1240,15 +1239,10 @@ fi
|
|||||||
|
|
||||||
if test -n "$ac_init_help"; then
|
if test -n "$ac_init_help"; then
|
||||||
case $ac_init_help in
|
case $ac_init_help in
|
||||||
short | recursive ) echo "Configuration of repmgr 4.0:";;
|
short | recursive ) echo "Configuration of repmgr 4.2:";;
|
||||||
esac
|
esac
|
||||||
cat <<\_ACEOF
|
cat <<\_ACEOF
|
||||||
|
|
||||||
Optional Packages:
|
|
||||||
--with-PACKAGE[=ARG] use PACKAGE [ARG=yes]
|
|
||||||
--without-PACKAGE do not use PACKAGE (same as --with-PACKAGE=no)
|
|
||||||
--with-bdr-only BDR-only build
|
|
||||||
|
|
||||||
Some influential environment variables:
|
Some influential environment variables:
|
||||||
PG_CONFIG Location to find pg_config for target PostgreSQL (default PATH)
|
PG_CONFIG Location to find pg_config for target PostgreSQL (default PATH)
|
||||||
|
|
||||||
@@ -1319,14 +1313,14 @@ fi
|
|||||||
test -n "$ac_init_help" && exit $ac_status
|
test -n "$ac_init_help" && exit $ac_status
|
||||||
if $ac_init_version; then
|
if $ac_init_version; then
|
||||||
cat <<\_ACEOF
|
cat <<\_ACEOF
|
||||||
repmgr configure 4.0
|
repmgr configure 4.2
|
||||||
generated by GNU Autoconf 2.69
|
generated by GNU Autoconf 2.69
|
||||||
|
|
||||||
Copyright (C) 2012 Free Software Foundation, Inc.
|
Copyright (C) 2012 Free Software Foundation, Inc.
|
||||||
This configure script is free software; the Free Software Foundation
|
This configure script is free software; the Free Software Foundation
|
||||||
gives unlimited permission to copy, distribute and modify it.
|
gives unlimited permission to copy, distribute and modify it.
|
||||||
|
|
||||||
Copyright (c) 2010-2017, 2ndQuadrant Ltd.
|
Copyright (c) 2010-2018, 2ndQuadrant Ltd.
|
||||||
_ACEOF
|
_ACEOF
|
||||||
exit
|
exit
|
||||||
fi
|
fi
|
||||||
@@ -1338,7 +1332,7 @@ cat >config.log <<_ACEOF
|
|||||||
This file contains any messages produced by compilers while
|
This file contains any messages produced by compilers while
|
||||||
running configure, to aid debugging if configure makes a mistake.
|
running configure, to aid debugging if configure makes a mistake.
|
||||||
|
|
||||||
It was created by repmgr $as_me 4.0, which was
|
It was created by repmgr $as_me 4.2, which was
|
||||||
generated by GNU Autoconf 2.69. Invocation command line was
|
generated by GNU Autoconf 2.69. Invocation command line was
|
||||||
|
|
||||||
$ $0 $@
|
$ $0 $@
|
||||||
@@ -1694,20 +1688,6 @@ ac_config_headers="$ac_config_headers config.h"
|
|||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
# Check whether --with-bdr_only was given.
|
|
||||||
if test "${with_bdr_only+set}" = set; then :
|
|
||||||
withval=$with_bdr_only;
|
|
||||||
fi
|
|
||||||
|
|
||||||
if test "x$with_bdr_only" != "x"; then :
|
|
||||||
|
|
||||||
$as_echo "#define BDR_ONLY \"1\"" >>confdefs.h
|
|
||||||
|
|
||||||
|
|
||||||
fi
|
|
||||||
|
|
||||||
|
|
||||||
{ $as_echo "$as_me:${as_lineno-$LINENO}: checking for a sed that does not truncate output" >&5
|
{ $as_echo "$as_me:${as_lineno-$LINENO}: checking for a sed that does not truncate output" >&5
|
||||||
$as_echo_n "checking for a sed that does not truncate output... " >&6; }
|
$as_echo_n "checking for a sed that does not truncate output... " >&6; }
|
||||||
if ${ac_cv_path_SED+:} false; then :
|
if ${ac_cv_path_SED+:} false; then :
|
||||||
@@ -2379,7 +2359,7 @@ cat >>$CONFIG_STATUS <<\_ACEOF || ac_write_fail=1
|
|||||||
# report actual input values of CONFIG_FILES etc. instead of their
|
# report actual input values of CONFIG_FILES etc. instead of their
|
||||||
# values after options handling.
|
# values after options handling.
|
||||||
ac_log="
|
ac_log="
|
||||||
This file was extended by repmgr $as_me 4.0, which was
|
This file was extended by repmgr $as_me 4.2, which was
|
||||||
generated by GNU Autoconf 2.69. Invocation command line was
|
generated by GNU Autoconf 2.69. Invocation command line was
|
||||||
|
|
||||||
CONFIG_FILES = $CONFIG_FILES
|
CONFIG_FILES = $CONFIG_FILES
|
||||||
@@ -2442,7 +2422,7 @@ _ACEOF
|
|||||||
cat >>$CONFIG_STATUS <<_ACEOF || ac_write_fail=1
|
cat >>$CONFIG_STATUS <<_ACEOF || ac_write_fail=1
|
||||||
ac_cs_config="`$as_echo "$ac_configure_args" | sed 's/^ //; s/[\\""\`\$]/\\\\&/g'`"
|
ac_cs_config="`$as_echo "$ac_configure_args" | sed 's/^ //; s/[\\""\`\$]/\\\\&/g'`"
|
||||||
ac_cs_version="\\
|
ac_cs_version="\\
|
||||||
repmgr config.status 4.0
|
repmgr config.status 4.2
|
||||||
configured by $0, generated by GNU Autoconf 2.69,
|
configured by $0, generated by GNU Autoconf 2.69,
|
||||||
with options \\"\$ac_cs_config\\"
|
with options \\"\$ac_cs_config\\"
|
||||||
|
|
||||||
|
|||||||
10
configure.in
10
configure.in
@@ -1,17 +1,11 @@
|
|||||||
AC_INIT([repmgr], [4.0], [pgsql-bugs@postgresql.org], [repmgr], [https://2ndquadrant.com/en/resources/repmgr/])
|
AC_INIT([repmgr], [4.2], [pgsql-bugs@postgresql.org], [repmgr], [https://2ndquadrant.com/en/resources/repmgr/])
|
||||||
|
|
||||||
AC_COPYRIGHT([Copyright (c) 2010-2017, 2ndQuadrant Ltd.])
|
AC_COPYRIGHT([Copyright (c) 2010-2018, 2ndQuadrant Ltd.])
|
||||||
|
|
||||||
AC_CONFIG_HEADER(config.h)
|
AC_CONFIG_HEADER(config.h)
|
||||||
|
|
||||||
AC_ARG_VAR([PG_CONFIG], [Location to find pg_config for target PostgreSQL (default PATH)])
|
AC_ARG_VAR([PG_CONFIG], [Location to find pg_config for target PostgreSQL (default PATH)])
|
||||||
|
|
||||||
AC_ARG_WITH([bdr_only], [AS_HELP_STRING([--with-bdr-only], [BDR-only build])])
|
|
||||||
AS_IF([test "x$with_bdr_only" != "x"],
|
|
||||||
[AC_DEFINE([BDR_ONLY], ["1"], [Only build repmgr for BDR])]
|
|
||||||
)
|
|
||||||
|
|
||||||
|
|
||||||
AC_PROG_SED
|
AC_PROG_SED
|
||||||
|
|
||||||
if test -z "$PG_CONFIG"; then
|
if test -z "$PG_CONFIG"; then
|
||||||
|
|||||||
159
controldata.c
159
controldata.c
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* controldata.c
|
* controldata.c
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
* Copyright (c) 2ndQuadrant, 2010-2018
|
||||||
*
|
*
|
||||||
* Portions Copyright (c) 1996-2016, PostgreSQL Global Development Group
|
* Portions Copyright (c) 1996-2016, PostgreSQL Global Development Group
|
||||||
* Portions Copyright (c) 1994, Regents of the University of California
|
* Portions Copyright (c) 1994, Regents of the University of California
|
||||||
@@ -37,13 +37,8 @@ get_system_identifier(const char *data_directory)
|
|||||||
uint64 system_identifier = UNKNOWN_SYSTEM_IDENTIFIER;
|
uint64 system_identifier = UNKNOWN_SYSTEM_IDENTIFIER;
|
||||||
|
|
||||||
control_file_info = get_controlfile(data_directory);
|
control_file_info = get_controlfile(data_directory);
|
||||||
|
system_identifier = control_file_info->system_identifier;
|
||||||
|
|
||||||
if (control_file_info->control_file_processed == true)
|
|
||||||
system_identifier = control_file_info->control_file->system_identifier;
|
|
||||||
else
|
|
||||||
system_identifier = UNKNOWN_SYSTEM_IDENTIFIER;
|
|
||||||
|
|
||||||
pfree(control_file_info->control_file);
|
|
||||||
pfree(control_file_info);
|
pfree(control_file_info);
|
||||||
|
|
||||||
return system_identifier;
|
return system_identifier;
|
||||||
@@ -57,13 +52,8 @@ get_db_state(const char *data_directory)
|
|||||||
|
|
||||||
control_file_info = get_controlfile(data_directory);
|
control_file_info = get_controlfile(data_directory);
|
||||||
|
|
||||||
if (control_file_info->control_file_processed == true)
|
state = control_file_info->state;
|
||||||
state = control_file_info->control_file->state;
|
|
||||||
else
|
|
||||||
/* if we were unable to parse the control file, assume DB is shut down */
|
|
||||||
state = DB_SHUTDOWNED;
|
|
||||||
|
|
||||||
pfree(control_file_info->control_file);
|
|
||||||
pfree(control_file_info);
|
pfree(control_file_info);
|
||||||
|
|
||||||
return state;
|
return state;
|
||||||
@@ -78,12 +68,8 @@ get_latest_checkpoint_location(const char *data_directory)
|
|||||||
|
|
||||||
control_file_info = get_controlfile(data_directory);
|
control_file_info = get_controlfile(data_directory);
|
||||||
|
|
||||||
if (control_file_info->control_file_processed == false)
|
checkPoint = control_file_info->checkPoint;
|
||||||
return InvalidXLogRecPtr;
|
|
||||||
|
|
||||||
checkPoint = control_file_info->control_file->checkPoint;
|
|
||||||
|
|
||||||
pfree(control_file_info->control_file);
|
|
||||||
pfree(control_file_info);
|
pfree(control_file_info);
|
||||||
|
|
||||||
return checkPoint;
|
return checkPoint;
|
||||||
@@ -98,16 +84,8 @@ get_data_checksum_version(const char *data_directory)
|
|||||||
|
|
||||||
control_file_info = get_controlfile(data_directory);
|
control_file_info = get_controlfile(data_directory);
|
||||||
|
|
||||||
if (control_file_info->control_file_processed == false)
|
data_checksum_version = (int) control_file_info->data_checksum_version;
|
||||||
{
|
|
||||||
data_checksum_version = -1;
|
|
||||||
}
|
|
||||||
else
|
|
||||||
{
|
|
||||||
data_checksum_version = (int) control_file_info->control_file->data_checksum_version;
|
|
||||||
}
|
|
||||||
|
|
||||||
pfree(control_file_info->control_file);
|
|
||||||
pfree(control_file_info);
|
pfree(control_file_info);
|
||||||
|
|
||||||
return data_checksum_version;
|
return data_checksum_version;
|
||||||
@@ -139,33 +117,109 @@ describe_db_state(DBState state)
|
|||||||
|
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* we maintain our own version of get_controlfile() as we need cross-version
|
* We maintain our own version of get_controlfile() as we need cross-version
|
||||||
* compatibility, and also don't care if the file isn't readable.
|
* compatibility, and also don't care if the file isn't readable.
|
||||||
*/
|
*/
|
||||||
static ControlFileInfo *
|
static ControlFileInfo *
|
||||||
get_controlfile(const char *DataDir)
|
get_controlfile(const char *DataDir)
|
||||||
{
|
{
|
||||||
ControlFileInfo *control_file_info;
|
ControlFileInfo *control_file_info;
|
||||||
int fd;
|
FILE *fp = NULL;
|
||||||
|
int fd, ret, version_num;
|
||||||
|
char PgVersionPath[MAXPGPATH] = "";
|
||||||
char ControlFilePath[MAXPGPATH] = "";
|
char ControlFilePath[MAXPGPATH] = "";
|
||||||
|
char file_version_string[64] = "";
|
||||||
|
long file_major, file_minor;
|
||||||
|
char *endptr = NULL;
|
||||||
|
void *ControlFileDataPtr = NULL;
|
||||||
|
int expected_size = 0;
|
||||||
|
|
||||||
control_file_info = palloc0(sizeof(ControlFileInfo));
|
control_file_info = palloc0(sizeof(ControlFileInfo));
|
||||||
|
|
||||||
|
/* set default values */
|
||||||
control_file_info->control_file_processed = false;
|
control_file_info->control_file_processed = false;
|
||||||
control_file_info->control_file = palloc0(sizeof(ControlFileData));
|
control_file_info->system_identifier = UNKNOWN_SYSTEM_IDENTIFIER;
|
||||||
|
control_file_info->state = DB_SHUTDOWNED;
|
||||||
|
control_file_info->checkPoint = InvalidXLogRecPtr;
|
||||||
|
control_file_info->data_checksum_version = -1;
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Read PG_VERSION, as we'll need to determine which struct to read
|
||||||
|
* the control file contents into
|
||||||
|
*/
|
||||||
|
snprintf(PgVersionPath, MAXPGPATH, "%s/PG_VERSION", DataDir);
|
||||||
|
|
||||||
|
fp = fopen(PgVersionPath, "r");
|
||||||
|
|
||||||
|
if (fp == NULL)
|
||||||
|
{
|
||||||
|
log_warning(_("could not open file \"%s\" for reading"),
|
||||||
|
PgVersionPath);
|
||||||
|
log_detail("%s", strerror(errno));
|
||||||
|
return control_file_info;
|
||||||
|
}
|
||||||
|
|
||||||
|
file_version_string[0] = '\0';
|
||||||
|
|
||||||
|
ret = fscanf(fp, "%63s", file_version_string);
|
||||||
|
fclose(fp);
|
||||||
|
|
||||||
|
if (ret != 1 || endptr == file_version_string)
|
||||||
|
{
|
||||||
|
log_warning(_("unable to determine major version number from PG_VERSION"));
|
||||||
|
|
||||||
|
return control_file_info;
|
||||||
|
}
|
||||||
|
|
||||||
|
file_major = strtol(file_version_string, &endptr, 10);
|
||||||
|
file_minor = 0;
|
||||||
|
|
||||||
|
if (*endptr == '.')
|
||||||
|
file_minor = strtol(endptr + 1, NULL, 10);
|
||||||
|
|
||||||
|
version_num = ((int) file_major * 10000) + ((int) file_minor * 100);
|
||||||
|
|
||||||
|
if (version_num < 90300)
|
||||||
|
{
|
||||||
|
log_warning(_("Data directory appears to be initialised for %s"), file_version_string);
|
||||||
|
return control_file_info;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
snprintf(ControlFilePath, MAXPGPATH, "%s/global/pg_control", DataDir);
|
snprintf(ControlFilePath, MAXPGPATH, "%s/global/pg_control", DataDir);
|
||||||
|
|
||||||
if ((fd = open(ControlFilePath, O_RDONLY | PG_BINARY, 0)) == -1)
|
if ((fd = open(ControlFilePath, O_RDONLY | PG_BINARY, 0)) == -1)
|
||||||
{
|
{
|
||||||
log_debug("could not open file \"%s\" for reading: %s",
|
log_warning(_("could not open file \"%s\" for reading"),
|
||||||
ControlFilePath, strerror(errno));
|
ControlFilePath);
|
||||||
|
log_detail("%s", strerror(errno));
|
||||||
return control_file_info;
|
return control_file_info;
|
||||||
}
|
}
|
||||||
|
|
||||||
if (read(fd, control_file_info->control_file, sizeof(ControlFileData)) != sizeof(ControlFileData))
|
|
||||||
|
if (version_num >= 90500)
|
||||||
{
|
{
|
||||||
log_debug("could not read file \"%s\": %s",
|
expected_size = sizeof(ControlFileData95);
|
||||||
ControlFilePath, strerror(errno));
|
ControlFileDataPtr = palloc0(expected_size);
|
||||||
|
}
|
||||||
|
else if (version_num >= 90400)
|
||||||
|
{
|
||||||
|
expected_size = sizeof(ControlFileData94);
|
||||||
|
ControlFileDataPtr = palloc0(expected_size);
|
||||||
|
}
|
||||||
|
else if (version_num >= 90300)
|
||||||
|
{
|
||||||
|
expected_size = sizeof(ControlFileData93);
|
||||||
|
ControlFileDataPtr = palloc0(expected_size);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
if (read(fd, ControlFileDataPtr, expected_size) != expected_size)
|
||||||
|
{
|
||||||
|
log_warning(_("could not read file \"%s\""),
|
||||||
|
ControlFilePath);
|
||||||
|
log_detail("%s", strerror(errno));
|
||||||
|
|
||||||
return control_file_info;
|
return control_file_info;
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -173,6 +227,41 @@ get_controlfile(const char *DataDir)
|
|||||||
|
|
||||||
control_file_info->control_file_processed = true;
|
control_file_info->control_file_processed = true;
|
||||||
|
|
||||||
|
if (version_num >= 110000)
|
||||||
|
{
|
||||||
|
ControlFileData11 *ptr = (struct ControlFileData11 *)ControlFileDataPtr;
|
||||||
|
control_file_info->system_identifier = ptr->system_identifier;
|
||||||
|
control_file_info->state = ptr->state;
|
||||||
|
control_file_info->checkPoint = ptr->checkPoint;
|
||||||
|
control_file_info->data_checksum_version = ptr->data_checksum_version;
|
||||||
|
}
|
||||||
|
else if (version_num >= 90500)
|
||||||
|
{
|
||||||
|
ControlFileData95 *ptr = (struct ControlFileData95 *)ControlFileDataPtr;
|
||||||
|
control_file_info->system_identifier = ptr->system_identifier;
|
||||||
|
control_file_info->state = ptr->state;
|
||||||
|
control_file_info->checkPoint = ptr->checkPoint;
|
||||||
|
control_file_info->data_checksum_version = ptr->data_checksum_version;
|
||||||
|
}
|
||||||
|
else if (version_num >= 90400)
|
||||||
|
{
|
||||||
|
ControlFileData94 *ptr = (struct ControlFileData94 *)ControlFileDataPtr;
|
||||||
|
control_file_info->system_identifier = ptr->system_identifier;
|
||||||
|
control_file_info->state = ptr->state;
|
||||||
|
control_file_info->checkPoint = ptr->checkPoint;
|
||||||
|
control_file_info->data_checksum_version = ptr->data_checksum_version;
|
||||||
|
}
|
||||||
|
else if (version_num >= 90300)
|
||||||
|
{
|
||||||
|
ControlFileData93 *ptr = (struct ControlFileData93 *)ControlFileDataPtr;
|
||||||
|
control_file_info->system_identifier = ptr->system_identifier;
|
||||||
|
control_file_info->state = ptr->state;
|
||||||
|
control_file_info->checkPoint = ptr->checkPoint;
|
||||||
|
control_file_info->data_checksum_version = ptr->data_checksum_version;
|
||||||
|
}
|
||||||
|
|
||||||
|
pfree(ControlFileDataPtr);
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* We don't check the CRC here as we're potentially checking a pg_control
|
* We don't check the CRC here as we're potentially checking a pg_control
|
||||||
* file from a different PostgreSQL version to the one repmgr was compiled
|
* file from a different PostgreSQL version to the one repmgr was compiled
|
||||||
|
|||||||
318
controldata.h
318
controldata.h
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* controldata.h
|
* controldata.h
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
* Copyright (c) 2ndQuadrant, 2010-2018
|
||||||
*
|
*
|
||||||
* Portions Copyright (c) 1996-2016, PostgreSQL Global Development Group
|
* Portions Copyright (c) 1996-2016, PostgreSQL Global Development Group
|
||||||
* Portions Copyright (c) 1994, Regents of the University of California
|
* Portions Copyright (c) 1994, Regents of the University of California
|
||||||
@@ -12,12 +12,326 @@
|
|||||||
#include "postgres_fe.h"
|
#include "postgres_fe.h"
|
||||||
#include "catalog/pg_control.h"
|
#include "catalog/pg_control.h"
|
||||||
|
|
||||||
|
/*
|
||||||
|
* A simplified representation of pg_control containing only those fields
|
||||||
|
* required by repmgr.
|
||||||
|
*/
|
||||||
typedef struct
|
typedef struct
|
||||||
{
|
{
|
||||||
bool control_file_processed;
|
bool control_file_processed;
|
||||||
ControlFileData *control_file;
|
uint64 system_identifier;
|
||||||
|
DBState state;
|
||||||
|
XLogRecPtr checkPoint;
|
||||||
|
uint32 data_checksum_version;
|
||||||
} ControlFileInfo;
|
} ControlFileInfo;
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
/* Same for 9.3, 9.4 */
|
||||||
|
typedef struct CheckPoint93
|
||||||
|
{
|
||||||
|
XLogRecPtr redo; /* next RecPtr available when we began to
|
||||||
|
* create CheckPoint (i.e. REDO start point) */
|
||||||
|
TimeLineID ThisTimeLineID; /* current TLI */
|
||||||
|
TimeLineID PrevTimeLineID; /* previous TLI, if this record begins a new
|
||||||
|
* timeline (equals ThisTimeLineID otherwise) */
|
||||||
|
bool fullPageWrites; /* current full_page_writes */
|
||||||
|
uint32 nextXidEpoch; /* higher-order bits of nextXid */
|
||||||
|
TransactionId nextXid; /* next free XID */
|
||||||
|
Oid nextOid; /* next free OID */
|
||||||
|
MultiXactId nextMulti; /* next free MultiXactId */
|
||||||
|
MultiXactOffset nextMultiOffset; /* next free MultiXact offset */
|
||||||
|
TransactionId oldestXid; /* cluster-wide minimum datfrozenxid */
|
||||||
|
Oid oldestXidDB; /* database with minimum datfrozenxid */
|
||||||
|
MultiXactId oldestMulti; /* cluster-wide minimum datminmxid */
|
||||||
|
Oid oldestMultiDB; /* database with minimum datminmxid */
|
||||||
|
pg_time_t time; /* time stamp of checkpoint */
|
||||||
|
|
||||||
|
TransactionId oldestActiveXid;
|
||||||
|
} CheckPoint93;
|
||||||
|
|
||||||
|
|
||||||
|
/* Same for 9.5, 9.6, 10, HEAD */
|
||||||
|
typedef struct CheckPoint95
|
||||||
|
{
|
||||||
|
XLogRecPtr redo; /* next RecPtr available when we began to
|
||||||
|
* create CheckPoint (i.e. REDO start point) */
|
||||||
|
TimeLineID ThisTimeLineID; /* current TLI */
|
||||||
|
TimeLineID PrevTimeLineID; /* previous TLI, if this record begins a new
|
||||||
|
* timeline (equals ThisTimeLineID otherwise) */
|
||||||
|
bool fullPageWrites; /* current full_page_writes */
|
||||||
|
uint32 nextXidEpoch; /* higher-order bits of nextXid */
|
||||||
|
TransactionId nextXid; /* next free XID */
|
||||||
|
Oid nextOid; /* next free OID */
|
||||||
|
MultiXactId nextMulti; /* next free MultiXactId */
|
||||||
|
MultiXactOffset nextMultiOffset; /* next free MultiXact offset */
|
||||||
|
TransactionId oldestXid; /* cluster-wide minimum datfrozenxid */
|
||||||
|
Oid oldestXidDB; /* database with minimum datfrozenxid */
|
||||||
|
MultiXactId oldestMulti; /* cluster-wide minimum datminmxid */
|
||||||
|
Oid oldestMultiDB; /* database with minimum datminmxid */
|
||||||
|
pg_time_t time; /* time stamp of checkpoint */
|
||||||
|
TransactionId oldestCommitTsXid; /* oldest Xid with valid commit
|
||||||
|
* timestamp */
|
||||||
|
TransactionId newestCommitTsXid; /* newest Xid with valid commit
|
||||||
|
* timestamp */
|
||||||
|
|
||||||
|
TransactionId oldestActiveXid;
|
||||||
|
} CheckPoint95;
|
||||||
|
|
||||||
|
|
||||||
|
typedef struct ControlFileData93
|
||||||
|
{
|
||||||
|
uint64 system_identifier;
|
||||||
|
|
||||||
|
uint32 pg_control_version; /* PG_CONTROL_VERSION */
|
||||||
|
uint32 catalog_version_no; /* see catversion.h */
|
||||||
|
|
||||||
|
DBState state; /* see enum above */
|
||||||
|
pg_time_t time; /* time stamp of last pg_control update */
|
||||||
|
XLogRecPtr checkPoint; /* last check point record ptr */
|
||||||
|
XLogRecPtr prevCheckPoint; /* previous check point record ptr */
|
||||||
|
|
||||||
|
CheckPoint93 checkPointCopy; /* copy of last check point record */
|
||||||
|
|
||||||
|
XLogRecPtr unloggedLSN; /* current fake LSN value, for unlogged rels */
|
||||||
|
|
||||||
|
XLogRecPtr minRecoveryPoint;
|
||||||
|
TimeLineID minRecoveryPointTLI;
|
||||||
|
XLogRecPtr backupStartPoint;
|
||||||
|
XLogRecPtr backupEndPoint;
|
||||||
|
bool backupEndRequired;
|
||||||
|
|
||||||
|
int wal_level;
|
||||||
|
int MaxConnections;
|
||||||
|
int max_prepared_xacts;
|
||||||
|
int max_locks_per_xact;
|
||||||
|
|
||||||
|
uint32 maxAlign; /* alignment requirement for tuples */
|
||||||
|
double floatFormat; /* constant 1234567.0 */
|
||||||
|
|
||||||
|
uint32 blcksz; /* data block size for this DB */
|
||||||
|
uint32 relseg_size; /* blocks per segment of large relation */
|
||||||
|
|
||||||
|
uint32 xlog_blcksz; /* block size within WAL files */
|
||||||
|
uint32 xlog_seg_size; /* size of each WAL segment */
|
||||||
|
|
||||||
|
uint32 nameDataLen; /* catalog name field width */
|
||||||
|
uint32 indexMaxKeys; /* max number of columns in an index */
|
||||||
|
|
||||||
|
uint32 toast_max_chunk_size; /* chunk size in TOAST tables */
|
||||||
|
|
||||||
|
/* flag indicating internal format of timestamp, interval, time */
|
||||||
|
bool enableIntTimes; /* int64 storage enabled? */
|
||||||
|
|
||||||
|
/* flags indicating pass-by-value status of various types */
|
||||||
|
bool float4ByVal; /* float4 pass-by-value? */
|
||||||
|
bool float8ByVal; /* float8, int8, etc pass-by-value? */
|
||||||
|
|
||||||
|
/* Are data pages protected by checksums? Zero if no checksum version */
|
||||||
|
uint32 data_checksum_version;
|
||||||
|
|
||||||
|
} ControlFileData93;
|
||||||
|
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Following fields added since 9.3:
|
||||||
|
*
|
||||||
|
* int max_worker_processes;
|
||||||
|
* int max_prepared_xacts;
|
||||||
|
* int max_locks_per_xact;
|
||||||
|
*
|
||||||
|
*/
|
||||||
|
typedef struct ControlFileData94
|
||||||
|
{
|
||||||
|
uint64 system_identifier;
|
||||||
|
|
||||||
|
uint32 pg_control_version; /* PG_CONTROL_VERSION */
|
||||||
|
uint32 catalog_version_no; /* see catversion.h */
|
||||||
|
|
||||||
|
DBState state; /* see enum above */
|
||||||
|
pg_time_t time; /* time stamp of last pg_control update */
|
||||||
|
XLogRecPtr checkPoint; /* last check point record ptr */
|
||||||
|
XLogRecPtr prevCheckPoint; /* previous check point record ptr */
|
||||||
|
|
||||||
|
CheckPoint93 checkPointCopy; /* copy of last check point record */
|
||||||
|
|
||||||
|
XLogRecPtr unloggedLSN; /* current fake LSN value, for unlogged rels */
|
||||||
|
|
||||||
|
XLogRecPtr minRecoveryPoint;
|
||||||
|
TimeLineID minRecoveryPointTLI;
|
||||||
|
XLogRecPtr backupStartPoint;
|
||||||
|
XLogRecPtr backupEndPoint;
|
||||||
|
bool backupEndRequired;
|
||||||
|
|
||||||
|
int wal_level;
|
||||||
|
bool wal_log_hints;
|
||||||
|
int MaxConnections;
|
||||||
|
int max_worker_processes;
|
||||||
|
int max_prepared_xacts;
|
||||||
|
int max_locks_per_xact;
|
||||||
|
|
||||||
|
uint32 maxAlign; /* alignment requirement for tuples */
|
||||||
|
double floatFormat; /* constant 1234567.0 */
|
||||||
|
|
||||||
|
uint32 blcksz; /* data block size for this DB */
|
||||||
|
uint32 relseg_size; /* blocks per segment of large relation */
|
||||||
|
|
||||||
|
uint32 xlog_blcksz; /* block size within WAL files */
|
||||||
|
uint32 xlog_seg_size; /* size of each WAL segment */
|
||||||
|
|
||||||
|
uint32 nameDataLen; /* catalog name field width */
|
||||||
|
uint32 indexMaxKeys; /* max number of columns in an index */
|
||||||
|
|
||||||
|
uint32 toast_max_chunk_size; /* chunk size in TOAST tables */
|
||||||
|
uint32 loblksize; /* chunk size in pg_largeobject */
|
||||||
|
|
||||||
|
bool enableIntTimes; /* int64 storage enabled? */
|
||||||
|
|
||||||
|
bool float4ByVal; /* float4 pass-by-value? */
|
||||||
|
bool float8ByVal; /* float8, int8, etc pass-by-value? */
|
||||||
|
|
||||||
|
/* Are data pages protected by checksums? Zero if no checksum version */
|
||||||
|
uint32 data_checksum_version;
|
||||||
|
|
||||||
|
} ControlFileData94;
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Following field added since 9.4:
|
||||||
|
*
|
||||||
|
* bool track_commit_timestamp;
|
||||||
|
*
|
||||||
|
* Unchanged in 9.6
|
||||||
|
*
|
||||||
|
* In 10, following field appended *after* "data_checksum_version":
|
||||||
|
*
|
||||||
|
* char mock_authentication_nonce[MOCK_AUTH_NONCE_LEN];
|
||||||
|
*
|
||||||
|
* (but we don't care about that)
|
||||||
|
*/
|
||||||
|
|
||||||
|
typedef struct ControlFileData95
|
||||||
|
{
|
||||||
|
uint64 system_identifier;
|
||||||
|
|
||||||
|
uint32 pg_control_version; /* PG_CONTROL_VERSION */
|
||||||
|
uint32 catalog_version_no; /* see catversion.h */
|
||||||
|
|
||||||
|
DBState state; /* see enum above */
|
||||||
|
pg_time_t time; /* time stamp of last pg_control update */
|
||||||
|
XLogRecPtr checkPoint; /* last check point record ptr */
|
||||||
|
XLogRecPtr prevCheckPoint; /* previous check point record ptr */
|
||||||
|
|
||||||
|
CheckPoint95 checkPointCopy; /* copy of last check point record */
|
||||||
|
|
||||||
|
XLogRecPtr unloggedLSN; /* current fake LSN value, for unlogged rels */
|
||||||
|
|
||||||
|
XLogRecPtr minRecoveryPoint;
|
||||||
|
TimeLineID minRecoveryPointTLI;
|
||||||
|
XLogRecPtr backupStartPoint;
|
||||||
|
XLogRecPtr backupEndPoint;
|
||||||
|
bool backupEndRequired;
|
||||||
|
|
||||||
|
int wal_level;
|
||||||
|
bool wal_log_hints;
|
||||||
|
int MaxConnections;
|
||||||
|
int max_worker_processes;
|
||||||
|
int max_prepared_xacts;
|
||||||
|
int max_locks_per_xact;
|
||||||
|
bool track_commit_timestamp;
|
||||||
|
|
||||||
|
uint32 maxAlign; /* alignment requirement for tuples */
|
||||||
|
double floatFormat; /* constant 1234567.0 */
|
||||||
|
|
||||||
|
uint32 blcksz; /* data block size for this DB */
|
||||||
|
uint32 relseg_size; /* blocks per segment of large relation */
|
||||||
|
|
||||||
|
uint32 xlog_blcksz; /* block size within WAL files */
|
||||||
|
uint32 xlog_seg_size; /* size of each WAL segment */
|
||||||
|
|
||||||
|
uint32 nameDataLen; /* catalog name field width */
|
||||||
|
uint32 indexMaxKeys; /* max number of columns in an index */
|
||||||
|
|
||||||
|
uint32 toast_max_chunk_size; /* chunk size in TOAST tables */
|
||||||
|
uint32 loblksize; /* chunk size in pg_largeobject */
|
||||||
|
|
||||||
|
bool enableIntTimes; /* int64 storage enabled? */
|
||||||
|
|
||||||
|
bool float4ByVal; /* float4 pass-by-value? */
|
||||||
|
bool float8ByVal; /* float8, int8, etc pass-by-value? */
|
||||||
|
|
||||||
|
uint32 data_checksum_version;
|
||||||
|
|
||||||
|
} ControlFileData95;
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Following field removed in 11:
|
||||||
|
*
|
||||||
|
* XLogRecPtr prevCheckPoint;
|
||||||
|
*
|
||||||
|
* In 10, following field appended *after* "data_checksum_version":
|
||||||
|
*
|
||||||
|
* char mock_authentication_nonce[MOCK_AUTH_NONCE_LEN];
|
||||||
|
*
|
||||||
|
* (but we don't care about that)
|
||||||
|
*/
|
||||||
|
|
||||||
|
typedef struct ControlFileData11
|
||||||
|
{
|
||||||
|
uint64 system_identifier;
|
||||||
|
|
||||||
|
uint32 pg_control_version; /* PG_CONTROL_VERSION */
|
||||||
|
uint32 catalog_version_no; /* see catversion.h */
|
||||||
|
|
||||||
|
DBState state; /* see enum above */
|
||||||
|
pg_time_t time; /* time stamp of last pg_control update */
|
||||||
|
XLogRecPtr checkPoint; /* last check point record ptr */
|
||||||
|
|
||||||
|
CheckPoint95 checkPointCopy; /* copy of last check point record */
|
||||||
|
|
||||||
|
XLogRecPtr unloggedLSN; /* current fake LSN value, for unlogged rels */
|
||||||
|
|
||||||
|
XLogRecPtr minRecoveryPoint;
|
||||||
|
TimeLineID minRecoveryPointTLI;
|
||||||
|
XLogRecPtr backupStartPoint;
|
||||||
|
XLogRecPtr backupEndPoint;
|
||||||
|
bool backupEndRequired;
|
||||||
|
|
||||||
|
int wal_level;
|
||||||
|
bool wal_log_hints;
|
||||||
|
int MaxConnections;
|
||||||
|
int max_worker_processes;
|
||||||
|
int max_prepared_xacts;
|
||||||
|
int max_locks_per_xact;
|
||||||
|
bool track_commit_timestamp;
|
||||||
|
|
||||||
|
uint32 maxAlign; /* alignment requirement for tuples */
|
||||||
|
double floatFormat; /* constant 1234567.0 */
|
||||||
|
|
||||||
|
uint32 blcksz; /* data block size for this DB */
|
||||||
|
uint32 relseg_size; /* blocks per segment of large relation */
|
||||||
|
|
||||||
|
uint32 xlog_blcksz; /* block size within WAL files */
|
||||||
|
uint32 xlog_seg_size; /* size of each WAL segment */
|
||||||
|
|
||||||
|
uint32 nameDataLen; /* catalog name field width */
|
||||||
|
uint32 indexMaxKeys; /* max number of columns in an index */
|
||||||
|
|
||||||
|
uint32 toast_max_chunk_size; /* chunk size in TOAST tables */
|
||||||
|
uint32 loblksize; /* chunk size in pg_largeobject */
|
||||||
|
|
||||||
|
bool enableIntTimes; /* int64 storage enabled? */
|
||||||
|
|
||||||
|
bool float4ByVal; /* float4 pass-by-value? */
|
||||||
|
bool float8ByVal; /* float8, int8, etc pass-by-value? */
|
||||||
|
|
||||||
|
uint32 data_checksum_version;
|
||||||
|
|
||||||
|
} ControlFileData11;
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
extern DBState get_db_state(const char *data_directory);
|
extern DBState get_db_state(const char *data_directory);
|
||||||
extern const char *describe_db_state(DBState state);
|
extern const char *describe_db_state(DBState state);
|
||||||
extern int get_data_checksum_version(const char *data_directory);
|
extern int get_data_checksum_version(const char *data_directory);
|
||||||
|
|||||||
121
dbutils.h
121
dbutils.h
@@ -1,7 +1,7 @@
|
|||||||
/*
|
/*
|
||||||
* dbutils.h
|
* dbutils.h
|
||||||
*
|
*
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
* Copyright (c) 2ndQuadrant, 2010-2018
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -28,8 +28,10 @@
|
|||||||
#include "strutil.h"
|
#include "strutil.h"
|
||||||
#include "voting.h"
|
#include "voting.h"
|
||||||
|
|
||||||
#define REPMGR_NODES_COLUMNS "node_id, type, upstream_node_id, node_name, conninfo, repluser, slot_name, location, priority, active, config_file, '' AS upstream_node_name "
|
#define REPMGR_NODES_COLUMNS "n.node_id, n.type, n.upstream_node_id, n.node_name, n.conninfo, n.repluser, n.slot_name, n.location, n.priority, n.active, n.config_file, '' AS upstream_node_name "
|
||||||
#define BDR_NODES_COLUMNS "node_sysid, node_timeline, node_dboid, node_status, node_name, node_local_dsn, node_init_from_dsn, node_read_only, node_seq_id"
|
#define BDR2_NODES_COLUMNS "node_sysid, node_timeline, node_dboid, node_name, node_local_dsn, ''"
|
||||||
|
#define BDR3_NODES_COLUMNS "ns.node_id, 0, 0, ns.node_name, ns.interface_connstr, ns.peer_state_name"
|
||||||
|
|
||||||
|
|
||||||
#define ERRBUFF_SIZE 512
|
#define ERRBUFF_SIZE 512
|
||||||
|
|
||||||
@@ -38,6 +40,7 @@ typedef enum
|
|||||||
UNKNOWN = 0,
|
UNKNOWN = 0,
|
||||||
PRIMARY,
|
PRIMARY,
|
||||||
STANDBY,
|
STANDBY,
|
||||||
|
WITNESS,
|
||||||
BDR
|
BDR
|
||||||
} t_server_type;
|
} t_server_type;
|
||||||
|
|
||||||
@@ -73,17 +76,18 @@ typedef enum
|
|||||||
{
|
{
|
||||||
NODE_STATUS_UNKNOWN = -1,
|
NODE_STATUS_UNKNOWN = -1,
|
||||||
NODE_STATUS_UP,
|
NODE_STATUS_UP,
|
||||||
|
NODE_STATUS_SHUTTING_DOWN,
|
||||||
NODE_STATUS_DOWN,
|
NODE_STATUS_DOWN,
|
||||||
NODE_STATUS_UNCLEAN_SHUTDOWN
|
NODE_STATUS_UNCLEAN_SHUTDOWN
|
||||||
} NodeStatus;
|
} NodeStatus;
|
||||||
|
|
||||||
typedef enum
|
typedef enum
|
||||||
{
|
{
|
||||||
VR_VOTE_REFUSED = -1,
|
CONN_UNKNOWN = -1,
|
||||||
VR_POSITIVE_VOTE,
|
CONN_OK,
|
||||||
VR_NEGATIVE_VOTE
|
CONN_BAD,
|
||||||
} VoteRequestResult;
|
CONN_ERROR
|
||||||
|
} ConnectionStatus;
|
||||||
|
|
||||||
typedef enum
|
typedef enum
|
||||||
{
|
{
|
||||||
@@ -92,6 +96,14 @@ typedef enum
|
|||||||
SLOT_ACTIVE
|
SLOT_ACTIVE
|
||||||
} ReplSlotStatus;
|
} ReplSlotStatus;
|
||||||
|
|
||||||
|
typedef enum
|
||||||
|
{
|
||||||
|
BACKUP_STATE_UNKNOWN = -1,
|
||||||
|
BACKUP_STATE_IN_BACKUP,
|
||||||
|
BACKUP_STATE_NO_BACKUP
|
||||||
|
} BackupState;
|
||||||
|
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* Struct to store node information
|
* Struct to store node information
|
||||||
*/
|
*/
|
||||||
@@ -181,11 +193,13 @@ typedef struct s_event_info
|
|||||||
{
|
{
|
||||||
char *node_name;
|
char *node_name;
|
||||||
char *conninfo_str;
|
char *conninfo_str;
|
||||||
|
int node_id;
|
||||||
} t_event_info;
|
} t_event_info;
|
||||||
|
|
||||||
#define T_EVENT_INFO_INITIALIZER { \
|
#define T_EVENT_INFO_INITIALIZER { \
|
||||||
NULL, \
|
NULL, \
|
||||||
NULL \
|
NULL, \
|
||||||
|
UNKNOWN_NODE_ID \
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
@@ -233,18 +247,14 @@ typedef struct s_bdr_node_info
|
|||||||
char node_sysid[MAXLEN];
|
char node_sysid[MAXLEN];
|
||||||
uint32 node_timeline;
|
uint32 node_timeline;
|
||||||
uint32 node_dboid;
|
uint32 node_dboid;
|
||||||
char node_status;
|
|
||||||
char node_name[MAXLEN];
|
char node_name[MAXLEN];
|
||||||
char node_local_dsn[MAXLEN];
|
char node_local_dsn[MAXLEN];
|
||||||
char node_init_from_dsn[MAXLEN];
|
char peer_state_name[MAXLEN];
|
||||||
bool read_only;
|
|
||||||
uint32 node_seq_id;
|
|
||||||
} t_bdr_node_info;
|
} t_bdr_node_info;
|
||||||
|
|
||||||
#define T_BDR_NODE_INFO_INITIALIZER { \
|
#define T_BDR_NODE_INFO_INITIALIZER { \
|
||||||
"", InvalidOid, InvalidOid, \
|
"", InvalidOid, InvalidOid, \
|
||||||
'?', "", "", "", \
|
"", "", "" \
|
||||||
false, -1 \
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
@@ -317,6 +327,21 @@ typedef struct
|
|||||||
UNKNOWN_TIMELINE_ID, \
|
UNKNOWN_TIMELINE_ID, \
|
||||||
InvalidXLogRecPtr \
|
InvalidXLogRecPtr \
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
typedef struct RepmgrdInfo {
|
||||||
|
int node_id;
|
||||||
|
int pid;
|
||||||
|
char pid_text[MAXLEN];
|
||||||
|
char pid_file[MAXLEN];
|
||||||
|
bool pg_running;
|
||||||
|
char pg_running_text[MAXLEN];
|
||||||
|
bool running;
|
||||||
|
char repmgrd_running[MAXLEN];
|
||||||
|
bool paused;
|
||||||
|
} RepmgrdInfo;
|
||||||
|
|
||||||
|
|
||||||
/* global variables */
|
/* global variables */
|
||||||
|
|
||||||
extern int server_version_num;
|
extern int server_version_num;
|
||||||
@@ -339,9 +364,6 @@ bool atobool(const char *value);
|
|||||||
PGconn *establish_db_connection(const char *conninfo,
|
PGconn *establish_db_connection(const char *conninfo,
|
||||||
const bool exit_on_error);
|
const bool exit_on_error);
|
||||||
PGconn *establish_db_connection_quiet(const char *conninfo);
|
PGconn *establish_db_connection_quiet(const char *conninfo);
|
||||||
PGconn *establish_db_connection_as_user(const char *conninfo,
|
|
||||||
const char *user,
|
|
||||||
const bool exit_on_error);
|
|
||||||
|
|
||||||
PGconn *establish_db_connection_by_params(t_conninfo_param_list *param_list,
|
PGconn *establish_db_connection_by_params(t_conninfo_param_list *param_list,
|
||||||
const bool exit_on_error);
|
const bool exit_on_error);
|
||||||
@@ -352,10 +374,11 @@ PGconn *get_primary_connection(PGconn *standby_conn, int *primary_id, char *p
|
|||||||
PGconn *get_primary_connection_quiet(PGconn *standby_conn, int *primary_id, char *primary_conninfo_out);
|
PGconn *get_primary_connection_quiet(PGconn *standby_conn, int *primary_id, char *primary_conninfo_out);
|
||||||
|
|
||||||
bool is_superuser_connection(PGconn *conn, t_connection_user *userinfo);
|
bool is_superuser_connection(PGconn *conn, t_connection_user *userinfo);
|
||||||
|
void close_connection(PGconn **conn);
|
||||||
|
|
||||||
/* conninfo manipulation functions */
|
/* conninfo manipulation functions */
|
||||||
bool get_conninfo_value(const char *conninfo, const char *keyword, char *output);
|
bool get_conninfo_value(const char *conninfo, const char *keyword, char *output);
|
||||||
|
bool get_conninfo_default_value(const char *param, char *output, int maxlen);
|
||||||
void initialize_conninfo_params(t_conninfo_param_list *param_list, bool set_defaults);
|
void initialize_conninfo_params(t_conninfo_param_list *param_list, bool set_defaults);
|
||||||
void free_conninfo_params(t_conninfo_param_list *param_list);
|
void free_conninfo_params(t_conninfo_param_list *param_list);
|
||||||
void copy_conninfo_params(t_conninfo_param_list *dest_list, t_conninfo_param_list *source_list);
|
void copy_conninfo_params(t_conninfo_param_list *dest_list, t_conninfo_param_list *source_list);
|
||||||
@@ -363,8 +386,10 @@ void conn_to_param_list(PGconn *conn, t_conninfo_param_list *param_list);
|
|||||||
void param_set(t_conninfo_param_list *param_list, const char *param, const char *value);
|
void param_set(t_conninfo_param_list *param_list, const char *param, const char *value);
|
||||||
void param_set_ine(t_conninfo_param_list *param_list, const char *param, const char *value);
|
void param_set_ine(t_conninfo_param_list *param_list, const char *param, const char *value);
|
||||||
char *param_get(t_conninfo_param_list *param_list, const char *param);
|
char *param_get(t_conninfo_param_list *param_list, const char *param);
|
||||||
bool parse_conninfo_string(const char *conninfo_str, t_conninfo_param_list *param_list, char *errmsg, bool ignore_local_params);
|
bool parse_conninfo_string(const char *conninfo_str, t_conninfo_param_list *param_list, char **errmsg, bool ignore_local_params);
|
||||||
char *param_list_to_string(t_conninfo_param_list *param_list);
|
char *param_list_to_string(t_conninfo_param_list *param_list);
|
||||||
|
bool has_passfile(void);
|
||||||
|
|
||||||
|
|
||||||
/* transaction functions */
|
/* transaction functions */
|
||||||
bool begin_transaction(PGconn *conn);
|
bool begin_transaction(PGconn *conn);
|
||||||
@@ -375,10 +400,8 @@ bool check_cluster_schema(PGconn *conn);
|
|||||||
/* GUC manipulation functions */
|
/* GUC manipulation functions */
|
||||||
bool set_config(PGconn *conn, const char *config_param, const char *config_value);
|
bool set_config(PGconn *conn, const char *config_param, const char *config_value);
|
||||||
bool set_config_bool(PGconn *conn, const char *config_param, bool state);
|
bool set_config_bool(PGconn *conn, const char *config_param, bool state);
|
||||||
int guc_set(PGconn *conn, const char *parameter, const char *op,
|
int guc_set(PGconn *conn, const char *parameter, const char *op, const char *value);
|
||||||
const char *value);
|
int guc_set_typed(PGconn *conn, const char *parameter, const char *op, const char *value, const char *datatype);
|
||||||
int guc_set_typed(PGconn *conn, const char *parameter, const char *op,
|
|
||||||
const char *value, const char *datatype);
|
|
||||||
bool get_pg_setting(PGconn *conn, const char *setting, char *output);
|
bool get_pg_setting(PGconn *conn, const char *setting, char *output);
|
||||||
|
|
||||||
/* server information functions */
|
/* server information functions */
|
||||||
@@ -386,10 +409,16 @@ bool get_cluster_size(PGconn *conn, char *size);
|
|||||||
int get_server_version(PGconn *conn, char *server_version);
|
int get_server_version(PGconn *conn, char *server_version);
|
||||||
RecoveryType get_recovery_type(PGconn *conn);
|
RecoveryType get_recovery_type(PGconn *conn);
|
||||||
int get_primary_node_id(PGconn *conn);
|
int get_primary_node_id(PGconn *conn);
|
||||||
bool can_use_pg_rewind(PGconn *conn, const char *data_directory, PQExpBufferData *reason);
|
|
||||||
int get_ready_archive_files(PGconn *conn, const char *data_directory);
|
int get_ready_archive_files(PGconn *conn, const char *data_directory);
|
||||||
bool identify_system(PGconn *repl_conn, t_system_identification *identification);
|
bool identify_system(PGconn *repl_conn, t_system_identification *identification);
|
||||||
bool repmgrd_set_local_node_id(PGconn *conn, int local_node_id);
|
bool repmgrd_set_local_node_id(PGconn *conn, int local_node_id);
|
||||||
|
int repmgrd_get_local_node_id(PGconn *conn);
|
||||||
|
BackupState server_in_exclusive_backup_mode(PGconn *conn);
|
||||||
|
void repmgrd_set_pid(PGconn *conn, pid_t repmgrd_pid, const char *pidfile);
|
||||||
|
pid_t repmgrd_get_pid(PGconn *conn);
|
||||||
|
bool repmgrd_is_running(PGconn *conn);
|
||||||
|
bool repmgrd_is_paused(PGconn *conn);
|
||||||
|
bool repmgrd_pause(PGconn *conn, bool pause);
|
||||||
|
|
||||||
/* extension functions */
|
/* extension functions */
|
||||||
ExtensionStatus get_repmgr_extension_status(PGconn *conn);
|
ExtensionStatus get_repmgr_extension_status(PGconn *conn);
|
||||||
@@ -404,27 +433,35 @@ t_server_type parse_node_type(const char *type);
|
|||||||
const char *get_node_type_string(t_server_type type);
|
const char *get_node_type_string(t_server_type type);
|
||||||
|
|
||||||
RecordStatus get_node_record(PGconn *conn, int node_id, t_node_info *node_info);
|
RecordStatus get_node_record(PGconn *conn, int node_id, t_node_info *node_info);
|
||||||
|
RecordStatus get_node_record_with_upstream(PGconn *conn, int node_id, t_node_info *node_info);
|
||||||
|
|
||||||
RecordStatus get_node_record_by_name(PGconn *conn, const char *node_name, t_node_info *node_info);
|
RecordStatus get_node_record_by_name(PGconn *conn, const char *node_name, t_node_info *node_info);
|
||||||
t_node_info *get_node_record_pointer(PGconn *conn, int node_id);
|
t_node_info *get_node_record_pointer(PGconn *conn, int node_id);
|
||||||
|
|
||||||
bool get_local_node_record(PGconn *conn, int node_id, t_node_info *node_info);
|
bool get_local_node_record(PGconn *conn, int node_id, t_node_info *node_info);
|
||||||
bool get_primary_node_record(PGconn *conn, t_node_info *node_info);
|
bool get_primary_node_record(PGconn *conn, t_node_info *node_info);
|
||||||
|
|
||||||
void get_all_node_records(PGconn *conn, NodeInfoList *node_list);
|
bool get_all_node_records(PGconn *conn, NodeInfoList *node_list);
|
||||||
void get_downstream_node_records(PGconn *conn, int node_id, NodeInfoList *nodes);
|
void get_downstream_node_records(PGconn *conn, int node_id, NodeInfoList *nodes);
|
||||||
void get_active_sibling_node_records(PGconn *conn, int node_id, int upstream_node_id, NodeInfoList *node_list);
|
void get_active_sibling_node_records(PGconn *conn, int node_id, int upstream_node_id, NodeInfoList *node_list);
|
||||||
void get_node_records_by_priority(PGconn *conn, NodeInfoList *node_list);
|
void get_node_records_by_priority(PGconn *conn, NodeInfoList *node_list);
|
||||||
void get_all_node_records_with_upstream(PGconn *conn, NodeInfoList *node_list);
|
bool get_all_node_records_with_upstream(PGconn *conn, NodeInfoList *node_list);
|
||||||
|
bool get_downstream_nodes_with_missing_slot(PGconn *conn, int this_node_id, NodeInfoList *noede_list);
|
||||||
|
|
||||||
bool create_node_record(PGconn *conn, char *repmgr_action, t_node_info *node_info);
|
bool create_node_record(PGconn *conn, char *repmgr_action, t_node_info *node_info);
|
||||||
bool update_node_record(PGconn *conn, char *repmgr_action, t_node_info *node_info);
|
bool update_node_record(PGconn *conn, char *repmgr_action, t_node_info *node_info);
|
||||||
bool delete_node_record(PGconn *conn, int node);
|
bool delete_node_record(PGconn *conn, int node);
|
||||||
|
bool truncate_node_records(PGconn *conn);
|
||||||
|
|
||||||
bool update_node_record_set_active(PGconn *conn, int this_node_id, bool active);
|
bool update_node_record_set_active(PGconn *conn, int this_node_id, bool active);
|
||||||
bool update_node_record_set_primary(PGconn *conn, int this_node_id);
|
bool update_node_record_set_primary(PGconn *conn, int this_node_id);
|
||||||
|
bool update_node_record_set_active_standby(PGconn *conn, int this_node_id);
|
||||||
bool update_node_record_set_upstream(PGconn *conn, int this_node_id, int new_upstream_node_id);
|
bool update_node_record_set_upstream(PGconn *conn, int this_node_id, int new_upstream_node_id);
|
||||||
bool update_node_record_status(PGconn *conn, int this_node_id, char *type, int upstream_node_id, bool active);
|
bool update_node_record_status(PGconn *conn, int this_node_id, char *type, int upstream_node_id, bool active);
|
||||||
bool update_node_record_conn_priority(PGconn *conn, t_configuration_options *options);
|
bool update_node_record_conn_priority(PGconn *conn, t_configuration_options *options);
|
||||||
|
bool update_node_record_slot_name(PGconn *primary_conn, int node_id, char *slot_name);
|
||||||
|
|
||||||
|
bool witness_copy_node_records(PGconn *primary_conn, PGconn *witness_conn);
|
||||||
|
|
||||||
void clear_node_info_list(NodeInfoList *nodes);
|
void clear_node_info_list(NodeInfoList *nodes);
|
||||||
|
|
||||||
@@ -438,11 +475,15 @@ void config_file_list_add(t_configfile_list *list, const char *file, const char
|
|||||||
bool create_event_record(PGconn *conn, t_configuration_options *options, int node_id, char *event, bool successful, char *details);
|
bool create_event_record(PGconn *conn, t_configuration_options *options, int node_id, char *event, bool successful, char *details);
|
||||||
bool create_event_notification(PGconn *conn, t_configuration_options *options, int node_id, char *event, bool successful, char *details);
|
bool create_event_notification(PGconn *conn, t_configuration_options *options, int node_id, char *event, bool successful, char *details);
|
||||||
bool create_event_notification_extended(PGconn *conn, t_configuration_options *options, int node_id, char *event, bool successful, char *details, t_event_info *event_info);
|
bool create_event_notification_extended(PGconn *conn, t_configuration_options *options, int node_id, char *event, bool successful, char *details, t_event_info *event_info);
|
||||||
|
PGresult *get_event_records(PGconn *conn, int node_id, const char *node_name, const char *event, bool all, int limit);
|
||||||
|
|
||||||
/* replication slot functions */
|
/* replication slot functions */
|
||||||
|
void create_slot_name(char *slot_name, int node_id);
|
||||||
bool create_replication_slot(PGconn *conn, char *slot_name, int server_version_num, PQExpBufferData *error_msg);
|
bool create_replication_slot(PGconn *conn, char *slot_name, int server_version_num, PQExpBufferData *error_msg);
|
||||||
bool drop_replication_slot(PGconn *conn, char *slot_name);
|
bool drop_replication_slot(PGconn *conn, char *slot_name);
|
||||||
RecordStatus get_slot_record(PGconn *conn, char *slot_name, t_replication_slot *record);
|
RecordStatus get_slot_record(PGconn *conn, char *slot_name, t_replication_slot *record);
|
||||||
|
int get_free_replication_slot_count(PGconn *conn);
|
||||||
|
int get_inactive_replication_slots(PGconn *conn, KeyValueList *list);
|
||||||
|
|
||||||
/* tablespace functions */
|
/* tablespace functions */
|
||||||
bool get_tablespace_name_by_location(PGconn *conn, const char *location, char *name);
|
bool get_tablespace_name_by_location(PGconn *conn, const char *location, char *name);
|
||||||
@@ -453,6 +494,8 @@ int wait_connection_availability(PGconn *conn, long long timeout);
|
|||||||
|
|
||||||
/* node availability functions */
|
/* node availability functions */
|
||||||
bool is_server_available(const char *conninfo);
|
bool is_server_available(const char *conninfo);
|
||||||
|
bool is_server_available_params(t_conninfo_param_list *param_list);
|
||||||
|
ExecStatusType connection_ping(PGconn *conn);
|
||||||
|
|
||||||
/* monitoring functions */
|
/* monitoring functions */
|
||||||
void
|
void
|
||||||
@@ -468,15 +511,15 @@ add_monitoring_record(PGconn *primary_conn,
|
|||||||
long long unsigned int apply_lag_bytes
|
long long unsigned int apply_lag_bytes
|
||||||
);
|
);
|
||||||
|
|
||||||
int get_number_of_monitoring_records_to_delete(PGconn *primary_conn, int keep_history);
|
int get_number_of_monitoring_records_to_delete(PGconn *primary_conn, int keep_history, int node_id);
|
||||||
bool delete_monitoring_records(PGconn *primary_conn, int keep_history);
|
bool delete_monitoring_records(PGconn *primary_conn, int keep_history, int node_id);
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
/* node voting functions */
|
/* node voting functions */
|
||||||
NodeVotingStatus get_voting_status(PGconn *conn);
|
void initialize_voting_term(PGconn *conn);
|
||||||
VoteRequestResult request_vote(PGconn *conn, t_node_info *this_node, t_node_info *other_node, int electoral_term);
|
int get_current_term(PGconn *conn);
|
||||||
int set_voting_status_initiated(PGconn *conn);
|
void increment_current_term(PGconn *conn);
|
||||||
bool announce_candidature(PGconn *conn, t_node_info *this_node, t_node_info *other_node, int electoral_term);
|
bool announce_candidature(PGconn *conn, t_node_info *this_node, t_node_info *other_node, int electoral_term);
|
||||||
void notify_follow_primary(PGconn *conn, int primary_node_id);
|
void notify_follow_primary(PGconn *conn, int primary_node_id);
|
||||||
bool get_new_primary(PGconn *conn, int *primary_node_id);
|
bool get_new_primary(PGconn *conn, int *primary_node_id);
|
||||||
@@ -487,24 +530,32 @@ XLogRecPtr get_current_wal_lsn(PGconn *conn);
|
|||||||
XLogRecPtr get_last_wal_receive_location(PGconn *conn);
|
XLogRecPtr get_last_wal_receive_location(PGconn *conn);
|
||||||
bool get_replication_info(PGconn *conn, ReplInfo *replication_info);
|
bool get_replication_info(PGconn *conn, ReplInfo *replication_info);
|
||||||
int get_replication_lag_seconds(PGconn *conn);
|
int get_replication_lag_seconds(PGconn *conn);
|
||||||
void get_node_replication_stats(PGconn *conn, t_node_info *node_info);
|
void get_node_replication_stats(PGconn *conn, int server_version_num, t_node_info *node_info);
|
||||||
bool is_downstream_node_attached(PGconn *conn, char *node_name);
|
bool is_downstream_node_attached(PGconn *conn, char *node_name);
|
||||||
|
|
||||||
/* BDR functions */
|
/* BDR functions */
|
||||||
|
int get_bdr_version_num(void);
|
||||||
void get_all_bdr_node_records(PGconn *conn, BdrNodeInfoList *node_list);
|
void get_all_bdr_node_records(PGconn *conn, BdrNodeInfoList *node_list);
|
||||||
RecordStatus get_bdr_node_record_by_name(PGconn *conn, const char *node_name, t_bdr_node_info *node_info);
|
RecordStatus get_bdr_node_record_by_name(PGconn *conn, const char *node_name, t_bdr_node_info *node_info);
|
||||||
bool is_bdr_db(PGconn *conn, PQExpBufferData *output);
|
bool is_bdr_db(PGconn *conn, PQExpBufferData *output);
|
||||||
|
bool is_bdr_db_quiet(PGconn *conn);
|
||||||
bool is_active_bdr_node(PGconn *conn, const char *node_name);
|
bool is_active_bdr_node(PGconn *conn, const char *node_name);
|
||||||
bool is_bdr_repmgr(PGconn *conn);
|
bool is_bdr_repmgr(PGconn *conn);
|
||||||
|
char *get_default_bdr_replication_set(PGconn *conn);
|
||||||
bool is_table_in_bdr_replication_set(PGconn *conn, const char *tablename, const char *set);
|
bool is_table_in_bdr_replication_set(PGconn *conn, const char *tablename, const char *set);
|
||||||
bool add_table_to_bdr_replication_set(PGconn *conn, const char *tablename, const char *set);
|
bool add_table_to_bdr_replication_set(PGconn *conn, const char *tablename, const char *set);
|
||||||
void add_extension_tables_to_bdr_replication_set(PGconn *conn);
|
void add_extension_tables_to_bdr_replication_set(PGconn *conn);
|
||||||
|
bool bdr_node_name_matches(PGconn *conn, const char *node_name, PQExpBufferData *bdr_local_node_name);
|
||||||
bool bdr_node_exists(PGconn *conn, const char *node_name);
|
|
||||||
ReplSlotStatus get_bdr_node_replication_slot_status(PGconn *conn, const char *node_name);
|
ReplSlotStatus get_bdr_node_replication_slot_status(PGconn *conn, const char *node_name);
|
||||||
void get_bdr_other_node_name(PGconn *conn, int node_id, char *name_buf);
|
void get_bdr_other_node_name(PGconn *conn, int node_id, char *name_buf);
|
||||||
|
|
||||||
bool am_bdr_failover_handler(PGconn *conn, int node_id);
|
bool am_bdr_failover_handler(PGconn *conn, int node_id);
|
||||||
void unset_bdr_failover_handler(PGconn *conn);
|
void unset_bdr_failover_handler(PGconn *conn);
|
||||||
|
bool bdr_node_has_repmgr_set(PGconn *conn, const char *node_name);
|
||||||
|
bool bdr_node_set_repmgr_set(PGconn *conn, const char *node_name);
|
||||||
|
|
||||||
|
/* miscellaneous debugging functions */
|
||||||
|
const char *print_node_status(NodeStatus node_status);
|
||||||
|
const char *print_pqping_status(PGPing ping_status);
|
||||||
|
|
||||||
#endif /* _REPMGR_DBUTILS_H_ */
|
#endif /* _REPMGR_DBUTILS_H_ */
|
||||||
|
|||||||
208
dirutil.c
208
dirutil.c
@@ -3,7 +3,7 @@
|
|||||||
* dirmod.c
|
* dirmod.c
|
||||||
* directory handling functions
|
* directory handling functions
|
||||||
*
|
*
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
* Copyright (c) 2ndQuadrant, 2010-2018
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -21,6 +21,7 @@
|
|||||||
|
|
||||||
#include <unistd.h>
|
#include <unistd.h>
|
||||||
#include <dirent.h>
|
#include <dirent.h>
|
||||||
|
#include <signal.h>
|
||||||
#include <sys/stat.h>
|
#include <sys/stat.h>
|
||||||
#include <errno.h>
|
#include <errno.h>
|
||||||
#include <stdio.h>
|
#include <stdio.h>
|
||||||
@@ -34,34 +35,33 @@
|
|||||||
#include "dirutil.h"
|
#include "dirutil.h"
|
||||||
#include "strutil.h"
|
#include "strutil.h"
|
||||||
#include "log.h"
|
#include "log.h"
|
||||||
|
#include "controldata.h"
|
||||||
|
|
||||||
static int unlink_dir_callback(const char *fpath, const struct stat *sb, int typeflag, struct FTW *ftwbuf);
|
static int unlink_dir_callback(const char *fpath, const struct stat *sb, int typeflag, struct FTW *ftwbuf);
|
||||||
|
|
||||||
|
/* PID can be negative if backend is standalone */
|
||||||
|
typedef long pgpid_t;
|
||||||
|
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* make sure the directory either doesn't exist or is empty
|
* Check if a directory exists, and if so whether it is empty.
|
||||||
* we use this function to check the new data directory and
|
|
||||||
* the directories for tablespaces
|
|
||||||
*
|
*
|
||||||
* This is the same check initdb does on the new PGDATA dir
|
* This function is used for checking both the data directory
|
||||||
*
|
* and tablespace directories.
|
||||||
* Returns 0 if nonexistent, 1 if exists and empty, 2 if not empty,
|
|
||||||
* or -1 if trouble accessing directory
|
|
||||||
*/
|
*/
|
||||||
int
|
DataDirState
|
||||||
check_dir(char *path)
|
check_dir(char *path)
|
||||||
{
|
{
|
||||||
DIR *chkdir;
|
DIR *chkdir = NULL;
|
||||||
struct dirent *file;
|
struct dirent *file = NULL;
|
||||||
int result = 1;
|
int result = DIR_EMPTY;
|
||||||
|
|
||||||
errno = 0;
|
errno = 0;
|
||||||
|
|
||||||
chkdir = opendir(path);
|
chkdir = opendir(path);
|
||||||
|
|
||||||
if (!chkdir)
|
if (!chkdir)
|
||||||
return (errno == ENOENT) ? 0 : -1;
|
return (errno == ENOENT) ? DIR_NOENT : DIR_ERROR;
|
||||||
|
|
||||||
while ((file = readdir(chkdir)) != NULL)
|
while ((file = readdir(chkdir)) != NULL)
|
||||||
{
|
{
|
||||||
@@ -73,25 +73,15 @@ check_dir(char *path)
|
|||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
result = 2; /* not empty */
|
result = DIR_NOT_EMPTY;
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
#ifdef WIN32
|
|
||||||
|
|
||||||
/*
|
|
||||||
* This fix is in mingw cvs (runtime/mingwex/dirent.c rev 1.4), but not in
|
|
||||||
* released version
|
|
||||||
*/
|
|
||||||
if (GetLastError() == ERROR_NO_MORE_FILES)
|
|
||||||
errno = 0;
|
|
||||||
#endif
|
|
||||||
|
|
||||||
closedir(chkdir);
|
closedir(chkdir);
|
||||||
|
|
||||||
if (errno != 0)
|
if (errno != 0)
|
||||||
return -1; /* some kind of I/O error? */
|
return DIR_ERROR; /* some kind of I/O error? */
|
||||||
|
|
||||||
return result;
|
return result;
|
||||||
}
|
}
|
||||||
@@ -106,12 +96,13 @@ create_dir(char *path)
|
|||||||
if (mkdir_p(path, 0700) == 0)
|
if (mkdir_p(path, 0700) == 0)
|
||||||
return true;
|
return true;
|
||||||
|
|
||||||
log_error(_("unable to create directory \"%s\": %s"),
|
log_error(_("unable to create directory \"%s\""), path);
|
||||||
path, strerror(errno));
|
log_detail("%s", strerror(errno));
|
||||||
|
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
bool
|
bool
|
||||||
set_dir_permissions(char *path)
|
set_dir_permissions(char *path)
|
||||||
{
|
{
|
||||||
@@ -146,26 +137,6 @@ mkdir_p(char *path, mode_t omode)
|
|||||||
oumask = 0;
|
oumask = 0;
|
||||||
retval = 0;
|
retval = 0;
|
||||||
|
|
||||||
#ifdef WIN32
|
|
||||||
/* skip network and drive specifiers for win32 */
|
|
||||||
if (strlen(p) >= 2)
|
|
||||||
{
|
|
||||||
if (p[0] == '/' && p[1] == '/')
|
|
||||||
{
|
|
||||||
/* network drive */
|
|
||||||
p = strstr(p + 2, "/");
|
|
||||||
if (p == NULL)
|
|
||||||
return 1;
|
|
||||||
}
|
|
||||||
else if (p[1] == ':' &&
|
|
||||||
((p[0] >= 'a' && p[0] <= 'z') ||
|
|
||||||
(p[0] >= 'A' && p[0] <= 'Z')))
|
|
||||||
{
|
|
||||||
/* local drive */
|
|
||||||
p += 2;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
#endif
|
|
||||||
|
|
||||||
if (p[0] == '/') /* Skip leading '/'. */
|
if (p[0] == '/') /* Skip leading '/'. */
|
||||||
++p;
|
++p;
|
||||||
@@ -242,17 +213,91 @@ is_pg_dir(char *path)
|
|||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Attempt to determine if a PostgreSQL data directory is in use
|
||||||
|
* by reading the pidfile. This is the same mechanism used by
|
||||||
|
* "pg_ctl".
|
||||||
|
*
|
||||||
|
* This function will abort with appropriate log messages if a file error
|
||||||
|
* is encountered, as the user will need to address the situation before
|
||||||
|
* any further useful progress can be made.
|
||||||
|
*/
|
||||||
|
PgDirState
|
||||||
|
is_pg_running(char *path)
|
||||||
|
{
|
||||||
|
long pid;
|
||||||
|
FILE *pidf;
|
||||||
|
|
||||||
|
char pid_file[MAXPGPATH];
|
||||||
|
|
||||||
|
/* it's reasonable to assume the pidfile name will not change */
|
||||||
|
snprintf(pid_file, MAXPGPATH, "%s/postmaster.pid", path);
|
||||||
|
|
||||||
|
pidf = fopen(pid_file, "r");
|
||||||
|
if (pidf == NULL)
|
||||||
|
{
|
||||||
|
/*
|
||||||
|
* No PID file - PostgreSQL shouldn't be running. From 9.3 (the
|
||||||
|
* earliesty version we care about) removal of the PID file will
|
||||||
|
* cause the postmaster to shut down, so it's highly unlikely
|
||||||
|
* that PostgreSQL will still be running.
|
||||||
|
*/
|
||||||
|
if (errno == ENOENT)
|
||||||
|
{
|
||||||
|
return PG_DIR_NOT_RUNNING;
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
log_error(_("unable to open PostgreSQL PID file \"%s\""), pid_file);
|
||||||
|
log_detail("%s", strerror(errno));
|
||||||
|
exit(ERR_BAD_CONFIG);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
/*
|
||||||
|
* In the unlikely event we're unable to extract a PID from the PID file,
|
||||||
|
* log a warning but assume we're not dealing with a running instance
|
||||||
|
* as PostgreSQL should have shut itself down in these cases anyway.
|
||||||
|
*/
|
||||||
|
if (fscanf(pidf, "%ld", &pid) != 1)
|
||||||
|
{
|
||||||
|
/* Is the file empty? */
|
||||||
|
if (ftell(pidf) == 0 && feof(pidf))
|
||||||
|
{
|
||||||
|
log_warning(_("PostgreSQL PID file \"%s\" is empty"), path);
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
log_warning(_("invalid data in PostgreSQL PID file \"%s\""), path);
|
||||||
|
}
|
||||||
|
|
||||||
|
return PG_DIR_NOT_RUNNING;
|
||||||
|
}
|
||||||
|
|
||||||
|
fclose(pidf);
|
||||||
|
|
||||||
|
if (pid == getpid())
|
||||||
|
return PG_DIR_NOT_RUNNING;
|
||||||
|
|
||||||
|
if (pid == getppid())
|
||||||
|
return PG_DIR_NOT_RUNNING;
|
||||||
|
|
||||||
|
if (kill(pid, 0) == 0)
|
||||||
|
return PG_DIR_RUNNING;
|
||||||
|
|
||||||
|
return PG_DIR_NOT_RUNNING;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
bool
|
bool
|
||||||
create_pg_dir(char *path, bool force)
|
create_pg_dir(char *path, bool force)
|
||||||
{
|
{
|
||||||
bool pg_dir = false;
|
/* Check this directory can be used as a PGDATA dir */
|
||||||
|
|
||||||
/* Check this directory could be used as a PGDATA dir */
|
|
||||||
switch (check_dir(path))
|
switch (check_dir(path))
|
||||||
{
|
{
|
||||||
case 0:
|
case DIR_NOENT:
|
||||||
/* dir not there, must create it */
|
/* directory does not exist, attempt to create it */
|
||||||
log_info(_("creating directory \"%s\"..."), path);
|
log_info(_("creating directory \"%s\"..."), path);
|
||||||
|
|
||||||
if (!create_dir(path))
|
if (!create_dir(path))
|
||||||
@@ -262,55 +307,62 @@ create_pg_dir(char *path, bool force)
|
|||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
break;
|
break;
|
||||||
case 1:
|
case DIR_EMPTY:
|
||||||
/* Present but empty, fix permissions and use it */
|
/* exists but empty, fix permissions and use it */
|
||||||
log_info(_("checking and correcting permissions on existing directory %s"),
|
log_info(_("checking and correcting permissions on existing directory \"%s\""),
|
||||||
path);
|
path);
|
||||||
|
|
||||||
if (!set_dir_permissions(path))
|
if (!set_dir_permissions(path))
|
||||||
{
|
{
|
||||||
log_error(_("unable to change permissions of directory \"%s\":\n %s"),
|
log_error(_("unable to change permissions of directory \"%s\""), path);
|
||||||
path, strerror(errno));
|
log_detail("%s", strerror(errno));
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
break;
|
break;
|
||||||
case 2:
|
case DIR_NOT_EMPTY:
|
||||||
/* Present and not empty */
|
/* exists but is not empty */
|
||||||
log_warning(_("directory \"%s\" exists but is not empty"),
|
log_warning(_("directory \"%s\" exists but is not empty"),
|
||||||
path);
|
path);
|
||||||
|
|
||||||
pg_dir = is_pg_dir(path);
|
if (is_pg_dir(path))
|
||||||
|
|
||||||
if (pg_dir && force)
|
|
||||||
{
|
{
|
||||||
/* TODO: check DB state, if not running overwrite */
|
if (force == true)
|
||||||
|
|
||||||
if (false)
|
|
||||||
{
|
{
|
||||||
log_notice(_("deleting existing data directory \"%s\""), path);
|
log_notice(_("-F/--force provided - deleting existing data directory \"%s\""), path);
|
||||||
nftw(path, unlink_dir_callback, 64, FTW_DEPTH | FTW_PHYS);
|
nftw(path, unlink_dir_callback, 64, FTW_DEPTH | FTW_PHYS);
|
||||||
|
return true;
|
||||||
}
|
}
|
||||||
/* Let it continue */
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
else if (pg_dir && !force)
|
|
||||||
{
|
|
||||||
log_hint(_("This looks like a PostgreSQL directory.\n"
|
|
||||||
"If you are sure you want to clone here, "
|
|
||||||
"please check there is no PostgreSQL server "
|
|
||||||
"running and use the -F/--force option"));
|
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
else
|
||||||
return false;
|
{
|
||||||
default:
|
if (force == true)
|
||||||
|
{
|
||||||
|
log_notice(_("deleting existing directory \"%s\""), path);
|
||||||
|
nftw(path, unlink_dir_callback, 64, FTW_DEPTH | FTW_PHYS);
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
break;
|
||||||
|
case DIR_ERROR:
|
||||||
log_error(_("could not access directory \"%s\": %s"),
|
log_error(_("could not access directory \"%s\": %s"),
|
||||||
path, strerror(errno));
|
path, strerror(errno));
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
|
||||||
return true;
|
return true;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
int
|
||||||
|
rmdir_recursive(char *path)
|
||||||
|
{
|
||||||
|
return nftw(path, unlink_dir_callback, 64, FTW_DEPTH | FTW_PHYS);
|
||||||
|
}
|
||||||
|
|
||||||
static int
|
static int
|
||||||
unlink_dir_callback(const char *fpath, const struct stat *sb, int typeflag, struct FTW *ftwbuf)
|
unlink_dir_callback(const char *fpath, const struct stat *sb, int typeflag, struct FTW *ftwbuf)
|
||||||
{
|
{
|
||||||
|
|||||||
21
dirutil.h
21
dirutil.h
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* dirutil.h
|
* dirutil.h
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
* Copyright (c) 2ndQuadrant, 2010-2018
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -19,12 +19,29 @@
|
|||||||
#ifndef _DIRUTIL_H_
|
#ifndef _DIRUTIL_H_
|
||||||
#define _DIRUTIL_H_
|
#define _DIRUTIL_H_
|
||||||
|
|
||||||
|
typedef enum
|
||||||
|
{
|
||||||
|
DIR_ERROR = -1,
|
||||||
|
DIR_NOENT,
|
||||||
|
DIR_EMPTY,
|
||||||
|
DIR_NOT_EMPTY
|
||||||
|
} DataDirState;
|
||||||
|
|
||||||
|
typedef enum
|
||||||
|
{
|
||||||
|
PG_DIR_ERROR = -1,
|
||||||
|
PG_DIR_NOT_RUNNING,
|
||||||
|
PG_DIR_RUNNING
|
||||||
|
} PgDirState;
|
||||||
|
|
||||||
extern int mkdir_p(char *path, mode_t omode);
|
extern int mkdir_p(char *path, mode_t omode);
|
||||||
extern bool set_dir_permissions(char *path);
|
extern bool set_dir_permissions(char *path);
|
||||||
|
|
||||||
extern int check_dir(char *path);
|
extern DataDirState check_dir(char *path);
|
||||||
extern bool create_dir(char *path);
|
extern bool create_dir(char *path);
|
||||||
extern bool is_pg_dir(char *path);
|
extern bool is_pg_dir(char *path);
|
||||||
|
extern PgDirState is_pg_running(char *path);
|
||||||
extern bool create_pg_dir(char *path, bool force);
|
extern bool create_pg_dir(char *path, bool force);
|
||||||
|
extern int rmdir_recursive(char *path);
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|||||||
2
doc/.gitignore
vendored
2
doc/.gitignore
vendored
@@ -2,4 +2,6 @@ HTML.index
|
|||||||
bookindex.sgml
|
bookindex.sgml
|
||||||
html-stamp
|
html-stamp
|
||||||
html/
|
html/
|
||||||
|
nochunks.dsl
|
||||||
|
repmgr.html
|
||||||
version.sgml
|
version.sgml
|
||||||
|
|||||||
@@ -10,7 +10,7 @@ SGMLINCLUDE = -D . -D ${srcdir}
|
|||||||
|
|
||||||
SPFLAGS += -wall -wno-unused-param -wno-empty -wfully-tagged
|
SPFLAGS += -wall -wno-unused-param -wno-empty -wfully-tagged
|
||||||
|
|
||||||
JADE.html.call = $(JADE) $(JADEFLAGS) $(SPFLAGS) $(SGMLINCLUDE) $(CATALOG) -d stylesheet.dsl -t sgml -i output-html
|
JADE.html.call = $(JADE) $(JADEFLAGS) $(SPFLAGS) $(SGMLINCLUDE) $(CATALOG) -t sgml -i output-html
|
||||||
|
|
||||||
ALLSGML := $(wildcard $(srcdir)/*.sgml)
|
ALLSGML := $(wildcard $(srcdir)/*.sgml)
|
||||||
# to build bookindex
|
# to build bookindex
|
||||||
@@ -26,10 +26,15 @@ html: html-stamp
|
|||||||
|
|
||||||
html-stamp: repmgr.sgml $(ALLSGML) $(GENERATED_SGML) stylesheet.dsl website-docs.css
|
html-stamp: repmgr.sgml $(ALLSGML) $(GENERATED_SGML) stylesheet.dsl website-docs.css
|
||||||
$(MKDIR_P) html
|
$(MKDIR_P) html
|
||||||
$(JADE.html.call) -i include-index $<
|
$(JADE.html.call) -d stylesheet.dsl -i include-index $<
|
||||||
cp $(srcdir)/stylesheet.css $(srcdir)/website-docs.css html/
|
cp $(srcdir)/stylesheet.css $(srcdir)/website-docs.css html/
|
||||||
touch $@
|
touch $@
|
||||||
|
|
||||||
|
repmgr.html: repmgr.sgml $(ALLSGML) $(GENERATED_SGML) stylesheet.dsl website-docs.css
|
||||||
|
sed '/html-index-filename/a\
|
||||||
|
(define nochunks #t)' <stylesheet.dsl >nochunks.dsl
|
||||||
|
$(JADE.html.call) -d nochunks.dsl -i include-index $< >repmgr.html
|
||||||
|
|
||||||
version.sgml: ${repmgr_top_builddir}/repmgr_version.h
|
version.sgml: ${repmgr_top_builddir}/repmgr_version.h
|
||||||
{ \
|
{ \
|
||||||
echo "<!ENTITY repmgrversion \"$(REPMGR_VERSION)\">"; \
|
echo "<!ENTITY repmgrversion \"$(REPMGR_VERSION)\">"; \
|
||||||
@@ -37,7 +42,7 @@ version.sgml: ${repmgr_top_builddir}/repmgr_version.h
|
|||||||
|
|
||||||
HTML.index: repmgr.sgml $(ALMOSTALLSGML) stylesheet.dsl
|
HTML.index: repmgr.sgml $(ALMOSTALLSGML) stylesheet.dsl
|
||||||
@$(MKDIR_P) html
|
@$(MKDIR_P) html
|
||||||
$(JADE.html.call) -V html-index $<
|
$(JADE.html.call) -d stylesheet.dsl -V html-index $<
|
||||||
|
|
||||||
website-docs.css:
|
website-docs.css:
|
||||||
@$(MKDIR_P) html
|
@$(MKDIR_P) html
|
||||||
|
|||||||
357
doc/appendix-faq.sgml
Normal file
357
doc/appendix-faq.sgml
Normal file
@@ -0,0 +1,357 @@
|
|||||||
|
<appendix id="appendix-faq" xreflabel="FAQ">
|
||||||
|
<indexterm>
|
||||||
|
<primary>FAQ (Frequently Asked Questions)</primary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<title>FAQ (Frequently Asked Questions)</title>
|
||||||
|
|
||||||
|
<sect1 id="faq-general" xreflabel="General">
|
||||||
|
<title>General</title>
|
||||||
|
|
||||||
|
<sect2 id="faq-xrepmgr-version-diff" xreflabel="Version differences">
|
||||||
|
<title>What's the difference between the repmgr versions?</title>
|
||||||
|
<para>
|
||||||
|
&repmgr; 4 is a complete rewrite of the existing &repmgr; code base
|
||||||
|
and implements &repmgr; as a PostgreSQL extension. It
|
||||||
|
supports all PostgreSQL versions from 9.3 (although some &repmgr;
|
||||||
|
features are not available for PostgreSQL 9.3 and 9.4).
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
&repmgr; 3.x builds on the improved replication facilities added
|
||||||
|
in PostgreSQL 9.3, as well as improved automated failover support
|
||||||
|
via <application>repmgrd</application>, and is not compatible with PostgreSQL 9.2
|
||||||
|
and earlier. We recommend upgrading to &repmgr; 4, as the &repmgr; 3.x
|
||||||
|
series will no longer be actively maintained.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
&repmgr; 2.x supports PostgreSQL 9.0 ~ 9.3. While it is compatible
|
||||||
|
with PostgreSQL 9.3, we recommend using repmgr 4.x. &repmgr; 2.x is
|
||||||
|
no longer maintained.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-replication-slots-advantage" xreflabel="Advantages of replication slots">
|
||||||
|
<title>What's the advantage of using replication slots?</title>
|
||||||
|
<para>
|
||||||
|
Replication slots, introduced in PostgreSQL 9.4, ensure that the
|
||||||
|
primary server will retain WAL files until they have been consumed
|
||||||
|
by all standby servers. This makes WAL file management much easier,
|
||||||
|
and if used &repmgr; will no longer insist on a fixed minimum number
|
||||||
|
(default: 5000) of WAL files being retained.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
However this does mean that if a standby is no longer connected to the
|
||||||
|
primary, the presence of the replication slot will cause WAL files
|
||||||
|
to be retained indefinitely.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-replication-slots-number" xreflabel="Number of replication slots">
|
||||||
|
<title>How many replication slots should I define in <varname>max_replication_slots</varname>?</title>
|
||||||
|
<para>
|
||||||
|
Normally at least same number as the number of standbys which will connect
|
||||||
|
to the node. Note that changes to <varname>max_replication_slots</varname> require a server
|
||||||
|
restart to take effect, and as there is no particular penalty for unused
|
||||||
|
replication slots, setting a higher figure will make adding new nodes
|
||||||
|
easier.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-hash-index" xreflabel="Hash indexes">
|
||||||
|
<title>Does &repmgr; support hash indexes?</title>
|
||||||
|
<para>
|
||||||
|
Before PostgreSQL 10, hash indexes were not WAL logged and are therefore not suitable
|
||||||
|
for use in streaming replication in PostgreSQL 9.6 and earlier. See the
|
||||||
|
<ulink url="https://www.postgresql.org/docs/9.6/static/sql-createindex.html#AEN80279">PostgreSQL documentation</ulink>
|
||||||
|
for details.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
From PostgreSQL 10, this restriction has been lifted and hash indexes can be used
|
||||||
|
in a streaming replication cluster.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-upgrades" xreflabel="Upgrading PostgreSQL with repmgr">
|
||||||
|
<title>Can &repmgr; assist with upgrading a PostgreSQL cluster?</title>
|
||||||
|
<para>
|
||||||
|
For <emphasis>minor</emphasis> version upgrades, e.g. from 9.6.7 to 9.6.8, a common
|
||||||
|
approach is to upgrade a standby to the latest version, perform a
|
||||||
|
<link linkend="performing-switchover">switchover</link> promoting it to a primary,
|
||||||
|
then upgrade the former primary.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
For <emphasis>major</emphasis> version upgrades (e.g. from PostgreSQL 9.6 to PostgreSQL 10),
|
||||||
|
the traditional approach is to "reseed" a cluster by upgrading a single
|
||||||
|
node with <ulink url="https://www.postgresql.org/docs/current/static/pgupgrade.html">pg_upgrade</ulink>
|
||||||
|
and recloning standbys from this.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
To minimize downtime during major upgrades, for more recent PostgreSQL
|
||||||
|
versions (PostgreSQL 9.4 and later),
|
||||||
|
<ulink url="https://www.2ndquadrant.com/en/resources/pglogical/">pglogical</ulink>
|
||||||
|
can be used to set up a parallel cluster using the newer PostgreSQL version,
|
||||||
|
which can be kept in sync with the existing production cluster until the
|
||||||
|
new cluster is ready to be put into production.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-libdir-repmgr-error">
|
||||||
|
<title>What does this error mean: <literal>ERROR: could not access file "$libdir/repmgr"</literal>?</title>
|
||||||
|
<para>
|
||||||
|
It means the &repmgr; extension code is not installed in the
|
||||||
|
PostgreSQL application directory. This typically happens when using PostgreSQL
|
||||||
|
packages provided by a third-party vendor, which often have different
|
||||||
|
filesystem layouts.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Either use PostgreSQL packages provided by the community or 2ndQuadrant; if this
|
||||||
|
is not possible, contact your vendor for assistance.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-old-packages">
|
||||||
|
<title>How can I obtain old versions of &repmgr; packages?</title>
|
||||||
|
<para>
|
||||||
|
See appendix <xref linkend="packages-old-versions"> for details.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
</sect1>
|
||||||
|
|
||||||
|
<sect1 id="faq-repmgr" xreflabel="repmgr">
|
||||||
|
<title><command>repmgr</command></title>
|
||||||
|
|
||||||
|
<sect2 id="faq-register-existing-node" xreflabel="registering an existing node">
|
||||||
|
<title>Can I register an existing PostgreSQL server with repmgr?</title>
|
||||||
|
<para>
|
||||||
|
Yes, any existing PostgreSQL server which is part of the same replication
|
||||||
|
cluster can be registered with &repmgr;. There's no requirement for a
|
||||||
|
standby to have been cloned using &repmgr;.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-repmgr-clone-other-source" >
|
||||||
|
<title>Can I use a standby not cloned by &repmgr; as a &repmgr; node?</title>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
For a standby which has been manually cloned or recovered from an external
|
||||||
|
backup manager such as Barman, the command
|
||||||
|
<command><link linkend="repmgr-standby-clone">repmgr standby clone --recovery-conf-only</link></command>
|
||||||
|
can be used to create the correct <filename>recovery.conf</filename> file for
|
||||||
|
use with &repmgr; (and will create a replication slot if required). Once this has been done,
|
||||||
|
<link linkend="repmgr-standby-register">register the node</link> as usual.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-repmgr-recovery-conf" >
|
||||||
|
<title>What does &repmgr; write in <filename>recovery.conf</filename>, and what options can be set there?</title>
|
||||||
|
<para>
|
||||||
|
See section <link linkend="repmgr-standby-clone-recovery-conf">Customising recovery.conf</link>.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-repmgr-failed-primary-standby" xreflabel="Reintegrate a failed primary as a standby">
|
||||||
|
<title>How can a failed primary be re-added as a standby?</title>
|
||||||
|
<para>
|
||||||
|
This is a two-stage process. First, the failed primary's data directory
|
||||||
|
must be re-synced with the current primary; secondly the failed primary
|
||||||
|
needs to be re-registered as a standby.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
It's possible to use <command>pg_rewind</command> to re-synchronise the existing data
|
||||||
|
directory, which will usually be much
|
||||||
|
faster than re-cloning the server. However <command>pg_rewind</command> can only
|
||||||
|
be used if PostgreSQL either has <varname>wal_log_hints</varname> enabled, or
|
||||||
|
data checksums were enabled when the cluster was initialized.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Note that <command>pg_rewind</command> is available as part of the core PostgreSQL
|
||||||
|
distribution from PostgreSQL 9.5, and as a third-party utility for PostgreSQL 9.3 and 9.4.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
&repmgr; provides the command <command>repmgr node rejoin</command> which can
|
||||||
|
optionally execute <command>pg_rewind</command>; see the <xref linkend="repmgr-node-rejoin">
|
||||||
|
documentation for details, in particular the section <xref linkend="repmgr-node-rejoin-pg-rewind">.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
If <command>pg_rewind</command> cannot be used, then the data directory will need
|
||||||
|
to be re-cloned from scratch.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-repmgr-check-configuration" xreflabel="Check PostgreSQL configuration">
|
||||||
|
<title>Is there an easy way to check my primary server is correctly configured for use with &repmgr;?</title>
|
||||||
|
<para>
|
||||||
|
Execute <command><link linkend="repmgr-standby-clone">repmgr standby clone</link></command>
|
||||||
|
with the <literal>--dry-run</literal> option; this will report any configuration problems
|
||||||
|
which need to be rectified.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-repmgr-clone-skip-config-files" xreflabel="">
|
||||||
|
<title>When cloning a standby, how can I get &repmgr; to copy
|
||||||
|
<filename>postgresql.conf</filename> and <filename>pg_hba.conf</filename> from the PostgreSQL configuration
|
||||||
|
directory in <filename>/etc</filename>?</title>
|
||||||
|
<para>
|
||||||
|
Use the command line option <literal>--copy-external-config-files</literal>. For more details
|
||||||
|
see <xref linkend="repmgr-standby-clone-config-file-copying">.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-repmgr-shared-preload-libaries-no-repmgrd" xreflabel="shared_preload_libraries without repmgrd">
|
||||||
|
<title>Do I need to include <literal>shared_preload_libraries = 'repmgr'</literal>
|
||||||
|
in <filename>postgresql.conf</filename> if I'm not using <application>repmgrd</application>?</title>
|
||||||
|
<para>
|
||||||
|
No, the <literal>repmgr</literal> shared library is only needed when running <application>repmgrd</application>.
|
||||||
|
If you later decide to run <application>repmgrd</application>, you just need to add
|
||||||
|
<literal>shared_preload_libraries = 'repmgr'</literal> and restart PostgreSQL.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-repmgr-permissions" xreflabel="Replication permission problems">
|
||||||
|
<title>I've provided replication permission for the <literal>repmgr</literal> user in <filename>pg_hba.conf</filename>
|
||||||
|
but <command>repmgr</command>/<application>repmgrd</application> complains it can't connect to the server... Why?</title>
|
||||||
|
<para>
|
||||||
|
<command>repmgr</command> and <application>repmgrd</application> need to be able to connect to the repmgr database
|
||||||
|
with a normal connection to query metadata. The <literal>replication</literal> connection
|
||||||
|
permission is for PostgreSQL's streaming replication (and doesn't necessarily need to be the <literal>repmgr</literal> user).
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-repmgr-clone-provide-primary-conninfo" xreflabel="Providing primary connection parameters">
|
||||||
|
<title>When cloning a standby, why do I need to provide the connection parameters
|
||||||
|
for the primary server on the command line, not in the configuration file?</title>
|
||||||
|
<para>
|
||||||
|
Cloning a standby is a one-time action; the role of the server being cloned
|
||||||
|
from could change, so fixing it in the configuration file would create
|
||||||
|
confusion. If &repmgr; needs to establish a connection to the primary
|
||||||
|
server, it can retrieve this from the <literal>repmgr.nodes</literal> table on the local
|
||||||
|
node, and if necessary scan the replication cluster until it locates the active primary.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-repmgr-clone-waldir-xlogdir" xreflabel="Providing a custom WAL directory">
|
||||||
|
<title>When cloning a standby, how do I ensure the WAL files are placed in a custom directory?</title>
|
||||||
|
<para>
|
||||||
|
Provide the option <literal>--waldir</literal> (<literal>--xlogdir</literal> in PostgreSQL 9.6
|
||||||
|
and earlier) with the absolute path to the WAL directory in <varname>pg_basebackup_options</varname>.
|
||||||
|
For more details see <xref linkend="cloning-advanced-pg-basebackup-options">.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-repmgr-events-no-fkey" xreflabel="No foreign key on node_id in repmgr.events">
|
||||||
|
<title>Why is there no foreign key on the <literal>node_id</literal> column in the <literal>repmgr.events</literal>
|
||||||
|
table?</title>
|
||||||
|
<para>
|
||||||
|
Under some circumstances event notifications can be generated for servers
|
||||||
|
which have not yet been registered; it's also useful to retain a record
|
||||||
|
of events which includes servers removed from the replication cluster
|
||||||
|
which no longer have an entry in the <literal>repmgr.nodes</literal> table.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-repmgr-recovery-conf-quoted-values" xreflabel="Quoted values in recovery.conf">
|
||||||
|
<title>Why are some values in <filename>recovery.conf</filename> surrounded by pairs of single quotes?</title>
|
||||||
|
<para>
|
||||||
|
This is to ensure that user-supplied values which are written as parameter values in <filename>recovery.conf</filename>
|
||||||
|
are escaped correctly and do not cause errors when <filename>recovery.conf</filename> is parsed.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
The escaping is performed by an internal PostgreSQL routine, which leaves strings consisting
|
||||||
|
of digits and alphabetical characters only as-is, but wraps everything else in pairs of single quotes,
|
||||||
|
even if the string does not contain any characters which need escaping.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
|
||||||
|
</sect1>
|
||||||
|
|
||||||
|
<sect1 id="faq-repmgrd" xreflabel="repmgrd">
|
||||||
|
<title><application>repmgrd</application></title>
|
||||||
|
|
||||||
|
|
||||||
|
<sect2 id="faq-repmgrd-prevent-promotion" xreflabel="Prevent standby from being promoted to primary">
|
||||||
|
<title>How can I prevent a node from ever being promoted to primary?</title>
|
||||||
|
<para>
|
||||||
|
In <filename>repmgr.conf</filename>, set its priority to a value of <literal>0</literal>; apply the changed setting with
|
||||||
|
<command><link linkend="repmgr-standby-register">repmgr standby register --force</link></command>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Additionally, if <varname>failover</varname> is set to <literal>manual</literal>, the node will never
|
||||||
|
be considered as a promotion candidate.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-repmgrd-delayed-standby" xreflabel="Delayed standby support">
|
||||||
|
<title>Does <application>repmgrd</application> support delayed standbys?</title>
|
||||||
|
<para>
|
||||||
|
<application>repmgrd</application> can monitor delayed standbys - those set up with
|
||||||
|
<varname>recovery_min_apply_delay</varname> set to a non-zero value
|
||||||
|
in <filename>recovery.conf</filename> - but as it's not currently possible
|
||||||
|
to directly examine the value applied to the standby, <application>repmgrd</application>
|
||||||
|
may not be able to properly evaluate the node as a promotion candidate.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
We recommend that delayed standbys are explicitly excluded from promotion
|
||||||
|
by setting <varname>priority</varname> to <literal>0</literal> in
|
||||||
|
<filename>repmgr.conf</filename>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Note that after registering a delayed standby, <application>repmgrd</application> will only start
|
||||||
|
once the metadata added in the primary node has been replicated.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-repmgrd-logfile-rotate" xreflabel="repmgrd logfile rotation">
|
||||||
|
<title>How can I get <application>repmgrd</application> to rotate its logfile?</title>
|
||||||
|
<para>
|
||||||
|
Configure your system's <literal>logrotate</literal> service to do this; see <xref linkend="repmgrd-log-rotation">.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-repmgrd-recloned-no-start" xreflabel="repmgrd not restarting after node cloned">
|
||||||
|
<title>I've recloned a failed primary as a standby, but <application>repmgrd</application> refuses to start?</title>
|
||||||
|
<para>
|
||||||
|
Check you registered the standby after recloning. If unregistered, the standby
|
||||||
|
cannot be considered as a promotion candidate even if <varname>failover</varname> is set to
|
||||||
|
<literal>automatic</literal>, which is probably not what you want. <application>repmgrd</application> will start if
|
||||||
|
<varname>failover</varname> is set to <literal>manual</literal> so the node's replication status can still
|
||||||
|
be monitored, if desired.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-repmgrd-pg-bindir" xreflabel="repmgrd does not apply pg_bindir to promote_command or follow_command">
|
||||||
|
<title>
|
||||||
|
<application>repmgrd</application> ignores pg_bindir when executing <varname>promote_command</varname> or <varname>follow_command</varname>
|
||||||
|
</title>
|
||||||
|
<para>
|
||||||
|
<varname>promote_command</varname> or <varname>follow_command</varname> can be user-defined scripts,
|
||||||
|
so &repmgr; will not apply <option>pg_bindir</option> even if excuting &repmgr;. Always provide the full
|
||||||
|
path; see <xref linkend="repmgrd-automatic-failover-configuration"> for more details.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="faq-repmgrd-startup-no-upstream" xreflabel="repmgrd does not start if upstream node is not running">
|
||||||
|
<title>
|
||||||
|
<application>repmgrd</application> aborts startup with the error "<literal>upstream node must be running before repmgrd can start</literal>"
|
||||||
|
</title>
|
||||||
|
<para>
|
||||||
|
<application>repmgrd</application> does this to avoid starting up on a replication cluster
|
||||||
|
which is not in a healthy state. If the upstream is unavailable, <application>repmgrd</application>
|
||||||
|
may initiate a failover immediately after starting up, which could have unintended side-effects,
|
||||||
|
particularly if <application>repmgrd</application> is not running on other nodes.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
In particular, it's possible that the node's local copy of the <literal>repmgr.nodes</literal> copy
|
||||||
|
is out-of-date, which may lead to incorrect failover behaviour.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
The onus is therefore on the adminstrator to manually set the cluster to a stable, healthy state before
|
||||||
|
starting <application>repmgrd</application>.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
</sect1>
|
||||||
|
</appendix>
|
||||||
562
doc/appendix-packages.sgml
Normal file
562
doc/appendix-packages.sgml
Normal file
@@ -0,0 +1,562 @@
|
|||||||
|
<appendix id="appendix-packages" xreflabel="Package details">
|
||||||
|
<indexterm>
|
||||||
|
<primary>packages</primary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<title>&repmgr; package details</title>
|
||||||
|
<para>
|
||||||
|
This section provides technical details about various &repmgr; binary
|
||||||
|
packages, such as location of the installed binaries and
|
||||||
|
configuration files.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<sect1 id="packages-centos" xreflabel="CentOS packages">
|
||||||
|
<title>CentOS Packages</title>
|
||||||
|
|
||||||
|
<indexterm>
|
||||||
|
<primary>packages</primary>
|
||||||
|
<secondary>CentOS packages</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<indexterm>
|
||||||
|
<primary>CentOS</primary>
|
||||||
|
<secondary>package information</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
Currently, &repmgr; RPM packages are provided for versions 6.x and 7.x of CentOS. These should also
|
||||||
|
work on matching versions of Red Hat Enterprise Linux, Scientific Linux and Oracle Enterprise Linux;
|
||||||
|
together with CentOS, these are the same RedHat-based distributions for which the main community project
|
||||||
|
(PGDG) provides packages (see the <ulink url="https://yum.postgresql.org/">PostgreSQL RPM Building Project</ulink>
|
||||||
|
page for details).
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
Note these &repmgr; RPM packages are not designed to work with SuSE/OpenSuSE.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
&repmgr; packages are designed to be compatible with community-provided PostgreSQL packages.
|
||||||
|
They may not work with vendor-specific packages such as those provided by RedHat for RHEL
|
||||||
|
customers, as the filesystem layout may be different to the community RPMs.
|
||||||
|
Please contact your support vendor for assistance.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
<sect2 id="packages-centos-repositories">
|
||||||
|
<title>CentOS repositories</title>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
&repmgr; packages are available from the public 2ndQuadrant repository, and also the
|
||||||
|
PostgreSQL community repository. The 2ndQuadrant repository is updated immediately
|
||||||
|
after each
|
||||||
|
&repmgr; release.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<table id="centos-2ndquadrant-repository">
|
||||||
|
<title>2ndQuadrant public repository</title>
|
||||||
|
<tgroup cols="2">
|
||||||
|
<tbody>
|
||||||
|
<row>
|
||||||
|
<entry>Repository URL:</entry>
|
||||||
|
<entry><ulink url="https://dl.2ndquadrant.com/">https://dl.2ndquadrant.com/</ulink></entry>
|
||||||
|
</row>
|
||||||
|
<row>
|
||||||
|
<entry>Repository documentation:</entry>
|
||||||
|
<entry><ulink url="https://repmgr.org/docs/4.1/installation-packages.html#INSTALLATION-PACKAGES-REDHAT-2NDQ">https://repmgr.org/docs/4.1/installation-packages.html#INSTALLATION-PACKAGES-REDHAT-2NDQ</ulink></entry>
|
||||||
|
</row>
|
||||||
|
</tbody>
|
||||||
|
</tgroup>
|
||||||
|
</table>
|
||||||
|
|
||||||
|
<table id="centos-pgdg-repository">
|
||||||
|
<title>PostgreSQL community repository (PGDG)</title>
|
||||||
|
<tgroup cols="2">
|
||||||
|
<tbody>
|
||||||
|
<row>
|
||||||
|
<entry>Repository URL:</entry>
|
||||||
|
<entry><ulink url="https://yum.postgresql.org/repopackages.php">https://yum.postgresql.org/repopackages.php</ulink></entry>
|
||||||
|
</row>
|
||||||
|
<row>
|
||||||
|
<entry>Repository documentation:</entry>
|
||||||
|
<entry><ulink url="https://yum.postgresql.org/">https://yum.postgresql.org/</ulink></entry>
|
||||||
|
</row>
|
||||||
|
</tbody>
|
||||||
|
</tgroup>
|
||||||
|
</table>
|
||||||
|
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="packages-centos-details">
|
||||||
|
<title>CentOS package details</title>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
The two tables below list relevant information, paths, commands etc. for the &repmgr; packages on
|
||||||
|
CentOS 7 (with systemd) and CentOS 6 (no systemd). Substitute the appropriate PostgreSQL major
|
||||||
|
version number for your installation.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
For PostgreSQL 9.6 and lower, the CentOS packages use a mixture of <literal>9.6</literal>
|
||||||
|
and <literal>96</literal> in various places to designate the major version; e.g. the
|
||||||
|
package name is <literal>repmgr96</literal>, but the binary directory is
|
||||||
|
<filename>/var/lib/pgsql/9.6/data</filename>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
From PostgreSQL 10, the first part of the version number (e.g. <literal>10</literal>) is
|
||||||
|
the major version, so there is more consistency in file/path/package naming
|
||||||
|
(package <literal>repmgr10</literal>, binary directory <filename>/var/lib/pgsql/10/data</filename>).
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
|
||||||
|
<table id="centos-7-packages">
|
||||||
|
<title>CentOS 7 packages</title>
|
||||||
|
|
||||||
|
<tgroup cols="2">
|
||||||
|
<tbody>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>Package name example:</entry>
|
||||||
|
<entry><filename>repmgr10-4.0.4-1.rhel7.x86_64</filename></entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>Metapackage:</entry>
|
||||||
|
<entry>(none)</entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>Installation command:</entry>
|
||||||
|
<entry><literal>yum install repmgr10</literal></entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>Binary location:</entry>
|
||||||
|
<entry><filename>/usr/pgsql-10/bin</filename></entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>repmgr in default path:</entry>
|
||||||
|
<entry>NO</entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>Configuration file location:</entry>
|
||||||
|
<entry><filename>/etc/repmgr/10/repmgr.conf</filename></entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>Data directory:</entry>
|
||||||
|
<entry><filename>/var/lib/pgsql/10/data</filename></entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>repmgrd service command:</entry>
|
||||||
|
<entry><command>systemctl [start|stop|restart|reload] repmgr10</command></entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>repmgrd service file location:</entry>
|
||||||
|
<entry><filename>/usr/lib/systemd/system/repmgr10.service</filename></entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>repmgrd log file location:</entry>
|
||||||
|
<entry>(not specified by package; set in <filename>repmgr.conf</filename>)</entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
</tbody>
|
||||||
|
</tgroup>
|
||||||
|
</table>
|
||||||
|
|
||||||
|
<table id="centos-6-packages">
|
||||||
|
<title>CentOS 6 packages</title>
|
||||||
|
|
||||||
|
<tgroup cols="2">
|
||||||
|
<tbody>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>Package name example:</entry>
|
||||||
|
<entry><filename>repmgr96-4.0.4-1.rhel6.x86_64</filename></entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>Metapackage:</entry>
|
||||||
|
<entry>(none)</entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>Installation command:</entry>
|
||||||
|
<entry><literal>yum install repmgr96</literal></entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>Binary location:</entry>
|
||||||
|
<entry><filename>/usr/pgsql-9.6/bin</filename></entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>repmgr in default path:</entry>
|
||||||
|
<entry>NO</entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>Configuration file location:</entry>
|
||||||
|
<entry><filename>/etc/repmgr/9.6/repmgr.conf</filename></entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>Data directory:</entry>
|
||||||
|
<entry><filename>/var/lib/pgsql/9.6/data</filename></entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>repmgrd service command:</entry>
|
||||||
|
<entry><literal>service [start|stop|restart|reload] repmgr-9.6</literal></entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>repmgrd service file location:</entry>
|
||||||
|
<entry><literal>/etc/init.d/repmgr-9.6</literal></entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>repmgrd log file location:</entry>
|
||||||
|
<entry><filename>/var/log/repmgr/repmgrd-9.6.log</filename></entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
</tbody>
|
||||||
|
</tgroup>
|
||||||
|
</table>
|
||||||
|
|
||||||
|
</sect2>
|
||||||
|
</sect1>
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
<sect1 id="packages-debian-ubuntu" xreflabel="Debian/Ubuntu packages">
|
||||||
|
<title>Debian/Ubuntu Packages</title>
|
||||||
|
<indexterm>
|
||||||
|
<primary>packages</primary>
|
||||||
|
<secondary>Debian/Ubuntu packages</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<indexterm>
|
||||||
|
<primary>Debian/Ubuntu</primary>
|
||||||
|
<secondary>package information</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
&repmgr; <literal>.deb</literal> packages are provided via the
|
||||||
|
PostgreSQL Community APT repository, and are available for each community-supported
|
||||||
|
PostgreSQL version, currently supported Debian releases, and currently supported
|
||||||
|
Ubuntu LTS releases.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<sect2 id="packages-apt-repository">
|
||||||
|
<title>APT repository</title>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
&repmgr; packages are available from the PostgreSQL Community APT repository,
|
||||||
|
which is updated immediately after each &repmgr; release.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
|
||||||
|
<table id="apt-2ndquadrant-repository">
|
||||||
|
<title>2ndQuadrant public repository</title>
|
||||||
|
<tgroup cols="2">
|
||||||
|
<tbody>
|
||||||
|
<row>
|
||||||
|
<entry>Repository URL:</entry>
|
||||||
|
<entry><ulink url="https://dl.2ndquadrant.com/">https://dl.2ndquadrant.com/</ulink></entry>
|
||||||
|
</row>
|
||||||
|
<row>
|
||||||
|
<entry>Repository documentation:</entry>
|
||||||
|
<entry><ulink url="https://repmgr.org/docs/4.1/installation-packages.html#INSTALLATION-PACKAGES-DEBIAN">https://repmgr.org/docs/4.1/installation-packages.html#INSTALLATION-PACKAGES-DEBIAN</ulink></entry>
|
||||||
|
</row>
|
||||||
|
</tbody>
|
||||||
|
</tgroup>
|
||||||
|
</table>
|
||||||
|
|
||||||
|
|
||||||
|
<table id="apt-repository">
|
||||||
|
<title>PostgreSQL Community APT repository (PGDG)</title>
|
||||||
|
<tgroup cols="2">
|
||||||
|
<tbody>
|
||||||
|
<row>
|
||||||
|
<entry>Repository URL:</entry>
|
||||||
|
<entry><ulink url="http://apt.postgresql.org/">http://apt.postgresql.org/</ulink></entry>
|
||||||
|
</row>
|
||||||
|
<row>
|
||||||
|
<entry>Repository documentation:</entry>
|
||||||
|
<entry><ulink url="https://wiki.postgresql.org/wiki/Apt)">https://wiki.postgresql.org/wiki/Apt)</ulink></entry>
|
||||||
|
</row>
|
||||||
|
</tbody>
|
||||||
|
</tgroup>
|
||||||
|
</table>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="packages-debian-details">
|
||||||
|
<title>Debian/Ubuntu package details</title>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
The table below lists relevant information, paths, commands etc. for the &repmgr; packages on
|
||||||
|
Debian 9.x ("Stretch"). Substitute the appropriate PostgreSQL major
|
||||||
|
version number for your installation.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
See also <xref linkend="repmgrd-configuration-debian-ubuntu"> for some specifics related
|
||||||
|
to configuring the <application>repmgrd</application> daemon.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<table id="debian-9-packages">
|
||||||
|
<title>Debian 9.x packages</title>
|
||||||
|
|
||||||
|
<tgroup cols="2">
|
||||||
|
<tbody>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>Package name example:</entry>
|
||||||
|
<entry><filename>postgresql-10-repmgr</filename></entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>Metapackage:</entry>
|
||||||
|
<entry><filename>repmgr-common</filename></entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>Installation command:</entry>
|
||||||
|
<entry><literal>apt-get install postgresql-10-repmgr</literal></entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>Binary location:</entry>
|
||||||
|
<entry><filename>/usr/lib/postgresql/10/bin</filename></entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>repmgr in default path:</entry>
|
||||||
|
<entry>Yes (via wrapper script <filename>/usr/bin/repmgr</filename>)</entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>Configuration file location:</entry>
|
||||||
|
<entry>(not set by package)</entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>Data directory:</entry>
|
||||||
|
<entry><filename>/var/lib/postgresql/10/main</filename></entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>PostgreSQL service command:</entry>
|
||||||
|
<entry><command>systemctl [start|stop|restart|reload] postgresql@10-main</command></entry>
|
||||||
|
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>repmgrd service command:</entry>
|
||||||
|
<entry><command>systemctl [start|stop|restart|reload] repmgrd</command></entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>repmgrd service file location:</entry>
|
||||||
|
<entry><filename>/etc/init.d/repmgrd</filename> (defaults in: <filename>/etc/defaults/repmgrd</filename>)</entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
<row>
|
||||||
|
<entry>repmgrd log file location:</entry>
|
||||||
|
<entry>(not specified by package; set in <filename>repmgr.conf</filename>)</entry>
|
||||||
|
</row>
|
||||||
|
|
||||||
|
</tbody>
|
||||||
|
</tgroup>
|
||||||
|
</table>
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
Instead of using the <application>systemd</application> service command directly,
|
||||||
|
it's recommended to execute <command>pg_ctlcluster</command> (as <literal>root</literal>,
|
||||||
|
either directly or via <command>sudo</command>), e.g.:
|
||||||
|
<programlisting>
|
||||||
|
<command>pg_ctlcluster 10 main [start|stop|restart|reload]</command></programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
For pre-<application>systemd</application> systems, <command>pg_ctlcluster</command>
|
||||||
|
can be executed directly by the <literal>postgres</literal> user.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
</sect1>
|
||||||
|
|
||||||
|
<sect1 id="packages-snapshot" xreflabel="Snapshot packages">
|
||||||
|
<title>Snapshot packages</title>
|
||||||
|
<indexterm>
|
||||||
|
<primary>snapshot packages</primary>
|
||||||
|
</indexterm>
|
||||||
|
<indexterm>
|
||||||
|
<primary>packages</primary>
|
||||||
|
<secondary>snaphots</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
For testing new features and bug fixes, from time to time 2ndQuadrant provides
|
||||||
|
so-called "snapshot packages" via its public repository. These packages
|
||||||
|
are built from the &repmgr; source at a particular point in time, and are not formal
|
||||||
|
releases.
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
We do not recommend installing these packages in a production environment
|
||||||
|
unless specifically advised.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
<para>
|
||||||
|
To install a snapshot package, it's necessary to install the 2ndQuadrant public snapshot repository,
|
||||||
|
following the instructions here: <ulink url="https://dl.2ndquadrant.com/default/release/site/">https://dl.2ndquadrant.com/default/release/site/</ulink> but replace <literal>release</literal> with <literal>snapshot</literal>
|
||||||
|
in the appropriate URL.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
For example, to install the snapshot RPM repository for PostgreSQL 9.6, execute (as <literal>root</literal>):
|
||||||
|
<programlisting>
|
||||||
|
curl https://dl.2ndquadrant.com/default/snapshot/get/9.6/rpm | bash</programlisting>
|
||||||
|
|
||||||
|
or as a normal user with root sudo access:
|
||||||
|
<programlisting>
|
||||||
|
curl https://dl.2ndquadrant.com/default/snapshot/get/9.6/rpm | sudo bash</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Alternatively you can browse the repository here:
|
||||||
|
<ulink url="https://dl.2ndquadrant.com/default/snapshot/browse/">https://dl.2ndquadrant.com/default/snapshot/browse/</ulink>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Once the repository is installed, installing or updating &repmgr; will result in the latest snapshot
|
||||||
|
package being installed.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
The package name will be formatted like this:
|
||||||
|
<programlisting>
|
||||||
|
repmgr96-4.1.1-0.0git320.g5113ab0.1.el7.x86_64.rpm</programlisting>
|
||||||
|
containg the snapshot build number (here: <literal>320</literal>) and the hash
|
||||||
|
of the <application>git</application> commit it was built from (here: <literal>g5113ab0</literal>).
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
Note that the next formal release (in the above example <literal>4.1.1</literal>), once available,
|
||||||
|
will install in place of any snapshot builds.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
</sect1>
|
||||||
|
|
||||||
|
<sect1 id="packages-old-versions" xreflabel="Installing old package versions">
|
||||||
|
<title>Installing old package versions</title>
|
||||||
|
<indexterm>
|
||||||
|
<primary>old packages</primary>
|
||||||
|
</indexterm>
|
||||||
|
<indexterm>
|
||||||
|
<primary>packages</primary>
|
||||||
|
<secondary>old versions</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<sect2 id="packages-old-versions-debian" xreflabel="old Debian package versions">
|
||||||
|
<title>Debian/Ubuntu</title>
|
||||||
|
<para>
|
||||||
|
An archive of old packages (<literal>3.3.2</literal> and later) for Debian/Ubuntu-based systems is available here:
|
||||||
|
<ulink url="http://atalia.postgresql.org/morgue/r/repmgr/">http://atalia.postgresql.org/morgue/r/repmgr/</ulink>
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="packages-old-versions-rhel-centos" xreflabel="old RHEL/CentOS package versions">
|
||||||
|
<title>RHEL/CentOS</title>
|
||||||
|
<para>
|
||||||
|
Old RPM packages (<literal>3.2</literal> and later) can be retrieved from the
|
||||||
|
(deprecated) 2ndQuadrant repository at
|
||||||
|
<ulink url="http://packages.2ndquadrant.com/">http://packages.2ndquadrant.com/</ulink>
|
||||||
|
by installing the appropriate repository RPM:
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<ulink url="http://packages.2ndquadrant.com/repmgr/yum-repo-rpms/repmgr-fedora-1.0-1.noarch.rpm">http://packages.2ndquadrant.com/repmgr/yum-repo-rpms/repmgr-fedora-1.0-1.noarch.rpm</ulink>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<ulink url="http://packages.2ndquadrant.com/repmgr/yum-repo-rpms/repmgr-rhel-1.0-1.noarch.rpm">http://packages.2ndquadrant.com/repmgr/yum-repo-rpms/repmgr-rhel-1.0-1.noarch.rpm</ulink>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
</itemizedlist>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
Old versions can be located with e.g.:
|
||||||
|
<programlisting>
|
||||||
|
yum --showduplicates list repmgr96</programlisting>
|
||||||
|
(substitute the appropriate package name; see <xref linkend="packages-centos">) and installed with:
|
||||||
|
<programlisting>
|
||||||
|
yum install {package_name}-{version}</programlisting>
|
||||||
|
where <literal>{package_name}</literal> is the base package name (e.g. <literal>repmgr96</literal>)
|
||||||
|
and <literal>{version}</literal> is the version listed by the
|
||||||
|
<command> yum --showduplicates list ...</command> command, e.g. <literal>4.0.6-1.rhel6</literal>.
|
||||||
|
</para>
|
||||||
|
<para>For example:
|
||||||
|
<programlisting>
|
||||||
|
yum install repmgr96-4.0.6-1.rhel6</programlisting>
|
||||||
|
</para>
|
||||||
|
|
||||||
|
</sect2>
|
||||||
|
</sect1>
|
||||||
|
|
||||||
|
|
||||||
|
<sect1 id="packages-packager-info" xreflabel="Information for packagers">
|
||||||
|
<title>Information for packagers</title>
|
||||||
|
<indexterm>
|
||||||
|
<primary>packages</primary>
|
||||||
|
<secondary>information for packagers</secondary>
|
||||||
|
</indexterm>
|
||||||
|
<para>
|
||||||
|
We recommend patching the following parameters when
|
||||||
|
building the package as built-in default values for user convenience.
|
||||||
|
These values can nevertheless be overridden by the user, if desired.
|
||||||
|
</para>
|
||||||
|
<itemizedlist>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Configuration file location: the default configuration file location
|
||||||
|
can be hard-coded by patching <varname>package_conf_file</varname>
|
||||||
|
in <filename>configfile.c</filename>:
|
||||||
|
<programlisting>
|
||||||
|
/* packagers: if feasible, patch configuration file path into "package_conf_file" */
|
||||||
|
char package_conf_file[MAXPGPATH] = "";</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
See also: <xref linkend="configuration-file">
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
PID file location: the default <application>repmgrd</application> PID file
|
||||||
|
location can be hard-coded by patching <varname>package_pid_file</varname>
|
||||||
|
in <filename>repmgrd.c</filename>:
|
||||||
|
<programlisting>
|
||||||
|
/* packagers: if feasible, patch PID file path into "package_pid_file" */
|
||||||
|
char package_pid_file[MAXPGPATH] = "";</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
See also: <xref linkend="repmgrd-pid-file">
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
</itemizedlist>
|
||||||
|
</sect1>
|
||||||
|
</appendix>
|
||||||
1558
doc/appendix-release-notes.sgml
Normal file
1558
doc/appendix-release-notes.sgml
Normal file
File diff suppressed because it is too large
Load Diff
@@ -1,5 +1,37 @@
|
|||||||
<appendix id="appendix-signatures" xreflabel="Verifying digital signatures">
|
<appendix id="appendix-signatures" xreflabel="Verifying digital signatures">
|
||||||
<title>Verifying digital signatures</title>
|
<title>Verifying digital signatures</title>
|
||||||
|
|
||||||
<para>WIP</para>
|
<sect1 id="repmgr-source-key" xreflabel="repmgr source key">
|
||||||
|
<title>repmgr source code signing key</title>
|
||||||
|
<para>
|
||||||
|
The signing key ID used for <application>repmgr</application> source code bundles is:
|
||||||
|
<ulink url="https://repmgr.org/download/SOURCE-GPG-KEY-repmgr">
|
||||||
|
<literal>0x297F1DCC</literal></ulink>.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
To download the <application>repmgr</application> source key to your computer:
|
||||||
|
<programlisting>
|
||||||
|
curl -s https://repmgr.org/download/SOURCE-GPG-KEY-repmgr | gpg --import
|
||||||
|
gpg --fingerprint 0x297F1DCC
|
||||||
|
</programlisting>
|
||||||
|
then verify that the fingerprint is the expected value:
|
||||||
|
<programlisting>
|
||||||
|
085A BE38 6FD9 72CE 6365 340D 8365 683D 297F 1DCC</programlisting>
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
For checking tarballs, first download and import the <application>repmgr</application>
|
||||||
|
source signing key as shown above. Then download both source tarball and the detached
|
||||||
|
key (e.g. <filename>repmgr-4.0beta1.tar.gz</filename> and
|
||||||
|
<filename>repmgr-4.0beta1.tar.gz.asc</filename>) from
|
||||||
|
<ulink url="https://repmgr.org/download/">https://repmgr.org/download/</ulink>
|
||||||
|
and use <application>gpg</application> to verify the key, e.g.:
|
||||||
|
<programlisting>
|
||||||
|
gpg --verify repmgr-4.0beta1.tar.gz.asc</programlisting>
|
||||||
|
</para>
|
||||||
|
|
||||||
|
</sect1>
|
||||||
|
|
||||||
|
|
||||||
</appendix>
|
</appendix>
|
||||||
|
|||||||
@@ -1,288 +1,8 @@
|
|||||||
BDR failover with repmgrd
|
BDR failover with repmgrd
|
||||||
=========================
|
=========================
|
||||||
|
|
||||||
`repmgr 4` provides support for monitoring BDR nodes and taking action in case
|
This document has been integrated into the main `repmgr` documentation
|
||||||
one of the nodes fails.
|
and is now located here:
|
||||||
|
|
||||||
*NOTE* Due to the nature of BDR, it's only safe to use this solution for
|
> [BDR failover with repmgrd](https://repmgr.org/docs/4.0/repmgrd-bdr.html)
|
||||||
a two-node scenario. Introducing additional nodes will create an inherent
|
|
||||||
risk of node desynchronisation if a node goes down without being cleanly
|
|
||||||
removed from the cluster.
|
|
||||||
|
|
||||||
In contrast to streaming replication, there's no concept of "promoting" a new
|
|
||||||
primary node with BDR. Instead, "failover" involves monitoring both nodes
|
|
||||||
with `repmgrd` and redirecting queries from the failed node to the remaining
|
|
||||||
active node. This can be done by using the event notification script generated by
|
|
||||||
`repmgrd` to dynamically reconfigure a proxy server/connection pooler such
|
|
||||||
as PgBouncer.
|
|
||||||
|
|
||||||
|
|
||||||
Prerequisites
|
|
||||||
-------------
|
|
||||||
|
|
||||||
`repmgr 4` requires PostgreSQL 9.6 with the BDR 2 extension enabled and
|
|
||||||
configured for a two-node BDR network. `repmgr 4` packages
|
|
||||||
must be installed on each node before attempting to configure repmgr.
|
|
||||||
|
|
||||||
*NOTE* `repmgr 4` will refuse to install if it detects more than two
|
|
||||||
BDR nodes.
|
|
||||||
|
|
||||||
Application database connections *must* be passed through a proxy server/
|
|
||||||
connection pooler such as PgBouncer, and it must be possible to dynamically
|
|
||||||
reconfigure that from `repmgrd`. The example demonstrated in this document
|
|
||||||
will use PgBouncer.
|
|
||||||
|
|
||||||
The proxy server / connection poolers must not be installed on the database
|
|
||||||
servers.
|
|
||||||
|
|
||||||
For this example, it's assumed password-less SSH connections are available
|
|
||||||
from the PostgreSQL servers to the servers where PgBouncer runs, and
|
|
||||||
that the user on those servers has permission to alter the PgBouncer
|
|
||||||
configuration files.
|
|
||||||
|
|
||||||
PostgreSQL connections must be possible between each node, and each node
|
|
||||||
must be able to connect to each PgBouncer instance.
|
|
||||||
|
|
||||||
|
|
||||||
Configuration
|
|
||||||
-------------
|
|
||||||
|
|
||||||
Sample configuration for `repmgr.conf`:
|
|
||||||
|
|
||||||
node_id=1
|
|
||||||
node_name='node1'
|
|
||||||
conninfo='host=node1 dbname=bdrtest user=repmgr connect_timeout=2'
|
|
||||||
replication_type='bdr'
|
|
||||||
|
|
||||||
event_notifications=bdr_failover
|
|
||||||
event_notification_command='/path/to/bdr-pgbouncer.sh %n %e %s "%c" "%a" >> /tmp/bdr-failover.log 2>&1'
|
|
||||||
|
|
||||||
# repmgrd options
|
|
||||||
monitor_interval_secs=5
|
|
||||||
reconnect_attempts=6
|
|
||||||
reconnect_interval=5
|
|
||||||
|
|
||||||
Adjust settings as appropriate; copy and adjust for the second node (particularly
|
|
||||||
the values `node_id`, `node_name` and `conninfo`).
|
|
||||||
|
|
||||||
Note that the values provided for the `conninfo` string must be valid for
|
|
||||||
connections from *both* nodes in the cluster. The database must be the BDR
|
|
||||||
database.
|
|
||||||
|
|
||||||
If defined, `event_notifications` will restrict execution of `event_notification_command`
|
|
||||||
to the specified events.
|
|
||||||
|
|
||||||
`event_notification_command` is the script which does the actual "heavy lifting"
|
|
||||||
of reconfiguring the proxy server/ connection pooler. It is fully user-definable;
|
|
||||||
a sample implementation is documented below.
|
|
||||||
|
|
||||||
|
|
||||||
repmgr user permissions
|
|
||||||
-----------------------
|
|
||||||
|
|
||||||
`repmgr` will create an extension in the BDR database containing objects
|
|
||||||
for administering `repmgr` metadata. The user defined in the `conninfo`
|
|
||||||
setting must be able to access all objects. Additionally, superuser permissions
|
|
||||||
are required to install the `repmgr` extension. The easiest way to do this
|
|
||||||
is create the `repmgr` user as a superuser, however if this is not
|
|
||||||
desirable, the `repmgr` user can be created as a normal user and a
|
|
||||||
superuser specified with `--superuser` when registering a BDR node.
|
|
||||||
|
|
||||||
repmgr setup
|
|
||||||
------------
|
|
||||||
|
|
||||||
Register both nodes:
|
|
||||||
|
|
||||||
$ repmgr -f /etc/repmgr.conf bdr register
|
|
||||||
NOTICE: attempting to install extension "repmgr"
|
|
||||||
NOTICE: "repmgr" extension successfully installed
|
|
||||||
NOTICE: node record created for node 'node1' (ID: 1)
|
|
||||||
NOTICE: BDR node 1 registered (conninfo: host=localhost dbname=bdrtest user=repmgr port=5501)
|
|
||||||
|
|
||||||
$ repmgr -f /etc/repmgr.conf bdr register
|
|
||||||
NOTICE: node record created for node 'node2' (ID: 2)
|
|
||||||
NOTICE: BDR node 2 registered (conninfo: host=localhost dbname=bdrtest user=repmgr port=5502)
|
|
||||||
|
|
||||||
The `repmgr` extension will be automatically created when the first
|
|
||||||
node is registered, and will be propagated to the second node.
|
|
||||||
|
|
||||||
*IMPORTANT* ensure the repmgr package is available on both nodes before
|
|
||||||
attempting to register the first node
|
|
||||||
|
|
||||||
|
|
||||||
At this point the meta data for both nodes has been created; executing
|
|
||||||
`repmgr cluster show` (on either node) should produce output like this:
|
|
||||||
|
|
||||||
$ repmgr -f /etc/repmgr.conf cluster show
|
|
||||||
ID | Name | Role | Status | Upstream | Connection string
|
|
||||||
----+-------+------+-----------+----------+--------------------------------------------------------
|
|
||||||
1 | node1 | bdr | * running | | host=node1 dbname=bdrtest user=repmgr connect_timeout=2
|
|
||||||
2 | node2 | bdr | * running | | host=node2 dbname=bdrtest user=repmgr connect_timeout=2
|
|
||||||
|
|
||||||
Additionally it's possible to see a log of significant events; so far
|
|
||||||
this will only record the two node registrations (in reverse chronological order):
|
|
||||||
|
|
||||||
Node ID | Event | OK | Timestamp | Details
|
|
||||||
---------+--------------+----+---------------------+----------------------------------------------
|
|
||||||
2 | bdr_register | t | 2017-07-27 17:51:48 | node record created for node 'node2' (ID: 2)
|
|
||||||
1 | bdr_register | t | 2017-07-27 17:51:00 | node record created for node 'node1' (ID: 1)
|
|
||||||
|
|
||||||
|
|
||||||
Defining the "event_notification_command"
|
|
||||||
-----------------------------------------
|
|
||||||
|
|
||||||
Key to "failover" execution is the `event_notification_command`, which is a
|
|
||||||
user-definable script which should reconfigure the proxy server/
|
|
||||||
connection pooler.
|
|
||||||
|
|
||||||
Each time `repmgr` (or `repmgrd`) records an event, it can optionally
|
|
||||||
execute the script defined in `event_notification_command` to
|
|
||||||
take further action; details of the event will be passed as parameters.
|
|
||||||
Following placeholders are available to the script:
|
|
||||||
|
|
||||||
%n - node ID
|
|
||||||
%e - event type
|
|
||||||
%s - success (1 or 0)
|
|
||||||
%t - timestamp
|
|
||||||
%d - details
|
|
||||||
%c - conninfo string of the next available node
|
|
||||||
%a - name of the next available node
|
|
||||||
|
|
||||||
Note that `%c` and `%a` will only be provided during `bdr_failover`
|
|
||||||
events, which is what is of interest here.
|
|
||||||
|
|
||||||
The provided sample script (`scripts/bdr-pgbouncer.sh`) is configured like
|
|
||||||
this:
|
|
||||||
|
|
||||||
event_notification_command='/path/to/bdr-pgbouncer.sh %n %e %s "%c" "%a"'
|
|
||||||
|
|
||||||
and parses the configures parameters like this:
|
|
||||||
|
|
||||||
NODE_ID=$1
|
|
||||||
EVENT_TYPE=$2
|
|
||||||
SUCCESS=$3
|
|
||||||
NEXT_CONNINFO=$4
|
|
||||||
NEXT_NODE_NAME=$5
|
|
||||||
|
|
||||||
It also contains some hard-coded values about the PgBouncer configuration for
|
|
||||||
both nodes; these will need to be adjusted for your local environment of course
|
|
||||||
(ideally the scripts would be maintained as templates and generated by some
|
|
||||||
kind of provisioning system).
|
|
||||||
|
|
||||||
The script performs following steps:
|
|
||||||
|
|
||||||
- pauses PgBouncer on all nodes
|
|
||||||
- recreates the PgBouncer configuration file on each node using the information
|
|
||||||
provided by `repmgrd` (mainly the `conninfo` string) to configure PgBouncer
|
|
||||||
to point to the remaining node
|
|
||||||
- reloads the PgBouncer configuration
|
|
||||||
- resumes PgBouncer
|
|
||||||
|
|
||||||
From that point, any connections to PgBouncer on the failed BDR node will be redirected
|
|
||||||
to the active node.
|
|
||||||
|
|
||||||
|
|
||||||
repmgrd
|
|
||||||
-------
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
Node monitoring and failover
|
|
||||||
----------------------------
|
|
||||||
|
|
||||||
At the intervals specified by `monitor_interval_secs` in `repmgr.conf`, `repmgrd`
|
|
||||||
will ping each node to check if it's available. If a node isn't available,
|
|
||||||
`repmgrd` will enter failover mode and check `reconnect_attempts` times
|
|
||||||
at intervals of `reconnect_interval` to confirm the node is definitely unreachable.
|
|
||||||
This buffer period is necessary to avoid false positives caused by transient
|
|
||||||
network outages.
|
|
||||||
|
|
||||||
If the node is still unavailable, `repmgrd` will enter failover mode and execute
|
|
||||||
the script defined in `event_notification_command`; an entry will be logged
|
|
||||||
in the `repmgr.events` table and `repmgrd` will (unless otherwise configured)
|
|
||||||
resume monitoring of the node in "degraded" mode until it reappears.
|
|
||||||
|
|
||||||
`repmgrd` logfile output during a failover event will look something like this
|
|
||||||
one one node (usually the node which has failed, here "node2"):
|
|
||||||
|
|
||||||
...
|
|
||||||
[2017-07-27 21:08:39] [INFO] starting continuous BDR node monitoring
|
|
||||||
[2017-07-27 21:08:39] [INFO] monitoring BDR replication status on node "node2" (ID: 2)
|
|
||||||
[2017-07-27 21:08:55] [INFO] monitoring BDR replication status on node "node2" (ID: 2)
|
|
||||||
[2017-07-27 21:09:11] [INFO] monitoring BDR replication status on node "node2" (ID: 2)
|
|
||||||
[2017-07-27 21:09:23] [WARNING] unable to connect to node node2 (ID 2)
|
|
||||||
[2017-07-27 21:09:23] [INFO] checking state of node 2, 0 of 5 attempts
|
|
||||||
[2017-07-27 21:09:23] [INFO] sleeping 1 seconds until next reconnection attempt
|
|
||||||
[2017-07-27 21:09:24] [INFO] checking state of node 2, 1 of 5 attempts
|
|
||||||
[2017-07-27 21:09:24] [INFO] sleeping 1 seconds until next reconnection attempt
|
|
||||||
[2017-07-27 21:09:25] [INFO] checking state of node 2, 2 of 5 attempts
|
|
||||||
[2017-07-27 21:09:25] [INFO] sleeping 1 seconds until next reconnection attempt
|
|
||||||
[2017-07-27 21:09:26] [INFO] checking state of node 2, 3 of 5 attempts
|
|
||||||
[2017-07-27 21:09:26] [INFO] sleeping 1 seconds until next reconnection attempt
|
|
||||||
[2017-07-27 21:09:27] [INFO] checking state of node 2, 4 of 5 attempts
|
|
||||||
[2017-07-27 21:09:27] [INFO] sleeping 1 seconds until next reconnection attempt
|
|
||||||
[2017-07-27 21:09:28] [WARNING] unable to reconnect to node 2 after 5 attempts
|
|
||||||
[2017-07-27 21:09:28] [NOTICE] setting node record for node 2 to inactive
|
|
||||||
[2017-07-27 21:09:28] [INFO] executing notification command for event "bdr_failover"
|
|
||||||
[2017-07-27 21:09:28] [DETAIL] command is:
|
|
||||||
/path/to/bdr-pgbouncer.sh 2 bdr_failover 1 "host=host=node1 dbname=bdrtest user=repmgr connect_timeout=2" "node1"
|
|
||||||
[2017-07-27 21:09:28] [INFO] node 'node2' (ID: 2) detected as failed; next available node is 'node1' (ID: 1)
|
|
||||||
[2017-07-27 21:09:28] [INFO] monitoring BDR replication status on node "node2" (ID: 2)
|
|
||||||
[2017-07-27 21:09:28] [DETAIL] monitoring node "node2" (ID: 2) in degraded mode
|
|
||||||
...
|
|
||||||
|
|
||||||
Output on the other node ("node1") during the same event will look like this:
|
|
||||||
|
|
||||||
[2017-07-27 21:08:35] [INFO] starting continuous BDR node monitoring
|
|
||||||
[2017-07-27 21:08:35] [INFO] monitoring BDR replication status on node "node1" (ID: 1)
|
|
||||||
[2017-07-27 21:08:51] [INFO] monitoring BDR replication status on node "node1" (ID: 1)
|
|
||||||
[2017-07-27 21:09:07] [INFO] monitoring BDR replication status on node "node1" (ID: 1)
|
|
||||||
[2017-07-27 21:09:23] [WARNING] unable to connect to node node2 (ID 2)
|
|
||||||
[2017-07-27 21:09:23] [INFO] checking state of node 2, 0 of 5 attempts
|
|
||||||
[2017-07-27 21:09:23] [INFO] sleeping 1 seconds until next reconnection attempt
|
|
||||||
[2017-07-27 21:09:24] [INFO] checking state of node 2, 1 of 5 attempts
|
|
||||||
[2017-07-27 21:09:24] [INFO] sleeping 1 seconds until next reconnection attempt
|
|
||||||
[2017-07-27 21:09:25] [INFO] checking state of node 2, 2 of 5 attempts
|
|
||||||
[2017-07-27 21:09:25] [INFO] sleeping 1 seconds until next reconnection attempt
|
|
||||||
[2017-07-27 21:09:26] [INFO] checking state of node 2, 3 of 5 attempts
|
|
||||||
[2017-07-27 21:09:26] [INFO] sleeping 1 seconds until next reconnection attempt
|
|
||||||
[2017-07-27 21:09:27] [INFO] checking state of node 2, 4 of 5 attempts
|
|
||||||
[2017-07-27 21:09:27] [INFO] sleeping 1 seconds until next reconnection attempt
|
|
||||||
[2017-07-27 21:09:28] [WARNING] unable to reconnect to node 2 after 5 attempts
|
|
||||||
[2017-07-27 21:09:28] [NOTICE] other node's repmgrd is handling failover
|
|
||||||
[2017-07-27 21:09:28] [INFO] monitoring BDR replication status on node "node1" (ID: 1)
|
|
||||||
[2017-07-27 21:09:28] [DETAIL] monitoring node "node2" (ID: 2) in degraded mode
|
|
||||||
|
|
||||||
This assumes only the PostgreSQL instance on "node2" has failed. In this case the
|
|
||||||
`repmgrd` instance running on "node2" has performed the failover. However if
|
|
||||||
the entire server becomes unavailable, `repmgrd` on "node1" will perform
|
|
||||||
the failover.
|
|
||||||
|
|
||||||
|
|
||||||
Node recovery
|
|
||||||
-------------
|
|
||||||
|
|
||||||
Following failure of a BDR node, if the node subsequently becomes available again,
|
|
||||||
a `bdr_recovery` event will be generated. This could potentially be used to
|
|
||||||
reconfigure PgBouncer automatically to bring the node back into the available pool,
|
|
||||||
however it would be prudent to manually verify the node's status before
|
|
||||||
exposing it to the application.
|
|
||||||
|
|
||||||
If the failed node comes back up and connects correctly, output similar to this
|
|
||||||
will be visible in the `repmgrd` log:
|
|
||||||
|
|
||||||
[2017-07-27 21:25:30] [DETAIL] monitoring node "node2" (ID: 2) in degraded mode
|
|
||||||
[2017-07-27 21:25:46] [INFO] monitoring BDR replication status on node "node2" (ID: 2)
|
|
||||||
[2017-07-27 21:25:46] [DETAIL] monitoring node "node2" (ID: 2) in degraded mode
|
|
||||||
[2017-07-27 21:25:55] [INFO] active replication slot for node "node1" found after 1 seconds
|
|
||||||
[2017-07-27 21:25:55] [NOTICE] node "node2" (ID: 2) has recovered after 986 seconds
|
|
||||||
|
|
||||||
|
|
||||||
Shutdown of both nodes
|
|
||||||
----------------------
|
|
||||||
|
|
||||||
If both PostgreSQL instances are shut down, `repmgrd` will try and handle the
|
|
||||||
situation as gracefully as possible, though with no failover candidates available
|
|
||||||
there's not much it can do. Should this case ever occur, we recommend shutting
|
|
||||||
down `repmgrd` on both nodes and restarting it once the PostgreSQL instances
|
|
||||||
are running properly.
|
|
||||||
|
|||||||
@@ -1,106 +1,7 @@
|
|||||||
|
Changes in repmgr 4
|
||||||
|
===================
|
||||||
|
|
||||||
Standardisation on `primary`
|
This document has been integrated into the main `repmgr` documentation
|
||||||
----------------------------
|
and is now located here:
|
||||||
|
|
||||||
To standardise terminology, `primary` is used to denote the read/write
|
> [Release notes](https://repmgr.org/docs/4.0/release-4.0.html)
|
||||||
node in a streaming replication cluster. `master` is still accepted
|
|
||||||
as a synonym (e.g. `repmgr master register`).
|
|
||||||
|
|
||||||
|
|
||||||
New command line options
|
|
||||||
------------------------
|
|
||||||
|
|
||||||
- `--dry-run`: repmgr will attempt to perform the action as far as possible
|
|
||||||
without making any changes to the database
|
|
||||||
|
|
||||||
- `--upstream-node-id`: use to specify the upstream node the standby will
|
|
||||||
connect later stream from, when cloning a standby. This replaces the configuration
|
|
||||||
file parameter `upstream_node`, as the upstream node is set when the standby
|
|
||||||
is initially cloned, but can change over the lifetime of an installation (due
|
|
||||||
to failovers, switchovers etc.) so it's pointless/confusing keeping the original
|
|
||||||
value around in the config file.
|
|
||||||
|
|
||||||
Changed command line options
|
|
||||||
----------------------------
|
|
||||||
|
|
||||||
### repmgr
|
|
||||||
|
|
||||||
- `--replication-user` has been deprecated; it has been replaced by the
|
|
||||||
configuration file option `replication_user`. The value (which defaults
|
|
||||||
to the user in the `conninfo` string) will be stored in the repmgr metadata
|
|
||||||
for use by standby clone/follow..
|
|
||||||
|
|
||||||
- `--recovery-min-apply-delay` is now a configuration file parameter
|
|
||||||
`recovery_min_apply_delay, to ensure the setting does not get lost when
|
|
||||||
a standby follows a new upstream.
|
|
||||||
|
|
||||||
### repmgrd
|
|
||||||
|
|
||||||
- `--monitoring-history` is deprecated and has been replaced by the
|
|
||||||
configuration file option `monitoring_history`. This enables the
|
|
||||||
setting to be changed without having to modify system service files.
|
|
||||||
|
|
||||||
Changes to repmgr commands
|
|
||||||
--------------------------
|
|
||||||
|
|
||||||
|
|
||||||
### `repmgr cluster show`
|
|
||||||
|
|
||||||
This now displays the role of each node (e.g. `primary`, `standby`)
|
|
||||||
and its status in separate columns.
|
|
||||||
|
|
||||||
The `--csv` option now emits a third column indicating the recovery
|
|
||||||
status of the node.
|
|
||||||
|
|
||||||
|
|
||||||
Configuration file changes
|
|
||||||
--------------------------
|
|
||||||
|
|
||||||
### Required settings
|
|
||||||
|
|
||||||
The following 4 parameters are mandatory in `repmgr.conf`:
|
|
||||||
|
|
||||||
- `node_id`
|
|
||||||
- `node_name`
|
|
||||||
- `conninfo`
|
|
||||||
- `data_directory`
|
|
||||||
|
|
||||||
|
|
||||||
### Renamed settings
|
|
||||||
|
|
||||||
Some settings have been renamed for clarity and consistency:
|
|
||||||
|
|
||||||
- `node`: now `node_id`
|
|
||||||
- `name`: now `node_name`
|
|
||||||
- `master_reponse_timeout`: now `async_query_timeout` to better indicate its
|
|
||||||
purpose
|
|
||||||
|
|
||||||
- The following configuration file parameters have been renamed for consistency
|
|
||||||
with other parameters (and conform to the pattern used by PostgreSQL itself,
|
|
||||||
which uses the prefix `log_` for logging parameters):
|
|
||||||
- `loglevel` has been renamed to `log_level`
|
|
||||||
- `logfile` has been renamed to `log_file`
|
|
||||||
- `logfacility` has been renamed to `log_facility`
|
|
||||||
|
|
||||||
### Removed settings
|
|
||||||
|
|
||||||
- `cluster`: has been removed
|
|
||||||
- `upstream_node`: see note about `--upstream-node-id` above.
|
|
||||||
- `retry_promote_interval_secs`: this is now redundant due to changes in the
|
|
||||||
failover/promotion mechanism; the new equivalent is `primary_notification_timeout`
|
|
||||||
|
|
||||||
|
|
||||||
### Logging changes
|
|
||||||
|
|
||||||
- default value for `log_level` is `INFO` rather than `NOTICE`.
|
|
||||||
- new parameter `log_status_interval`, which causes `repmgrd` to emit a status log
|
|
||||||
line at the specified interval
|
|
||||||
|
|
||||||
|
|
||||||
repmgrd
|
|
||||||
-------
|
|
||||||
|
|
||||||
The `repmgr` shared library has been renamed from `repmgr_funcs` to `repmgr`,
|
|
||||||
meaning `shared_preload_libraries` needs to be updated to the new name:
|
|
||||||
|
|
||||||
shared_preload_libraries = 'repmgr'
|
|
||||||
|
|||||||
@@ -1,13 +1,16 @@
|
|||||||
<chapter id="cloning-standbys" xreflabel="cloning standbys">
|
<chapter id="cloning-standbys" xreflabel="cloning standbys">
|
||||||
<title>Cloning standbys</title>
|
<title>Cloning standbys</title>
|
||||||
<para>
|
|
||||||
</para>
|
|
||||||
|
|
||||||
<sect1 id="cloning-from-barman" xreflabel="Cloning from Barman">
|
<sect1 id="cloning-from-barman" xreflabel="Cloning from Barman">
|
||||||
<indexterm>
|
<indexterm>
|
||||||
<primary>cloning</primary>
|
<primary>cloning</primary>
|
||||||
<secondary>from Barman</secondary>
|
<secondary>from Barman</secondary>
|
||||||
</indexterm>
|
</indexterm>
|
||||||
|
<indexterm>
|
||||||
|
<primary>Barman</primary>
|
||||||
|
<secondary>cloning a standby</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
<title>Cloning a standby from Barman</title>
|
<title>Cloning a standby from Barman</title>
|
||||||
<para>
|
<para>
|
||||||
<xref linkend="repmgr-standby-clone"> can use
|
<xref linkend="repmgr-standby-clone"> can use
|
||||||
@@ -48,7 +51,7 @@
|
|||||||
</itemizedlist>
|
</itemizedlist>
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
<sect2 id="cloning-from-barman-prerequisites" xreflabel="Prerequisites for cloning from Barman">
|
<sect2 id="cloning-from-barman-prerequisites">
|
||||||
<title>Prerequisites for cloning from Barman</title>
|
<title>Prerequisites for cloning from Barman</title>
|
||||||
<para>
|
<para>
|
||||||
In order to enable Barman support for <command>repmgr standby clone</command>, following
|
In order to enable Barman support for <command>repmgr standby clone</command>, following
|
||||||
@@ -70,7 +73,8 @@
|
|||||||
<para>
|
<para>
|
||||||
the <varname>restore_command</varname> setting in <filename>repmgr.conf</filename> is configured to
|
the <varname>restore_command</varname> setting in <filename>repmgr.conf</filename> is configured to
|
||||||
use a copy of the <command>barman-wal-restore</command> script shipped with the
|
use a copy of the <command>barman-wal-restore</command> script shipped with the
|
||||||
<literal>barman-cli</literal> package (see below);
|
<literal>barman-cli</literal> package (see section <xref linkend="cloning-from-barman-restore-command">
|
||||||
|
below).
|
||||||
</para>
|
</para>
|
||||||
</listitem>
|
</listitem>
|
||||||
<listitem>
|
<listitem>
|
||||||
@@ -122,6 +126,11 @@
|
|||||||
</para>
|
</para>
|
||||||
</sect2>
|
</sect2>
|
||||||
<sect2 id="cloning-from-barman-restore-command" xreflabel="Using Barman as a WAL file source">
|
<sect2 id="cloning-from-barman-restore-command" xreflabel="Using Barman as a WAL file source">
|
||||||
|
<indexterm>
|
||||||
|
<primary>Barman</primary>
|
||||||
|
<secondary>fetching archived WAL</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
<title>Using Barman as a WAL file source</title>
|
<title>Using Barman as a WAL file source</title>
|
||||||
<para>
|
<para>
|
||||||
As a fallback in case streaming replication is interrupted, PostgreSQL can optionally
|
As a fallback in case streaming replication is interrupted, PostgreSQL can optionally
|
||||||
@@ -188,11 +197,10 @@
|
|||||||
To enable &repmgr; to use replication slots, set the boolean parameter
|
To enable &repmgr; to use replication slots, set the boolean parameter
|
||||||
<varname>use_replication_slots</varname> in <filename>repmgr.conf</filename>:
|
<varname>use_replication_slots</varname> in <filename>repmgr.conf</filename>:
|
||||||
<programlisting>
|
<programlisting>
|
||||||
use_replication_slots=true
|
use_replication_slots=true</programlisting>
|
||||||
</programlisting>
|
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
Replication slots must be enabled in <filename>postgresql.conf</filename>` by
|
Replication slots must be enabled in <filename>postgresql.conf</filename> by
|
||||||
setting the parameter <varname>max_replication_slots</varname> to at least the
|
setting the parameter <varname>max_replication_slots</varname> to at least the
|
||||||
number of expected standbys (changes to this parameter require a server restart).
|
number of expected standbys (changes to this parameter require a server restart).
|
||||||
</para>
|
</para>
|
||||||
@@ -339,16 +347,50 @@
|
|||||||
|
|
||||||
<sect2 id="cloning-advanced-pg-basebackup-options" xreflabel="pg_basebackup options when cloning a standby">
|
<sect2 id="cloning-advanced-pg-basebackup-options" xreflabel="pg_basebackup options when cloning a standby">
|
||||||
<title>pg_basebackup options when cloning a standby</title>
|
<title>pg_basebackup options when cloning a standby</title>
|
||||||
|
<para>
|
||||||
|
As &repmgr; uses <command>pg_basebackup</command> to clone a standby, it's possible to
|
||||||
|
provide additional parameters for <command>pg_basebackup</command> to customise the
|
||||||
|
cloning process.
|
||||||
|
</para>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
By default, <command>pg_basebackup</command> performs a checkpoint before beginning the backup
|
By default, <command>pg_basebackup</command> performs a checkpoint before beginning the backup
|
||||||
process. However, a normal checkpoint may take some time to complete;
|
process. However, a normal checkpoint may take some time to complete;
|
||||||
a fast checkpoint can be forced with the <literal>-c/--fast-checkpoint</literal> option.
|
a fast checkpoint can be forced with <command><link linkend="repmgr-standby-clone">repmgr standby clone</link></command>'s
|
||||||
However this may impact performance of the server being cloned from
|
<literal>-c/--fast-checkpoint</literal> option.
|
||||||
|
Note that this may impact performance of the server being cloned from (typically the primary)
|
||||||
so should be used with care.
|
so should be used with care.
|
||||||
</para>
|
</para>
|
||||||
|
<tip>
|
||||||
|
<simpara>
|
||||||
|
If <application>Barman</application> is set up for the cluster, it's possible to
|
||||||
|
clone the standby directly from Barman, without any impact on the server the standby
|
||||||
|
is being cloned from. For more details see <xref linkend="cloning-from-barman">.
|
||||||
|
</simpara>
|
||||||
|
</tip>
|
||||||
|
<para>
|
||||||
|
Other options can be passed to <command>pg_basebackup</command> by including them
|
||||||
|
in the <filename>repmgr.conf</filename> setting <varname>pg_basebackup_options</varname>.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
Not that by default, &repmgr; executes <command>pg_basebackup</command> with <option>-X/--wal-method</option>
|
||||||
|
(PostgreSQL 9.6 and earlier: <option>-X/--xlog-method</option>) set to <literal>stream</literal>.
|
||||||
|
From PostgreSQL 9.6, if replication slots are in use, it will also create a replication slot before
|
||||||
|
running the base backup, and execute <command>pg_basebackup</command> with the
|
||||||
|
<option>-S/--slot</option> option set to the name of the previously created replication slot.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
These parameters can set by the user in <varname>pg_basebackup_options</varname>, in which case they
|
||||||
|
will override the &repmgr; default values. However normally there's no reason to do this.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
If using a separate directory to store WAL files, provide the option <literal>--waldir</literal>
|
||||||
|
(<literal>--xlogdir</literal> in PostgreSQL 9.6 and earlier) with the absolute path to the
|
||||||
|
WAL directory. Any WALs generated during the cloning process will be copied here, and
|
||||||
|
a symlink will automatically be created from the main data directory.
|
||||||
|
</para>
|
||||||
<para>
|
<para>
|
||||||
Further options can be passed to the <command>pg_basebackup</command> utility via
|
|
||||||
the setting <varname>pg_basebackup_options</varname> in <filename>repmgr.conf</filename>.
|
|
||||||
See the <ulink url="https://www.postgresql.org/docs/current/static/app-pgbasebackup.html">PostgreSQL pg_basebackup documentation</ulink>
|
See the <ulink url="https://www.postgresql.org/docs/current/static/app-pgbasebackup.html">PostgreSQL pg_basebackup documentation</ulink>
|
||||||
for more details of available options.
|
for more details of available options.
|
||||||
</para>
|
</para>
|
||||||
@@ -356,11 +398,16 @@
|
|||||||
|
|
||||||
<sect2 id="cloning-advanced-managing-passwords" xreflabel="Managing passwords">
|
<sect2 id="cloning-advanced-managing-passwords" xreflabel="Managing passwords">
|
||||||
<title>Managing passwords</title>
|
<title>Managing passwords</title>
|
||||||
|
<indexterm>
|
||||||
|
<primary>cloning</primary>
|
||||||
|
<secondary>using passwords</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
If replication connections to a standby's upstream server are password-protected,
|
If replication connections to a standby's upstream server are password-protected,
|
||||||
the standby must be able to provide the password so it can begin streaming
|
the standby must be able to provide the password so it can begin streaming replication.
|
||||||
replication.
|
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
The recommended way to do this is to store the password in the <literal>postgres</literal> system
|
The recommended way to do this is to store the password in the <literal>postgres</literal> system
|
||||||
user's <filename>~/.pgpass</filename> file. It's also possible to store the password in the
|
user's <filename>~/.pgpass</filename> file. It's also possible to store the password in the
|
||||||
@@ -368,19 +415,38 @@
|
|||||||
security reasons. For more details see the
|
security reasons. For more details see the
|
||||||
<ulink url="https://www.postgresql.org/docs/current/static/libpq-pgpass.html">PostgreSQL password file documentation</ulink>.
|
<ulink url="https://www.postgresql.org/docs/current/static/libpq-pgpass.html">PostgreSQL password file documentation</ulink>.
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
If using a <filename>pgpass</filename> file, an entry for the replication user (by default the
|
||||||
|
user who connects to the <literal>repmgr</literal> database) <emphasis>must</emphasis>
|
||||||
|
be provided, with database name set to <literal>replication</literal>, e.g.:
|
||||||
|
<programlisting>
|
||||||
|
node1:5432:replication:repmgr:12345</programlisting>
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
If, for whatever reason, you wish to include the password in <filename>recovery.conf</filename>,
|
If, for whatever reason, you wish to include the password in <filename>recovery.conf</filename>,
|
||||||
set <varname>use_primary_conninfo_password</varname> to <literal>true</literal> in
|
set <varname>use_primary_conninfo_password</varname> to <literal>true</literal> in
|
||||||
<filename>repmgr.conf</filename>. This will read a password set in <varname>PGPASSWORD</varname>
|
<filename>repmgr.conf</filename>. This will read a password set in <varname>PGPASSWORD</varname>
|
||||||
(but not <filename>~/.pgpass</filename>) and place it into the <literal>primary_conninfo</literal>
|
(but not <filename>~/.pgpass</filename>) and place it into the <varname>primary_conninfo</varname>
|
||||||
string in <filename>recovery.conf</filename>. Note that <varname>PGPASSWORD</varname>
|
string in <filename>recovery.conf</filename>. Note that <varname>PGPASSWORD</varname>
|
||||||
will need to be set during any action which causes <filename>recovery.conf</filename> to be
|
will need to be set during any action which causes <filename>recovery.conf</filename> to be
|
||||||
rewritten, e.g. <xref linkend="repmgr-standby-follow">.
|
rewritten, e.g. <xref linkend="repmgr-standby-follow">.
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
It is of course also possible to include the password value in the <varname>conninfo</varname>
|
It is of course also possible to include the password value in the <varname>conninfo</varname>
|
||||||
string for each node, but this is obviously a security risk and should be
|
string for each node, but this is obviously a security risk and should be avoided.
|
||||||
avoided.
|
</para>
|
||||||
|
<para>
|
||||||
|
From PostgreSQL 9.6, <application>libpq</application> supports the <varname>passfile</varname>
|
||||||
|
parameter in connection strings, which can be used to specify a password file other than
|
||||||
|
the default <filename>~/.pgpass</filename>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
To have &repmgr; write a custom password file in <varname>primary_conninfo</varname>,
|
||||||
|
specify its location in <varname>passfile</varname> in <filename>repmgr.conf</filename>.
|
||||||
</para>
|
</para>
|
||||||
</sect2>
|
</sect2>
|
||||||
|
|
||||||
@@ -392,7 +458,7 @@
|
|||||||
the replication user should be set in <filename>repmgr.conf</filename> via the parameter
|
the replication user should be set in <filename>repmgr.conf</filename> via the parameter
|
||||||
<varname>replication_user</varname>; &repmgr; will use this value when making
|
<varname>replication_user</varname>; &repmgr; will use this value when making
|
||||||
replication connections and generating <filename>recovery.conf</filename>. This
|
replication connections and generating <filename>recovery.conf</filename>. This
|
||||||
value will also be stored in the <literal>repmgr.nodes</literal>
|
value will also be stored in the parameter <literal>repmgr.nodes</literal>
|
||||||
table for each node; it no longer needs to be explicitly specified when
|
table for each node; it no longer needs to be explicitly specified when
|
||||||
cloning a node or executing <xref linkend="repmgr-standby-follow">.
|
cloning a node or executing <xref linkend="repmgr-standby-follow">.
|
||||||
</para>
|
</para>
|
||||||
|
|||||||
107
doc/configuration-file-log-settings.sgml
Normal file
107
doc/configuration-file-log-settings.sgml
Normal file
@@ -0,0 +1,107 @@
|
|||||||
|
<sect1 id="configuration-file-log-settings" xreflabel="log settings">
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgr.conf</primary>
|
||||||
|
<secondary>log settings</secondary>
|
||||||
|
</indexterm>
|
||||||
|
<indexterm>
|
||||||
|
<primary>log settings</primary>
|
||||||
|
<secondary>configuration in repmgr.conf</secondary>
|
||||||
|
</indexterm>
|
||||||
|
<title>Log settings</title>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
By default, &repmgr; and <application>repmgrd</application> write log output to
|
||||||
|
<literal>STDERR</literal>. An alternative log destination can be specified
|
||||||
|
(either a file or <literal>syslog</literal>).
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
The &repmgr; application itself will continue to write log output to <literal>STDERR</literal>
|
||||||
|
even if another log destination is configured, as otherwise any output resulting from a command
|
||||||
|
line operation will "disappear" into the log.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
This behaviour can be overriden with the command line option <option>--log-to-file</option>,
|
||||||
|
which will redirect all logging output to the configured log destination. This is recommended
|
||||||
|
when &repmgr; is executed by another application, particularly <application>repmgrd</application>,
|
||||||
|
to enable log output generated by the &repmgr; application to be stored for later reference.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
<variablelist>
|
||||||
|
|
||||||
|
<varlistentry id="repmgr-conf-log-level" xreflabel="log_level">
|
||||||
|
<term><varname>log_level</varname> (<type>string</type>)
|
||||||
|
<indexterm>
|
||||||
|
<primary><varname>log_level</varname> configuration file parameter</primary>
|
||||||
|
</indexterm>
|
||||||
|
</term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
One of <option>DEBUG</option>, <option>INFO</option>, <option>NOTICE</option>,
|
||||||
|
<option>WARNING</option>, <option>ERROR</option>, <option>ALERT</option>, <option>CRIT</option>
|
||||||
|
or <option>EMERG</option>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Default is <option>INFO</option>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Note that <option>DEBUG</option> will produce a substantial amount of log output
|
||||||
|
and should not be enabled in normal use.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry id="repmgr-conf-log-facility" xreflabel="log_facility">
|
||||||
|
<term><varname>log_facility</varname> (<type>string</type>)
|
||||||
|
<indexterm>
|
||||||
|
<primary><varname>log_facility</varname> configuration file parameter</primary>
|
||||||
|
</indexterm>
|
||||||
|
</term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Logging facility: possible values are <option>STDERR</option> (default), or for
|
||||||
|
syslog integration, one of <option>LOCAL0</option>, <option>LOCAL1</option>, <option>...</option>,
|
||||||
|
<option>LOCAL7</option>, <option>USER</option>.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry id="repmgr-conf-log-file" xreflabel="log_file">
|
||||||
|
<term><varname>log_file</varname> (<type>string</type>)
|
||||||
|
<indexterm>
|
||||||
|
<primary><varname>log_file</varname> configuration file parameter</primary>
|
||||||
|
</indexterm>
|
||||||
|
</term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
If <xref linkend="repmgr-conf-log-facility"> is set to <option>STDERR</option>, log output
|
||||||
|
can be redirected to the specified file.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
See <xref linkend="repmgrd-log-rotation"> for information on configuring log rotation.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry id="repmgr-conf-log-status-interval" xreflabel="log_status_interval">
|
||||||
|
<term><varname>log_status_interval</varname> (<type>integer</type>)
|
||||||
|
<indexterm>
|
||||||
|
<primary><varname>log_status_interval</varname> configuration file parameter</primary>
|
||||||
|
</indexterm>
|
||||||
|
</term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
This setting causes <application>repmgrd</application> to emit a status log
|
||||||
|
line at the specified interval (in seconds, default <literal>300</literal>)
|
||||||
|
describing <application>repmgrd</application>'s current state, e.g.:
|
||||||
|
</para>
|
||||||
|
<programlisting>
|
||||||
|
[2018-07-12 00:47:32] [INFO] monitoring connection to upstream node "node1" (node ID: 1)</programlisting>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
</variablelist>
|
||||||
|
|
||||||
|
</sect1>
|
||||||
@@ -1,5 +1,10 @@
|
|||||||
<sect1 id="configuration-file-settings" xreflabel="configuration file settings">
|
<sect1 id="configuration-file-settings" xreflabel="required configuration file settings">
|
||||||
<title>Configuration file settings</title>
|
<indexterm>
|
||||||
|
<primary>repmgr.conf</primary>
|
||||||
|
<secondary>required settings</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<title>Required configuration file settings</title>
|
||||||
<para>
|
<para>
|
||||||
Each <filename>repmgr.conf</filename> file must contain the following parameters:
|
Each <filename>repmgr.conf</filename> file must contain the following parameters:
|
||||||
</para>
|
</para>
|
||||||
@@ -87,7 +92,10 @@
|
|||||||
|
|
||||||
<para>
|
<para>
|
||||||
For a full list of annotated configuration items, see the file
|
For a full list of annotated configuration items, see the file
|
||||||
<ulink url="https://raw.githubusercontent.com/2ndQuadrant/repmgr/master/repmgr.conf.sample">repmgr.conf.sample</>.
|
<ulink url="https://raw.githubusercontent.com/2ndQuadrant/repmgr/master/repmgr.conf.sample">repmgr.conf.sample</ulink>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
For <application>repmgrd</application>-specific settings, see <xref linkend="repmgrd-configuration">.
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
<note>
|
<note>
|
||||||
130
doc/configuration-file-service-commands.sgml
Normal file
130
doc/configuration-file-service-commands.sgml
Normal file
@@ -0,0 +1,130 @@
|
|||||||
|
<sect1 id="configuration-file-service-commands" xreflabel="service command settings">
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgr.conf</primary>
|
||||||
|
<secondary>service command settings</secondary>
|
||||||
|
</indexterm>
|
||||||
|
<indexterm>
|
||||||
|
<primary>service command settings</primary>
|
||||||
|
<secondary>configuration in repmgr.conf</secondary>
|
||||||
|
</indexterm>
|
||||||
|
<title>Service command settings</title>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
In some circumstances, &repmgr; (and <application>repmgrd</application>) need to
|
||||||
|
be able to stop, start or restart PostgreSQL. &repmgr; commands which need to do this
|
||||||
|
include <link linkend="repmgr-standby-follow"><command>repmgr standby follow</command></link>,
|
||||||
|
<link linkend="repmgr-standby-switchover"><command>repmgr standby switchover</command></link> and
|
||||||
|
<link linkend="repmgr-node-rejoin"><command>repmgr node rejoin</command></link>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
By default, &repmgr; will use PostgreSQL's <command>pg_ctl</command> utility to control the PostgreSQL
|
||||||
|
server. However this can lead to various problems, particularly when PostgreSQL has been
|
||||||
|
installed from packages, and especially so if <application>systemd</application> is in use.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
If using <application>systemd</application>, ensure you have <varname>RemoveIPC</varname> set to <literal>off</literal>.
|
||||||
|
See the <ulink url="https://wiki.postgresql.org/wiki/Systemd">systemd</ulink>
|
||||||
|
entry in the <ulink url="https://wiki.postgresql.org/wiki/Main_Page">PostgreSQL wiki</ulink> for details.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
|
||||||
|
<para>
|
||||||
|
With this in mind, we recommend to <emphasis>always</emphasis> configure &repmgr; to use the
|
||||||
|
available system service commands.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
To do this, specify the appropriate command for each action
|
||||||
|
in <filename>repmgr.conf</filename> using the following configuration
|
||||||
|
parameters:
|
||||||
|
<programlisting>
|
||||||
|
service_start_command
|
||||||
|
service_stop_command
|
||||||
|
service_restart_command
|
||||||
|
service_reload_command</programlisting>
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
&repmgr; will not apply <option>pg_bindir</option> when executing any of these commands;
|
||||||
|
these can be user-defined scripts so must always be specified with the full path.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
It's also possible to specify a <varname>service_promote_command</varname>.
|
||||||
|
This is intended for systems which provide a package-level promote command,
|
||||||
|
such as Debian's <application>pg_ctlcluster</application>, to promote the
|
||||||
|
PostgreSQL from standby to primary.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
If your packaging system does not provide such a command, it can be left empty,
|
||||||
|
and &repmgr; will generate the appropriate `pg_ctl ... promote` command.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Do not confuse this with <varname>promote_command</varname>, which is used
|
||||||
|
by <application>repmgrd</application> to execute <xref linkend="repmgr-standby-promote">.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
To confirm which command &repmgr; will execute for each action, use
|
||||||
|
<command>repmgr node service --list --action=...</command>, e.g.:
|
||||||
|
<programlisting>
|
||||||
|
repmgr -f /etc/repmgr.conf node service --list --action=stop
|
||||||
|
repmgr -f /etc/repmgr.conf node service --list --action=start
|
||||||
|
repmgr -f /etc/repmgr.conf node service --list --action=restart
|
||||||
|
repmgr -f /etc/repmgr.conf node service --list --action=reload</programlisting>
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
These commands will be executed by the system user which &repmgr; runs as (usually <literal>postgres</literal>)
|
||||||
|
and will probably require passwordless sudo access to be able to execute the command.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
For example, using <application>systemd</application> on CentOS 7, the service commands can be
|
||||||
|
set as follows:
|
||||||
|
<programlisting>
|
||||||
|
service_start_command = 'sudo systemctl start postgresql-9.6'
|
||||||
|
service_stop_command = 'sudo systemctl stop postgresql-9.6'
|
||||||
|
service_restart_command = 'sudo systemctl restart postgresql-9.6'
|
||||||
|
service_reload_command = 'sudo systemctl reload postgresql-9.6'</programlisting>
|
||||||
|
and <filename>/etc/sudoers</filename> should be set as follows:
|
||||||
|
<programlisting>
|
||||||
|
Defaults:postgres !requiretty
|
||||||
|
postgres ALL = NOPASSWD: /usr/bin/systemctl stop postgresql-9.6, \
|
||||||
|
/usr/bin/systemctl start postgresql-9.6, \
|
||||||
|
/usr/bin/systemctl restart postgresql-9.6, \
|
||||||
|
/usr/bin/systemctl reload postgresql-9.6</programlisting>
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<important>
|
||||||
|
<indexterm>
|
||||||
|
<primary>pg_ctlcluster</primary>
|
||||||
|
<secondary>service command settings</secondary>
|
||||||
|
</indexterm>
|
||||||
|
<para>
|
||||||
|
Debian/Ubuntu users: instead of calling <command>sudo systemctl</command> directly, use
|
||||||
|
<command>sudo pg_ctlcluster</command>, e.g.:
|
||||||
|
<programlisting>
|
||||||
|
service_start_command = 'sudo pg_ctlcluster 9.6 main start'
|
||||||
|
service_stop_command = 'sudo pg_ctlcluster 9.6 main stop'
|
||||||
|
service_restart_command = 'sudo pg_ctlcluster 9.6 main restart'
|
||||||
|
service_reload_command = 'sudo pg_ctlcluster 9.6 main reload'</programlisting>
|
||||||
|
and set <filename>/etc/sudoers</filename> accordingly.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
While <command>pg_ctlcluster</command> will work when executed as user <literal>postgres</literal>,
|
||||||
|
it's strongly recommended to use <command>sudo pg_ctlcluster</command> on <application>systemd</application>
|
||||||
|
systems, to ensure <application>systemd</application> has a correct picture of
|
||||||
|
the PostgreSQL application state.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
</important>
|
||||||
|
|
||||||
|
</sect1>
|
||||||
@@ -1,4 +1,14 @@
|
|||||||
<sect1 id="configuration-file" xreflabel="configuration file location">
|
<sect1 id="configuration-file" xreflabel="configuration file location">
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgr.conf</primary>
|
||||||
|
<secondary>location</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<indexterm>
|
||||||
|
<primary>configuration</primary>
|
||||||
|
<secondary>repmgr.conf location</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
<title>Configuration file location</title>
|
<title>Configuration file location</title>
|
||||||
<para>
|
<para>
|
||||||
<application>repmgr</application> and <application>repmgrd</application>
|
<application>repmgr</application> and <application>repmgrd</application>
|
||||||
@@ -7,7 +17,7 @@
|
|||||||
<filename>repmgr.conf</filename> must contain a number of required parameters, including
|
<filename>repmgr.conf</filename> must contain a number of required parameters, including
|
||||||
the database connection string for the local node and the location
|
the database connection string for the local node and the location
|
||||||
of its data directory; other values will be inferred from defaults if
|
of its data directory; other values will be inferred from defaults if
|
||||||
not explicitly supplied. See section `configuration file parameters`
|
not explicitly supplied. See section <xref linkend="configuration-file-settings">
|
||||||
for more details.
|
for more details.
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
@@ -15,7 +25,7 @@
|
|||||||
The configuration file will be searched for in the following locations:
|
The configuration file will be searched for in the following locations:
|
||||||
<itemizedlist spacing="compact" mark="bullet">
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
<listitem>
|
<listitem>
|
||||||
<para>a configuration file specified by the `-f/--config-file` command line option</para>
|
<para>a configuration file specified by the <literal>-f/--config-file</literal> command line option</para>
|
||||||
</listitem>
|
</listitem>
|
||||||
<listitem>
|
<listitem>
|
||||||
<para>
|
<para>
|
||||||
@@ -37,10 +47,23 @@
|
|||||||
</para>
|
</para>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
Note that if a file is explicitly specified with <application>-f/--config-file</application>,
|
Note that if a file is explicitly specified with <literal>-f/--config-file</literal>,
|
||||||
an error will be raised if it is not found or not readable and no attempt will be made to
|
an error will be raised if it is not found or not readable, and no attempt will be made to
|
||||||
check default locations; this is to prevent <application>repmgr</application> unexpectedly
|
check default locations; this is to prevent <application>repmgr</application> unexpectedly
|
||||||
reading the wrong file.
|
reading the wrong configuraton file.
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
If providing the configuration file location with <literal>-f/--config-file</literal>,
|
||||||
|
avoid using a relative path, particularly when executing <xref linkend="repmgr-primary-register">
|
||||||
|
and <xref linkend="repmgr-standby-register">, as &repmgr; stores the configuration file location
|
||||||
|
in the repmgr metadata for use when &repmgr; is executed remotely (e.g. during
|
||||||
|
<xref linkend="repmgr-standby-switchover">). &repmgr; will attempt to convert the
|
||||||
|
a relative path into an absolute one, but this may not be the same as the path you
|
||||||
|
would explicitly provide (e.g. <filename>./repmgr.conf</filename> might be converted
|
||||||
|
to <filename>/path/to/./repmgr.conf</filename>, whereas you'd normally write
|
||||||
|
<filename>/path/to/repmgr.conf</filename>).
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
</sect1>
|
</sect1>
|
||||||
|
|||||||
@@ -1,7 +1,26 @@
|
|||||||
<chapter id="configuration" xreflabel="Configuration">
|
<chapter id="configuration" xreflabel="Configuration">
|
||||||
<title>repmgr configuration</title>
|
<title>repmgr configuration</title>
|
||||||
|
|
||||||
&configuration-file;
|
&configuration-file;
|
||||||
&configuration-file-settings;
|
&configuration-file-required-settings;
|
||||||
|
&configuration-file-log-settings;
|
||||||
|
&configuration-file-service-commands;
|
||||||
|
|
||||||
|
<sect1 id="configuration-permissions" xreflabel="Database user permissions">
|
||||||
|
<indexterm>
|
||||||
|
<primary>configuration</primary>
|
||||||
|
<secondary>database user permissions</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<title>repmgr database user permissions</title>
|
||||||
|
<para>
|
||||||
|
&repmgr; will create an extension database containing objects
|
||||||
|
for administering &repmgr; metadata. The user defined in the <varname>conninfo</varname>
|
||||||
|
setting must be able to access all objects. Additionally, superuser permissions
|
||||||
|
are required to install the &repmgr; extension. The easiest way to do this
|
||||||
|
is create the &repmgr; user as a superuser, however if this is not
|
||||||
|
desirable, the &repmgr; user can be created as a normal user and a
|
||||||
|
superuser specified with <literal>--superuser</literal> when registering a &repmgr; node.
|
||||||
|
</para>
|
||||||
|
</sect1>
|
||||||
</chapter>
|
</chapter>
|
||||||
|
|||||||
93
doc/configuring-witness-server.sgml
Normal file
93
doc/configuring-witness-server.sgml
Normal file
@@ -0,0 +1,93 @@
|
|||||||
|
<chapter id="using-witness-server">
|
||||||
|
<indexterm>
|
||||||
|
<primary>witness server</primary>
|
||||||
|
<seealso>Using a witness server with repmgrd</seealso>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
|
||||||
|
<title>Using a witness server</title>
|
||||||
|
<para>
|
||||||
|
A <xref linkend="witness-server"> is a normal PostgreSQL instance which
|
||||||
|
is not part of the streaming replication cluster; its purpose is, if a
|
||||||
|
failover situation occurs, to provide proof that the primary server
|
||||||
|
itself is unavailable.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
A typical use case for a witness server is a two-node streaming replication
|
||||||
|
setup, where the primary and standby are in different locations (data centres).
|
||||||
|
By creating a witness server in the same location (data centre) as the primary,
|
||||||
|
if the primary becomes unavailable it's possible for the standby to decide whether
|
||||||
|
it can promote itself without risking a "split brain" scenario: if it can't see either the
|
||||||
|
witness or the primary server, it's likely there's a network-level interruption
|
||||||
|
and it should not promote itself. If it can seen the witness but not the primary,
|
||||||
|
this proves there is no network interruption and the primary itself is unavailable,
|
||||||
|
and it can therefore promote itself (and ideally take action to fence the
|
||||||
|
former primary).
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
<emphasis>Never</emphasis> install a witness server on the same physical host
|
||||||
|
as another node in the replication cluster managed by &repmgr; - it's essential
|
||||||
|
the witness is not affected in any way by failure of another node.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
<para>
|
||||||
|
For more complex replication scenarios,e.g. with multiple datacentres, it may
|
||||||
|
be preferable to use location-based failover, which ensures that only nodes
|
||||||
|
in the same location as the primary will ever be promotion candidates;
|
||||||
|
see <xref linkend="repmgrd-network-split"> for more details.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<simpara>
|
||||||
|
A witness server will only be useful if <application>repmgrd</application>
|
||||||
|
is in use.
|
||||||
|
</simpara>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
<sect1 id="creating-witness-server">
|
||||||
|
<title>Creating a witness server</title>
|
||||||
|
<para>
|
||||||
|
To create a witness server, set up a normal PostgreSQL instance on a server
|
||||||
|
in the same physical location as the cluster's primary server.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
This instance should *not* be on the same physical host as the primary server,
|
||||||
|
as otherwise if the primary server fails due to hardware issues, the witness
|
||||||
|
server will be lost too.
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<simpara>
|
||||||
|
&repmgr; 3.3 and earlier provided a <command>repmgr create witness</command>
|
||||||
|
command, which would automatically create a PostgreSQL instance. However
|
||||||
|
this often resulted in an unsatisfactory, hard-to-customise instance.
|
||||||
|
</simpara>
|
||||||
|
</note>
|
||||||
|
<para>
|
||||||
|
The witness server should be configured in the same way as a normal
|
||||||
|
&repmgr; node; see section <xref linkend="configuration">.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Register the witness server with <xref linkend="repmgr-witness-register">.
|
||||||
|
This will create the &repmgr; extension on the witness server, and make
|
||||||
|
a copy of the &repmgr; metadata.
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<simpara>
|
||||||
|
As the witness server is not part of the replication cluster, further
|
||||||
|
changes to the &repmgr; metadata will be synchronised by
|
||||||
|
<application>repmgrd</application>.
|
||||||
|
</simpara>
|
||||||
|
</note>
|
||||||
|
<para>
|
||||||
|
Once the witness server has been configured, <application>repmgrd</application>
|
||||||
|
should be started; for more details see <xref linkend="repmgrd-witness-server">.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
To unregister a witness server, use <xref linkend="repmgr-witness-unregister">.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
</sect1>
|
||||||
|
</chapter>
|
||||||
@@ -1,12 +1,17 @@
|
|||||||
<chapter id="event-notifications" xreflabel="event notifications">
|
<chapter id="event-notifications" xreflabel="event notifications">
|
||||||
|
|
||||||
|
<indexterm>
|
||||||
|
<primary>event notifications</primary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
<title>Event Notifications</title>
|
<title>Event Notifications</title>
|
||||||
<para>
|
<para>
|
||||||
Each time `repmgr` or `repmgrd` perform a significant event, a record
|
Each time &repmgr; or <application>repmgrd</application> perform a significant event, a record
|
||||||
of that event is written into the `repmgr.events` table together with
|
of that event is written into the <literal>repmgr.events</literal> table together with
|
||||||
a timestamp, an indication of failure or success, and further details
|
a timestamp, an indication of failure or success, and further details
|
||||||
if appropriate. This is useful for gaining an overview of events
|
if appropriate. This is useful for gaining an overview of events
|
||||||
affecting the replication cluster. However note that this table has
|
affecting the replication cluster. However note that this table has
|
||||||
advisory character and should be used in combination with the `repmgr`
|
advisory character and should be used in combination with the &repmgr;
|
||||||
and PostgreSQL logs to obtain details of any events.
|
and PostgreSQL logs to obtain details of any events.
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
@@ -28,11 +33,11 @@
|
|||||||
<para>
|
<para>
|
||||||
Additionally, event notifications can be passed to a user-defined program
|
Additionally, event notifications can be passed to a user-defined program
|
||||||
or script which can take further action, e.g. send email notifications.
|
or script which can take further action, e.g. send email notifications.
|
||||||
This is done by setting the `event_notification_command` parameter in
|
This is done by setting the <literal>event_notification_command</literal> parameter in
|
||||||
`repmgr.conf`.
|
<filename>repmgr.conf</filename>.
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
This parameter accepts the following format placeholders:
|
The following format placeholders are provided for all event notifications:
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
<variablelist>
|
<variablelist>
|
||||||
@@ -55,10 +60,10 @@
|
|||||||
</varlistentry>
|
</varlistentry>
|
||||||
|
|
||||||
<varlistentry>
|
<varlistentry>
|
||||||
<term><option>%t</option></term>
|
<term><option>%s</option></term>
|
||||||
<listitem>
|
<listitem>
|
||||||
<para>
|
<para>
|
||||||
success (1 or 0)
|
success (1) or failure (0)
|
||||||
</para>
|
</para>
|
||||||
</listitem>
|
</listitem>
|
||||||
</varlistentry>
|
</varlistentry>
|
||||||
@@ -80,6 +85,7 @@
|
|||||||
</listitem>
|
</listitem>
|
||||||
</varlistentry>
|
</varlistentry>
|
||||||
</variablelist>
|
</variablelist>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
The values provided for <literal>%t</literal> and <literal>%d</literal>
|
The values provided for <literal>%t</literal> and <literal>%d</literal>
|
||||||
will probably contain spaces, so should be quoted in the provided command
|
will probably contain spaces, so should be quoted in the provided command
|
||||||
@@ -88,69 +94,173 @@
|
|||||||
event_notification_command='/path/to/some/script %n %e %s "%t" "%d"'
|
event_notification_command='/path/to/some/script %n %e %s "%t" "%d"'
|
||||||
</programlisting>
|
</programlisting>
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
Additionally the following format placeholders are available for the event
|
The following parameters are provided for a subset of event notifications:
|
||||||
type <varname>bdr_failover</varname> and optionally <varname>bdr_recovery</varname>:
|
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
<variablelist>
|
<variablelist>
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>%p</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
node ID of the current primary (<xref linkend="repmgr-standby-register"> and <xref linkend="repmgr-standby-follow">)
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
node ID of the demoted primary (<xref linkend="repmgr-standby-switchover"> only)
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
<varlistentry>
|
<varlistentry>
|
||||||
<term><option>%c</option></term>
|
<term><option>%c</option></term>
|
||||||
<listitem>
|
<listitem>
|
||||||
<para>
|
<para>
|
||||||
conninfo string of the next available node
|
<literal>conninfo</literal> string of the primary node
|
||||||
|
(<xref linkend="repmgr-standby-register"> and <xref linkend="repmgr-standby-follow">)
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
<literal>conninfo</literal> string of the next available node
|
||||||
|
(<varname>bdr_failover</varname> and <varname>bdr_recovery</varname>)
|
||||||
</para>
|
</para>
|
||||||
</listitem>
|
</listitem>
|
||||||
</varlistentry>
|
</varlistentry>
|
||||||
|
|
||||||
<varlistentry>
|
<varlistentry>
|
||||||
<term><option>%a</option></term>
|
<term><option>%a</option></term>
|
||||||
<listitem>
|
<listitem>
|
||||||
<para>
|
<para>
|
||||||
name of the next available node
|
name of the current primary node (<xref linkend="repmgr-standby-register"> and <xref linkend="repmgr-standby-follow">)
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
name of the next available node (<varname>bdr_failover</varname> and <varname>bdr_recovery</varname>)
|
||||||
</para>
|
</para>
|
||||||
</listitem>
|
</listitem>
|
||||||
</varlistentry>
|
</varlistentry>
|
||||||
|
|
||||||
</variablelist>
|
</variablelist>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
These should always be quoted.
|
The values provided for <literal>%c</literal> and <literal>%a</literal>
|
||||||
|
will probably contain spaces, so should always be quoted.
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
By default, all notification types will be passed to the designated script;
|
By default, all notification types will be passed to the designated script;
|
||||||
the notification types can be filtered to explicitly named ones:
|
the notification types can be filtered to explicitly named ones using the
|
||||||
|
<varname>event_notifications</varname> parameter.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
Events generated by the &repmgr; command:
|
||||||
|
|
||||||
<itemizedlist spacing="compact" mark="bullet">
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
|
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara><literal>primary_register</literal></simpara>
|
<simpara><literal><link linkend="repmgr-primary-register-events">cluster_created</link></literal></simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara><literal>standby_register</literal></simpara>
|
<simpara><literal><link linkend="repmgr-primary-register-events">primary_register</link></literal></simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara><literal>standby_unregister</literal></simpara>
|
<simpara><literal><link linkend="repmgr-primary-unregister-events">primary_unregister</link></literal></simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal><link linkend="repmgr-standby-clone-events">standby_clone</link></literal></simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara><literal>standby_clone</literal></simpara>
|
<simpara><literal><link linkend="repmgr-standby-register-events">standby_register</link></literal></simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara><literal>standby_promote</literal></simpara>
|
<simpara><literal><link linkend="repmgr-standby-register-events">standby_register_sync</link></literal></simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara><literal>standby_follow</literal></simpara>
|
<simpara><literal><link linkend="repmgr-standby-unregister-events">standby_unregister</link></literal></simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal><link linkend="repmgr-standby-promote-events">standby_promote</link></literal></simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara><literal>standby_disconnect_manual</literal></simpara>
|
<simpara><literal><link linkend="repmgr-standby-follow-events">standby_follow</link></literal></simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal><link linkend="repmgr-standby-switchover-events">standby_switchover</link></literal></simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal><link linkend="repmgr-witness-register-events">witness_register</link></literal></simpara>
|
||||||
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal><link linkend="repmgr-witness-unregister-events">witness_unregister</link></literal></simpara>
|
||||||
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal><link linkend="repmgr-node-rejoin-events">node_rejoin</link></literal></simpara>
|
||||||
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal><link linkend="repmgr-cluster-cleanup-events">cluster_cleanup</link></literal></simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
</itemizedlist>
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
Events generated by <application>repmgrd</application> (streaming replication mode):
|
||||||
|
|
||||||
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara><literal>repmgrd_start</literal></simpara>
|
<simpara><literal>repmgrd_start</literal></simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara><literal>repmgrd_shutdown</literal></simpara>
|
<simpara><literal>repmgrd_shutdown</literal></simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal>repmgrd_reload</literal></simpara>
|
||||||
|
</listitem>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara><literal>repmgrd_failover_promote</literal></simpara>
|
<simpara><literal>repmgrd_failover_promote</literal></simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara><literal>repmgrd_failover_follow</literal></simpara>
|
<simpara><literal>repmgrd_failover_follow</literal></simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal>repmgrd_failover_aborted</literal></simpara>
|
||||||
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal>repmgrd_standby_reconnect</literal></simpara>
|
||||||
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal>repmgrd_promote_error</literal></simpara>
|
||||||
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal>repmgrd_local_disconnect</literal></simpara>
|
||||||
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal>repmgrd_local_reconnect</literal></simpara>
|
||||||
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal>repmgrd_upstream_disconnect</literal></simpara>
|
||||||
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal>repmgrd_upstream_reconnect</literal></simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal>standby_disconnect_manual</literal></simpara>
|
||||||
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal>standby_failure</literal></simpara>
|
||||||
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal>standby_recovery</literal></simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
</itemizedlist>
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
Events generated by <application>repmgrd</application> (BDR mode):
|
||||||
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara><literal>bdr_failover</literal></simpara>
|
<simpara><literal>bdr_failover</literal></simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
@@ -169,6 +279,7 @@
|
|||||||
|
|
||||||
</itemizedlist>
|
</itemizedlist>
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
Note that under some circumstances (e.g. when no replication cluster primary
|
Note that under some circumstances (e.g. when no replication cluster primary
|
||||||
could be located), it will not be possible to write an entry into the
|
could be located), it will not be possible to write an entry into the
|
||||||
|
|||||||
@@ -38,11 +38,15 @@
|
|||||||
<!ENTITY quickstart SYSTEM "quickstart.sgml">
|
<!ENTITY quickstart SYSTEM "quickstart.sgml">
|
||||||
<!ENTITY configuration SYSTEM "configuration.sgml">
|
<!ENTITY configuration SYSTEM "configuration.sgml">
|
||||||
<!ENTITY configuration-file SYSTEM "configuration-file.sgml">
|
<!ENTITY configuration-file SYSTEM "configuration-file.sgml">
|
||||||
<!ENTITY configuration-file-settings SYSTEM "configuration-file-settings.sgml">
|
<!ENTITY configuration-file-required-settings SYSTEM "configuration-file-required-settings.sgml">
|
||||||
|
<!ENTITY configuration-file-log-settings SYSTEM "configuration-file-log-settings.sgml">
|
||||||
|
<!ENTITY configuration-file-service-commands SYSTEM "configuration-file-service-commands.sgml">
|
||||||
<!ENTITY cloning-standbys SYSTEM "cloning-standbys.sgml">
|
<!ENTITY cloning-standbys SYSTEM "cloning-standbys.sgml">
|
||||||
<!ENTITY promoting-standby SYSTEM "promoting-standby.sgml">
|
<!ENTITY promoting-standby SYSTEM "promoting-standby.sgml">
|
||||||
<!ENTITY follow-new-primary SYSTEM "follow-new-primary.sgml">
|
<!ENTITY follow-new-primary SYSTEM "follow-new-primary.sgml">
|
||||||
<!ENTITY switchover SYSTEM "switchover.sgml">
|
<!ENTITY switchover SYSTEM "switchover.sgml">
|
||||||
|
<!ENTITY configuring-witness-server SYSTEM "configuring-witness-server.sgml">
|
||||||
|
|
||||||
<!ENTITY event-notifications SYSTEM "event-notifications.sgml">
|
<!ENTITY event-notifications SYSTEM "event-notifications.sgml">
|
||||||
<!ENTITY upgrading-repmgr SYSTEM "upgrading-repmgr.sgml">
|
<!ENTITY upgrading-repmgr SYSTEM "upgrading-repmgr.sgml">
|
||||||
|
|
||||||
@@ -53,6 +57,9 @@
|
|||||||
<!ENTITY repmgrd-degraded-monitoring SYSTEM "repmgrd-degraded-monitoring.sgml">
|
<!ENTITY repmgrd-degraded-monitoring SYSTEM "repmgrd-degraded-monitoring.sgml">
|
||||||
<!ENTITY repmgrd-cascading-replication SYSTEM "repmgrd-cascading-replication.sgml">
|
<!ENTITY repmgrd-cascading-replication SYSTEM "repmgrd-cascading-replication.sgml">
|
||||||
<!ENTITY repmgrd-network-split SYSTEM "repmgrd-network-split.sgml">
|
<!ENTITY repmgrd-network-split SYSTEM "repmgrd-network-split.sgml">
|
||||||
|
<!ENTITY repmgrd-witness-server SYSTEM "repmgrd-witness-server.sgml">
|
||||||
|
<!ENTITY repmgrd-pausing SYSTEM "repmgrd-pausing.sgml">
|
||||||
|
<!ENTITY repmgrd-bdr SYSTEM "repmgrd-bdr.sgml">
|
||||||
|
|
||||||
<!ENTITY repmgr-primary-register SYSTEM "repmgr-primary-register.sgml">
|
<!ENTITY repmgr-primary-register SYSTEM "repmgr-primary-register.sgml">
|
||||||
<!ENTITY repmgr-primary-unregister SYSTEM "repmgr-primary-unregister.sgml">
|
<!ENTITY repmgr-primary-unregister SYSTEM "repmgr-primary-unregister.sgml">
|
||||||
@@ -62,6 +69,8 @@
|
|||||||
<!ENTITY repmgr-standby-promote SYSTEM "repmgr-standby-promote.sgml">
|
<!ENTITY repmgr-standby-promote SYSTEM "repmgr-standby-promote.sgml">
|
||||||
<!ENTITY repmgr-standby-follow SYSTEM "repmgr-standby-follow.sgml">
|
<!ENTITY repmgr-standby-follow SYSTEM "repmgr-standby-follow.sgml">
|
||||||
<!ENTITY repmgr-standby-switchover SYSTEM "repmgr-standby-switchover.sgml">
|
<!ENTITY repmgr-standby-switchover SYSTEM "repmgr-standby-switchover.sgml">
|
||||||
|
<!ENTITY repmgr-witness-register SYSTEM "repmgr-witness-register.sgml">
|
||||||
|
<!ENTITY repmgr-witness-unregister SYSTEM "repmgr-witness-unregister.sgml">
|
||||||
<!ENTITY repmgr-node-status SYSTEM "repmgr-node-status.sgml">
|
<!ENTITY repmgr-node-status SYSTEM "repmgr-node-status.sgml">
|
||||||
<!ENTITY repmgr-node-check SYSTEM "repmgr-node-check.sgml">
|
<!ENTITY repmgr-node-check SYSTEM "repmgr-node-check.sgml">
|
||||||
<!ENTITY repmgr-node-rejoin SYSTEM "repmgr-node-rejoin.sgml">
|
<!ENTITY repmgr-node-rejoin SYSTEM "repmgr-node-rejoin.sgml">
|
||||||
@@ -70,8 +79,14 @@
|
|||||||
<!ENTITY repmgr-cluster-crosscheck SYSTEM "repmgr-cluster-crosscheck.sgml">
|
<!ENTITY repmgr-cluster-crosscheck SYSTEM "repmgr-cluster-crosscheck.sgml">
|
||||||
<!ENTITY repmgr-cluster-event SYSTEM "repmgr-cluster-event.sgml">
|
<!ENTITY repmgr-cluster-event SYSTEM "repmgr-cluster-event.sgml">
|
||||||
<!ENTITY repmgr-cluster-cleanup SYSTEM "repmgr-cluster-cleanup.sgml">
|
<!ENTITY repmgr-cluster-cleanup SYSTEM "repmgr-cluster-cleanup.sgml">
|
||||||
|
<!ENTITY repmgr-daemon-status SYSTEM "repmgr-daemon-status.sgml">
|
||||||
|
<!ENTITY repmgr-daemon-pause SYSTEM "repmgr-daemon-pause.sgml">
|
||||||
|
<!ENTITY repmgr-daemon-unpause SYSTEM "repmgr-daemon-unpause.sgml">
|
||||||
|
|
||||||
|
<!ENTITY appendix-release-notes SYSTEM "appendix-release-notes.sgml">
|
||||||
|
<!ENTITY appendix-faq SYSTEM "appendix-faq.sgml">
|
||||||
<!ENTITY appendix-signatures SYSTEM "appendix-signatures.sgml">
|
<!ENTITY appendix-signatures SYSTEM "appendix-signatures.sgml">
|
||||||
|
<!ENTITY appendix-packages SYSTEM "appendix-packages.sgml">
|
||||||
|
|
||||||
<!ENTITY bookindex SYSTEM "bookindex.sgml">
|
<!ENTITY bookindex SYSTEM "bookindex.sgml">
|
||||||
|
|
||||||
|
|||||||
@@ -1,4 +1,9 @@
|
|||||||
<chapter id="follow-new-primary" xreflabel="Following a new primary">
|
<chapter id="follow-new-primary">
|
||||||
|
<indexterm>
|
||||||
|
<primary>Following a new primary</primary>
|
||||||
|
<seealso>repmgr standby follow</seealso>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
<title>Following a new primary</title>
|
<title>Following a new primary</title>
|
||||||
<para>
|
<para>
|
||||||
Following the failure or removal of the replication cluster's existing primary
|
Following the failure or removal of the replication cluster's existing primary
|
||||||
@@ -22,7 +27,8 @@
|
|||||||
</programlisting>
|
</programlisting>
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
The standby is now replicating from the new primary and `repmgr cluster show`
|
The standby is now replicating from the new primary and
|
||||||
|
<command><link linkend="repmgr-cluster-show">repmgr cluster show</link></command>
|
||||||
output reflects this:
|
output reflects this:
|
||||||
<programlisting>
|
<programlisting>
|
||||||
$ repmgr -f /etc/repmgr.conf cluster show
|
$ repmgr -f /etc/repmgr.conf cluster show
|
||||||
|
|||||||
@@ -1,32 +1,228 @@
|
|||||||
<sect1 id="installation-packages" xreflabel="Installing from packages">
|
<sect1 id="installation-packages" xreflabel="Installing from packages">
|
||||||
<title>Installing &repmgr; from packages</title>
|
<title>Installing &repmgr; from packages</title>
|
||||||
<para>
|
<para>
|
||||||
We recommend installing `repmgr` using the available packages for your
|
We recommend installing &repmgr; using the available packages for your
|
||||||
system.
|
system.
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
<sect2 id="installation-packages-redhat" xreflabel="Installing from packages on RHEL, Fedora and CentOS">
|
<sect2 id="installation-packages-redhat" xreflabel="Installing from packages on RHEL, CentOS and Fedora">
|
||||||
<title>RedHat/Fedora/CentOS</title>
|
|
||||||
<para>
|
<indexterm>
|
||||||
RPM packages for `repmgr` are available via Yum through
|
<primary>installation</primary>
|
||||||
the PostgreSQL Global Development Group RPM repository
|
<secondary>on Red Hat/CentOS/Fedora etc.</secondary>
|
||||||
( <ulink url="https://yum.postgresql.org/">http://yum.postgresql.org/</>).
|
</indexterm>
|
||||||
Follow the instructions for your distribution (RedHat, CentOS,
|
|
||||||
Fedora, etc.) and architecture as detailed at yum.postgresql.org.
|
<title>RedHat/CentOS/Fedora</title>
|
||||||
</para>
|
<para>
|
||||||
<para>
|
&repmgr; RPM packages for RedHat/CentOS variants and Fedora are available from the
|
||||||
2ndQuadrant also provides its own RPM packages which are made available
|
<ulink url="https://2ndquadrant.com">2ndQuadrant</ulink>
|
||||||
at the same time as each `repmgr` release, as it can take some days for
|
<ulink url="https://dl.2ndquadrant.com/">public repository</ulink>; see following
|
||||||
them to become available via the main PGDG repository. See here for details:
|
section for details.
|
||||||
<ulink url="http://repmgr.org/yum-repository.html">http://repmgr.org/yum-repository.html</>
|
|
||||||
</para>
|
|
||||||
</sect2>
|
|
||||||
<sect2 id="installation-packages-debian" xreflabel="Installing from packages on Debian or Ubuntu">
|
|
||||||
<title>Debian/Ubuntu</title>
|
|
||||||
<para>.deb packages for `repmgr` are available from the
|
|
||||||
PostgreSQL Community APT repository (<ulink url="http://apt.postgresql.org/">http://apt.postgresql.org/</> ).
|
|
||||||
Instructions can be found in the APT section of the PostgreSQL Wiki
|
|
||||||
(<ulink url="https://wiki.postgresql.org/wiki/Apt">https://wiki.postgresql.org/wiki/Apt</> ).
|
|
||||||
</para>
|
</para>
|
||||||
|
<para>
|
||||||
|
RPM packages for &repmgr; are also available via Yum through
|
||||||
|
the PostgreSQL Global Development Group RPM repository
|
||||||
|
(<ulink url="https://yum.postgresql.org/">http://yum.postgresql.org/</ulink>).
|
||||||
|
Follow the instructions for your distribution (RedHat, CentOS,
|
||||||
|
Fedora, etc.) and architecture as detailed there. Note that it can take some days
|
||||||
|
for new &repmgr; packages to become available via the this repository.
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
&repmgr; packages are designed to be compatible with the community-provided PostgreSQL packages.
|
||||||
|
They may not work with vendor-specific packages such as those provided by RedHat for RHEL
|
||||||
|
customers, as the filesystem layout may be different to the community RPMs.
|
||||||
|
Please contact your support vendor for assistance.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
For more information on the package contents, including details of installation
|
||||||
|
paths and relevant <link linkend="configuration-file-service-commands">service commands</link>,
|
||||||
|
see the appendix section <xref linkend="packages-centos">.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
|
||||||
|
<sect3 id="installation-packages-redhat-2ndq">
|
||||||
|
<title>2ndQuadrant public RPM yum repository</title>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
Beginning with <ulink url="https://repmgr.org/docs/4.1/release-4.0.5.html">repmgr 4.0.5</ulink>,
|
||||||
|
<ulink url="https://2ndquadrant.com/">2ndQuadrant</ulink> provides a dedicated <literal>yum</literal>
|
||||||
|
<ulink url="https://dl.2ndquadrant.com/">public repository</ulink> for 2ndQuadrant software,
|
||||||
|
including &repmgr;. We recommend using this for all future &repmgr; releases.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
General instructions for using this repository can be found on its
|
||||||
|
<ulink url="https://dl.2ndquadrant.com/">homepage</ulink>. Specific instructions
|
||||||
|
for installing &repmgr; follow below.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
<emphasis>Installation</emphasis>
|
||||||
|
|
||||||
|
<itemizedlist>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Locate the repository RPM for your PostgreSQL version from the list at:
|
||||||
|
<ulink url="https://dl.2ndquadrant.com/">https://dl.2ndquadrant.com/</ulink>
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Install the repository definition for your distribution and PostgreSQL version
|
||||||
|
(this enables the 2ndQuadrant repository as a source of &repmgr; packages).
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
For example, for PostgreSQL 10 on CentOS, execute:
|
||||||
|
<programlisting>
|
||||||
|
curl https://dl.2ndquadrant.com/default/release/get/10/rpm | sudo bash</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Verify that the repository is installed with:
|
||||||
|
<programlisting>
|
||||||
|
sudo yum repolist</programlisting>
|
||||||
|
The output should contain two entries like this:
|
||||||
|
<programlisting>
|
||||||
|
2ndquadrant-dl-default-release-pg10/7/x86_64 2ndQuadrant packages (PG10) for 7 - x86_64 4
|
||||||
|
2ndquadrant-dl-default-release-pg10-debug/7/x86_64 2ndQuadrant packages (PG10) for 7 - x86_64 - Debug 3</programlisting>
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Install the &repmgr version appropriate for your PostgreSQL version (e.g. <literal>repmgr10</literal>):
|
||||||
|
<programlisting>
|
||||||
|
$ yum install repmgr10</programlisting>
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</itemizedlist>
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
<emphasis>Compatibility with PGDG Repositories</emphasis>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
The 2ndQuadrant &repmgr; yum repository packages use the same definitions and file system layout as the
|
||||||
|
main PGDG repository.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Normally <application>yum</application> will prioritize the repository with the most recent &repmgr; version.
|
||||||
|
Once the PGDG repository has been updated, it doesn't matter which repository
|
||||||
|
the packages are installed from.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
To ensure the 2ndQuadrant repository is always prioritised, install <literal>yum-plugin-priorities</literal>
|
||||||
|
and set the repository priorities accordingly.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
<emphasis>Installing a specific package version</emphasis>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
To install a specific package version, execute <command>yum --showduplicates list</command>
|
||||||
|
for the package in question:
|
||||||
|
<programlisting>
|
||||||
|
[root@localhost ~]# yum --showduplicates list repmgr10
|
||||||
|
Loaded plugins: fastestmirror
|
||||||
|
Loading mirror speeds from cached hostfile
|
||||||
|
* base: ftp.iij.ad.jp
|
||||||
|
* extras: ftp.iij.ad.jp
|
||||||
|
* updates: ftp.iij.ad.jp
|
||||||
|
Available Packages
|
||||||
|
repmgr10.x86_64 4.0.3-1.rhel7 pgdg10
|
||||||
|
repmgr10.x86_64 4.0.4-1.rhel7 pgdg10
|
||||||
|
repmgr10.x86_64 4.0.5-1.el7 2ndquadrant-repo-10</programlisting>
|
||||||
|
then append the appropriate version number to the package name with a hyphen, e.g.:
|
||||||
|
<programlisting>
|
||||||
|
[root@localhost ~]# yum install repmgr10-4.0.3-1.rhel7</programlisting>
|
||||||
|
</para>
|
||||||
|
</sect3>
|
||||||
</sect2>
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="installation-packages-debian" xreflabel="Installing from packages on Debian or Ubuntu">
|
||||||
|
|
||||||
|
<indexterm>
|
||||||
|
<primary>installation</primary>
|
||||||
|
<secondary>on Debian/Ubuntu etc.</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<title>Debian/Ubuntu</title>
|
||||||
|
<para>.deb packages for &repmgr; are available from the
|
||||||
|
PostgreSQL Community APT repository (<ulink url="http://apt.postgresql.org/">http://apt.postgresql.org/</ulink>).
|
||||||
|
Instructions can be found in the APT section of the PostgreSQL Wiki
|
||||||
|
(<ulink url="https://wiki.postgresql.org/wiki/Apt">https://wiki.postgresql.org/wiki/Apt</ulink>).
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
For more information on the package contents, including details of installation
|
||||||
|
paths and relevant <link linkend="configuration-file-service-commands">service commands</link>,
|
||||||
|
see the appendix section <xref linkend="packages-debian-ubuntu">.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<sect3 id="installation-packages-debian-ubuntu-2ndq">
|
||||||
|
<title>2ndQuadrant public apt repository for Debian/Ubuntu</title>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
Beginning with <ulink url="https://repmgr.org/docs/4.0/release-4.0.5.html">repmgr 4.0.5</ulink>,
|
||||||
|
<ulink url="https://2ndquadrant.com/">2ndQuadrant</ulink> provides a
|
||||||
|
<ulink url="https://dl.2ndquadrant.com/">public apt repository</ulink> for 2ndQuadrant software,
|
||||||
|
including &repmgr;.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
General instructions for using this repository can be found on its
|
||||||
|
<ulink url="https://dl.2ndquadrant.com/">homepage</ulink>. Specific instructions
|
||||||
|
for installing &repmgr; follow below.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
|
||||||
|
<emphasis>Installation</emphasis>
|
||||||
|
|
||||||
|
<itemizedlist>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Install the repository definition for your distribution and PostgreSQL version
|
||||||
|
(this enables the 2ndQuadrant repository as a source of &repmgr; packages) by executing:
|
||||||
|
<programlisting>
|
||||||
|
curl https://dl.2ndquadrant.com/default/release/get/deb | sudo bash</programlisting>
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
This will automatically install the following additional packages, if not already present:
|
||||||
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal>lsb-release</literal></simpara>
|
||||||
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal>apt-transport-https</literal></simpara>
|
||||||
|
</listitem>
|
||||||
|
</itemizedlist>
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Install the &repmgr version appropriate for your PostgreSQL version (e.g. <literal>repmgr10</literal>):
|
||||||
|
<programlisting>
|
||||||
|
$ apt-get install postgresql-10-repmgr</programlisting>
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
For packages for PostgreSQL 9.6 and earlier, the package name includes
|
||||||
|
a period between major and minor version numbers, e.g.
|
||||||
|
<literal>postgresql-9.6-repmgr</literal>.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
</itemizedlist>
|
||||||
|
|
||||||
|
</para>
|
||||||
|
|
||||||
|
</sect3>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
</sect1>
|
</sect1>
|
||||||
|
|||||||
@@ -1,4 +1,10 @@
|
|||||||
<sect1 id="install-requirements" xreflabel="installation requirements">
|
<sect1 id="install-requirements" xreflabel="installation requirements">
|
||||||
|
|
||||||
|
<indexterm>
|
||||||
|
<primary>installation</primary>
|
||||||
|
<secondary>requirements</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
<title>Requirements for installing repmgr</title>
|
<title>Requirements for installing repmgr</title>
|
||||||
<para>
|
<para>
|
||||||
repmgr is developed and tested on Linux and OS X, but should work on any
|
repmgr is developed and tested on Linux and OS X, but should work on any
|
||||||
@@ -7,17 +13,14 @@
|
|||||||
</para>
|
</para>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
From version 4.0, repmgr is compatible with all PostgreSQL versions from 9.4, including PostgreSQL 10.
|
From version 4.0, repmgr is compatible with all PostgreSQL versions from 9.3, including PostgreSQL 10.
|
||||||
</para>
|
Note that some &repmgr; functionality is not available in PostgreSQL 9.3 and PostgreSQL 9.4.
|
||||||
<para>
|
|
||||||
PostgreSQL 9.3 is supported by repmgr 3.3.
|
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
<note>
|
<note>
|
||||||
<simpara>
|
<simpara>
|
||||||
If upgrading from `repmgr 3`, please see the separate upgrade guide
|
If upgrading from &repmgr; 3.x, please see the section <xref linkend="upgrading-from-repmgr-3">.
|
||||||
`doc/upgrading-from-repmgr3.md`.
|
</simpara>
|
||||||
</simpara>
|
|
||||||
</note>
|
</note>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
@@ -26,42 +29,51 @@ If upgrading from `repmgr 3`, please see the separate upgrade guide
|
|||||||
</para>
|
</para>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
`repmgr` must be installed on each server in the replication cluster.
|
&repmgr; must be installed on each server in the replication cluster.
|
||||||
If installing repmgr from packages, the package version must match the PostgreSQL
|
If installing repmgr from packages, the package version must match the PostgreSQL
|
||||||
version. If installing from source, repmgr must be compiled against the same
|
version. If installing from source, repmgr must be compiled against the same
|
||||||
major version.
|
major version.
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
A dedicated system user for `repmgr` is *not* required; as many `repmgr` and
|
A dedicated system user for &repmgr; is <emphasis>not</emphasis> required; as many &repmgr; and
|
||||||
`repmgrd` actions require direct access to the PostgreSQL data directory,
|
<application>repmgrd</application> actions require direct access to the PostgreSQL data directory,
|
||||||
these commands should be executed by the `postgres` user.
|
these commands should be executed by the <literal>postgres</literal> user.
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
Passwordless `ssh` connectivity between all servers in the replication cluster
|
Passwordless <command>ssh</command> connectivity between all servers in the replication cluster
|
||||||
is not required, but is necessary in the following cases:
|
is not required, but is necessary in the following cases:
|
||||||
<itemizedlist>
|
<itemizedlist>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara>if you need `repmgr` to copy configuration files from outside the PostgreSQL
|
<simpara>if you need &repmgr; to copy configuration files from outside the PostgreSQL
|
||||||
data directory (in which case `rsync` is also required)</simpara>
|
data directory (in which case <command>rsync</command> is also required)</simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara>to perform switchover operations</simpara>
|
<simpara>to perform <link linkend="performing-switchover">switchover operations</link></simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara>when executing `repmgr cluster matrix` and `repmgr cluster crosscheck`</simpara>
|
<simpara>
|
||||||
|
when executing <command><link linkend="repmgr-cluster-matrix">repmgr cluster matrix</link></command>
|
||||||
|
and <command><link linkend="repmgr-cluster-crosscheck">repmgr cluster crosscheck</link></command>
|
||||||
|
</simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
</itemizedlist>
|
</itemizedlist>
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
|
<tip>
|
||||||
|
<simpara>
|
||||||
|
Consider setting <varname>ConnectTimeout</varname> to a low value in your SSH configuration.
|
||||||
|
This will make it faster to detect any SSH connection errors.
|
||||||
|
</simpara>
|
||||||
|
</tip>
|
||||||
|
|
||||||
<tip>
|
<tip>
|
||||||
<simpara>
|
<simpara>
|
||||||
We recommend using a session multiplexer utility such as `screen` or
|
We recommend using a session multiplexer utility such as <command>screen</command> or
|
||||||
`tmux` when performing long-running actions (such as cloning a database)
|
<command>tmux</command> when performing long-running actions (such as cloning a database)
|
||||||
on a remote server - this will ensure the `repmgr` action won't be prematurely
|
on a remote server - this will ensure the &repmgr; action won't be prematurely
|
||||||
terminated if your `ssh` session to the server is interrupted or closed.
|
terminated if your <command>ssh</command> session to the server is interrupted or closed.
|
||||||
</simpara>
|
</simpara>
|
||||||
</tip>
|
</tip>
|
||||||
</sect1>
|
</sect1>
|
||||||
|
|||||||
@@ -1,4 +1,9 @@
|
|||||||
<sect1 id="installation-source" xreflabel="Installing from source code">
|
<sect1 id="installation-source" xreflabel="Installing from source code">
|
||||||
|
<indexterm>
|
||||||
|
<primary>installation</primary>
|
||||||
|
<secondary>from source</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
<title>Installing &repmgr; from source</title>
|
<title>Installing &repmgr; from source</title>
|
||||||
|
|
||||||
<sect2 id="installation-source-prereqs">
|
<sect2 id="installation-source-prereqs">
|
||||||
@@ -7,8 +12,8 @@
|
|||||||
To install &repmgr; the prerequisites for compiling
|
To install &repmgr; the prerequisites for compiling
|
||||||
&postgres; must be installed. These are described in &postgres;'s
|
&postgres; must be installed. These are described in &postgres;'s
|
||||||
documentation
|
documentation
|
||||||
on <ulink url="https://www.postgresql.org/docs/current/install-requirements.html">build requirements</ulink>
|
on <ulink url="https://www.postgresql.org/docs/current/static/install-requirements.html">build requirements</ulink>
|
||||||
and <ulink url="https://www.postgresql.org/docs/current/docguide-toolsets.html">build requirements for documentation</ulink>.
|
and <ulink url="https://www.postgresql.org/docs/current/static/docguide-toolsets.html">build requirements for documentation</ulink>.
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
@@ -25,8 +30,7 @@
|
|||||||
building PostgreSQL with:
|
building PostgreSQL with:
|
||||||
<programlisting>
|
<programlisting>
|
||||||
sudo apt-get update
|
sudo apt-get update
|
||||||
sudo apt-get build-dep postgresql-9.6
|
sudo apt-get build-dep postgresql-9.6</programlisting>
|
||||||
</programlisting>
|
|
||||||
</para>
|
</para>
|
||||||
</listitem>
|
</listitem>
|
||||||
<listitem>
|
<listitem>
|
||||||
@@ -39,8 +43,7 @@
|
|||||||
sudo yum check-update
|
sudo yum check-update
|
||||||
sudo yum groupinstall "Development Tools"
|
sudo yum groupinstall "Development Tools"
|
||||||
sudo yum install yum-utils openjade docbook-dtds docbook-style-dsssl docbook-style-xsl
|
sudo yum install yum-utils openjade docbook-dtds docbook-style-dsssl docbook-style-xsl
|
||||||
sudo yum-builddep postgresql96
|
sudo yum-builddep postgresql96</programlisting>
|
||||||
</programlisting>
|
|
||||||
</para>
|
</para>
|
||||||
</listitem>
|
</listitem>
|
||||||
</itemizedlist>
|
</itemizedlist>
|
||||||
@@ -77,14 +80,13 @@
|
|||||||
</para>
|
</para>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
There are also tags for each &repmgr; release, e.g. <filename>REL4_0_STABLE</filename>.
|
There are also tags for each &repmgr; release, e.g. <filename>4.0.5</filename>.
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
Clone the source code using <application>git</application>:
|
Clone the source code using <application>git</application>:
|
||||||
<programlisting>
|
<programlisting>
|
||||||
git clone https://github.com/2ndQuadrant/repmgr
|
git clone https://github.com/2ndQuadrant/repmgr</programlisting>
|
||||||
</programlisting>
|
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
@@ -129,11 +131,45 @@
|
|||||||
To installing &repmgr; from source, simply execute:
|
To installing &repmgr; from source, simply execute:
|
||||||
|
|
||||||
<programlisting>
|
<programlisting>
|
||||||
./configure && make install
|
./configure && make install</programlisting>
|
||||||
</programlisting>
|
|
||||||
|
|
||||||
Ensure `pg_config` for the target PostgreSQL version is in `$PATH`.
|
Ensure <command>pg_config</command> for the target PostgreSQL version is in
|
||||||
|
<varname>$PATH</varname>.
|
||||||
</para>
|
</para>
|
||||||
</sect2>
|
</sect2>
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
<sect2 id="installation-build-repmgr-docs">
|
||||||
|
<title>Building &repmgr; documentation</title>
|
||||||
|
<para>
|
||||||
|
The &repmgr; documentation is (like the main PostgreSQL project)
|
||||||
|
written in DocBook format. To build it locally as HTML, you'll need to
|
||||||
|
install the required packages as described in the
|
||||||
|
<ulink url="https://www.postgresql.org/docs/9.6/static/docguide-toolsets.html">
|
||||||
|
PostgreSQL documentation</ulink> then execute:
|
||||||
|
<programlisting>
|
||||||
|
./configure && make install-doc</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
The generated HTML files will be placed in the <filename>doc/html</filename>
|
||||||
|
subdirectory of your source tree.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
To build the documentation as a single HTML file, execute:
|
||||||
|
<programlisting>
|
||||||
|
cd doc/ && make repmgr.html</programlisting>
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<simpara>
|
||||||
|
Due to changes in PostgreSQL's documentation build system from PostgreSQL 10,
|
||||||
|
the documentation can currently only be built agains PostgreSQL 9.6 or earlier.
|
||||||
|
This limitation will be fixed when time and resources permit.
|
||||||
|
</simpara>
|
||||||
|
</note>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
|
||||||
</sect1>
|
</sect1>
|
||||||
|
|||||||
@@ -1,4 +1,8 @@
|
|||||||
<chapter id="installation" xreflabel="Installation">
|
<chapter id="installation" xreflabel="Installation">
|
||||||
|
<indexterm>
|
||||||
|
<primary>installation</primary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
<title>Installation</title>
|
<title>Installation</title>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
|
|||||||
@@ -1,9 +1,9 @@
|
|||||||
<!-- doc/src/sgml/legal.sgml -->
|
<!-- doc/legal.sgml -->
|
||||||
|
|
||||||
<date>2017</date>
|
<date>2017</date>
|
||||||
|
|
||||||
<copyright>
|
<copyright>
|
||||||
<year>2010-2017</year>
|
<year>2010-2018</year>
|
||||||
<holder>2ndQuadrant, Ltd.</holder>
|
<holder>2ndQuadrant, Ltd.</holder>
|
||||||
</copyright>
|
</copyright>
|
||||||
|
|
||||||
@@ -11,10 +11,27 @@
|
|||||||
<title>Legal Notice</title>
|
<title>Legal Notice</title>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
<productname>repmgr</productname> is Copyright © 2010-2017
|
<productname>repmgr</productname> is Copyright © 2010-2018
|
||||||
by 2ndQuadrant, Ltd.
|
by 2ndQuadrant, Ltd. All rights reserved.
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
<para>add license</para>
|
<para>
|
||||||
|
This program is free software: you can redistribute it and/or modify
|
||||||
|
it under the terms of the GNU General Public License as published by
|
||||||
|
the Free Software Foundation, either version 3 of the License, or
|
||||||
|
(at your option) any later version.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
This program is distributed in the hope that it will be useful,
|
||||||
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
GNU General Public License for more details.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
You should have received a copy of the GNU General Public License
|
||||||
|
along with this program. If not, see
|
||||||
|
<ulink url="https://www.gnu.org/licenses/">https://www.gnu.org/licenses/</ulink>
|
||||||
|
to obtain one.
|
||||||
|
</para>
|
||||||
|
|
||||||
</legalnotice>
|
</legalnotice>
|
||||||
|
|||||||
@@ -2,9 +2,15 @@
|
|||||||
<title>repmgr overview</title>
|
<title>repmgr overview</title>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
This chapter provides a high-level overview of repmgr's components and functionality.
|
This chapter provides a high-level overview of &repmgr;'s components and
|
||||||
|
functionality.
|
||||||
</para>
|
</para>
|
||||||
<sect1 id="repmgr-concepts" xreflabel="Concepts">
|
<sect1 id="repmgr-concepts" xreflabel="Concepts">
|
||||||
|
|
||||||
|
<indexterm>
|
||||||
|
<primary>concepts</primary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
<title>Concepts</title>
|
<title>Concepts</title>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
@@ -15,13 +21,13 @@
|
|||||||
streaming replication</>.
|
streaming replication</>.
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
The following terms are used throughout the `repmgr` documentation.
|
The following terms are used throughout the &repmgr; documentation.
|
||||||
<variablelist>
|
<variablelist>
|
||||||
<varlistentry>
|
<varlistentry>
|
||||||
<term>replication cluster</term>
|
<term>replication cluster</term>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara>
|
<simpara>
|
||||||
In the `repmgr` documentation, "replication cluster" refers to the network
|
In the &repmgr; documentation, "replication cluster" refers to the network
|
||||||
of PostgreSQL servers connected by streaming replication.
|
of PostgreSQL servers connected by streaming replication.
|
||||||
</simpara>
|
</simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
@@ -31,7 +37,7 @@
|
|||||||
<term>node</term>
|
<term>node</term>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara>
|
<simpara>
|
||||||
A node is a server within a replication cluster.
|
A node is a single PostgreSQL server within a replication cluster.
|
||||||
</simpara>
|
</simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
</varlistentry>
|
</varlistentry>
|
||||||
@@ -41,7 +47,7 @@
|
|||||||
<listitem>
|
<listitem>
|
||||||
<simpara>
|
<simpara>
|
||||||
The node a standby server connects to, in order to receive streaming replication.
|
The node a standby server connects to, in order to receive streaming replication.
|
||||||
This is either the primary server or in the case of cascading replication, another
|
This is either the primary server, or in the case of cascading replication, another
|
||||||
standby.
|
standby.
|
||||||
</simpara>
|
</simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
@@ -52,7 +58,7 @@
|
|||||||
<listitem>
|
<listitem>
|
||||||
<simpara>
|
<simpara>
|
||||||
This is the action which occurs if a primary server fails and a suitable standby
|
This is the action which occurs if a primary server fails and a suitable standby
|
||||||
is promoted as the new primary. The `repmgrd` daemon supports automatic failover
|
is promoted as the new primary. The <application>repmgrd</application> daemon supports automatic failover
|
||||||
to minimise downtime.
|
to minimise downtime.
|
||||||
</simpara>
|
</simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
@@ -66,7 +72,7 @@
|
|||||||
it's necessary to take a primary server offline; in this case a controlled
|
it's necessary to take a primary server offline; in this case a controlled
|
||||||
switchover is necessary, whereby a suitable standby is promoted and the
|
switchover is necessary, whereby a suitable standby is promoted and the
|
||||||
existing primary removed from the replication cluster in a controlled manner.
|
existing primary removed from the replication cluster in a controlled manner.
|
||||||
The `repmgr` command line client provides this functionality.
|
The &repmgr; command line client provides this functionality.
|
||||||
</simpara>
|
</simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
</varlistentry>
|
</varlistentry>
|
||||||
@@ -82,13 +88,37 @@
|
|||||||
</simpara>
|
</simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
</varlistentry>
|
</varlistentry>
|
||||||
|
<varlistentry id="witness-server">
|
||||||
|
<term>witness server</term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
&repmgr; provides functionality to set up a so-called "witness server" to
|
||||||
|
assist in determining a new primary server in a failover situation with more
|
||||||
|
than one standby. The witness server itself is not part of the replication
|
||||||
|
cluster, although it does contain a copy of the repmgr metadata schema.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
The purpose of a witness server is to provide a "casting vote" where servers
|
||||||
|
in the replication cluster are split over more than one location. In the event
|
||||||
|
of a loss of connectivity between locations, the presence or absence of
|
||||||
|
the witness server will decide whether a server at that location is promoted
|
||||||
|
to primary; this is to prevent a "split-brain" situation where an isolated
|
||||||
|
location interprets a network outage as a failure of the (remote) primary and
|
||||||
|
promotes a (local) standby.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
A witness server only needs to be created if <application>repmgrd</application>
|
||||||
|
is in use.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
</variablelist>
|
</variablelist>
|
||||||
</para>
|
</para>
|
||||||
</sect1>
|
</sect1>
|
||||||
<sect1 id="repmgr-components" xreflabel="Components">
|
<sect1 id="repmgr-components" xreflabel="Components">
|
||||||
<title>Components</title>
|
<title>Components</title>
|
||||||
<para>
|
<para>
|
||||||
`repmgr` is a suite of open-source tools to manage replication and failover
|
&repmgr; is a suite of open-source tools to manage replication and failover
|
||||||
within a cluster of PostgreSQL servers. It supports and enhances PostgreSQL's
|
within a cluster of PostgreSQL servers. It supports and enhances PostgreSQL's
|
||||||
built-in streaming replication, which provides a single read/write primary server
|
built-in streaming replication, which provides a single read/write primary server
|
||||||
and one or more read-only standbys containing near-real time copies of the primary
|
and one or more read-only standbys containing near-real time copies of the primary
|
||||||
@@ -147,11 +177,12 @@
|
|||||||
<sect1 id="repmgr-user-metadata" xreflabel="Repmgr user and metadata">
|
<sect1 id="repmgr-user-metadata" xreflabel="Repmgr user and metadata">
|
||||||
<title>Repmgr user and metadata</title>
|
<title>Repmgr user and metadata</title>
|
||||||
<para>
|
<para>
|
||||||
In order to effectively manage a replication cluster, `repmgr` needs to store
|
In order to effectively manage a replication cluster, &repmgr; needs to store
|
||||||
information about the servers in the cluster in a dedicated database schema.
|
information about the servers in the cluster in a dedicated database schema.
|
||||||
This schema is automatically by the `repmgr` extension, which is installed
|
This schema is automatically created by the &repmgr; extension, which is installed
|
||||||
during the first step in initialising a `repmgr`-administered cluster
|
during the first step in initializing a &repmgr;-administered cluster
|
||||||
(`repmgr primary register`) and contains the following objects:
|
(<command><link linkend="repmgr-primary-register">repmgr primary register</link></command>)
|
||||||
|
and contains the following objects:
|
||||||
<variablelist>
|
<variablelist>
|
||||||
<varlistentry>
|
<varlistentry>
|
||||||
<term>Tables</term>
|
<term>Tables</term>
|
||||||
@@ -159,14 +190,15 @@
|
|||||||
<para>
|
<para>
|
||||||
<itemizedlist>
|
<itemizedlist>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara>repmgr.events: records events of interest</simpara>
|
<simpara><literal>repmgr.events</literal>: records events of interest</simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara>repmgr.nodes: connection and status information for each server in the
|
<simpara><literal>repmgr.nodes</literal>: connection and status information for each server in the
|
||||||
replication cluster</simpara>
|
replication cluster</simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara>repmgr.monitoring_history: historical standby monitoring information written by `repmgrd`</simpara>
|
<simpara><literal>repmgr.monitoring_history</literal>: historical standby monitoring information
|
||||||
|
written by <application>repmgrd</application></simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
</itemizedlist>
|
</itemizedlist>
|
||||||
</para>
|
</para>
|
||||||
@@ -178,12 +210,12 @@
|
|||||||
<para>
|
<para>
|
||||||
<itemizedlist>
|
<itemizedlist>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara>repmgr.show_nodes: based on the table `repl_nodes`, additionally showing the
|
<simpara>repmgr.show_nodes: based on the table <literal>repmgr.nodes</literal>, additionally showing the
|
||||||
name of the server's upstream node</simpara>
|
name of the server's upstream node</simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara>repmgr.replication_status: when `repmgrd`'s monitoring is enabled, shows current monitoring
|
<simpara>repmgr.replication_status: when <application>repmgrd</application>'s monitoring is enabled, shows
|
||||||
status for each standby.</simpara>
|
current monitoring status for each standby.</simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
</itemizedlist>
|
</itemizedlist>
|
||||||
</para>
|
</para>
|
||||||
@@ -193,16 +225,16 @@
|
|||||||
</para>
|
</para>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
The `repmgr` metadata schema can be stored in an existing database or in its own
|
The &repmgr; metadata schema can be stored in an existing database or in its own
|
||||||
dedicated database. Note that the `repmgr` metadata schema cannot reside on a database
|
dedicated database. Note that the &repmgr; metadata schema cannot reside on a database
|
||||||
server which is not part of the replication cluster managed by `repmgr`.
|
server which is not part of the replication cluster managed by &repmgr;.
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
A database user must be available for `repmgr` to access this database and perform
|
A database user must be available for &repmgr; to access this database and perform
|
||||||
necessary changes. This user does not need to be a superuser, however some operations
|
necessary changes. This user does not need to be a superuser, however some operations
|
||||||
such as initial installation of the `repmgr` extension will require a superuser
|
such as initial installation of the &repmgr; extension will require a superuser
|
||||||
connection (this can be specified where required with the command line option
|
connection (this can be specified where required with the command line option
|
||||||
`--superuser`).
|
<literal>--superuser</literal>).
|
||||||
</para>
|
</para>
|
||||||
</sect1>
|
</sect1>
|
||||||
|
|
||||||
|
|||||||
@@ -1,4 +1,8 @@
|
|||||||
<chapter id="promoting-standby" xreflabel="Promoting a standby">
|
<chapter id="promoting-standby" xreflabel="Promoting a standby">
|
||||||
|
<indexterm>
|
||||||
|
<primary>promoting a standby</primary>
|
||||||
|
<seealso>repmgr standby promote</seealso>
|
||||||
|
</indexterm>
|
||||||
<title>Promoting a standby server with repmgr</title>
|
<title>Promoting a standby server with repmgr</title>
|
||||||
<para>
|
<para>
|
||||||
If a primary server fails or needs to be removed from the replication cluster,
|
If a primary server fails or needs to be removed from the replication cluster,
|
||||||
|
|||||||
@@ -5,12 +5,17 @@
|
|||||||
This section gives a quick introduction to &repmgr;, including setting up a
|
This section gives a quick introduction to &repmgr;, including setting up a
|
||||||
sample &repmgr; installation and a basic replication cluster.
|
sample &repmgr; installation and a basic replication cluster.
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
These instructions are not suitable for a production install, as they may not
|
These instructions for demonstration purposes and are not suitable for a production
|
||||||
take into account security considerations, proper system administration
|
install, as issues such as account security considerations, and system administration
|
||||||
procedures etc..
|
best practices are omitted.
|
||||||
</para>
|
</para>
|
||||||
|
<note>
|
||||||
|
<simpara>
|
||||||
|
To upgrade an existing &repmgr; 3.x installation, see section
|
||||||
|
<xref linkend="upgrading-from-repmgr-3">.
|
||||||
|
</simpara>
|
||||||
|
</note>
|
||||||
|
|
||||||
<sect1 id="quickstart-prerequisites">
|
<sect1 id="quickstart-prerequisites">
|
||||||
<title>Prerequisites for setting up a basic replication cluster with &repmgr;</title>
|
<title>Prerequisites for setting up a basic replication cluster with &repmgr;</title>
|
||||||
@@ -98,11 +103,11 @@
|
|||||||
# ignores archiving. Use something more sensible.
|
# ignores archiving. Use something more sensible.
|
||||||
archive_command = '/bin/true'
|
archive_command = '/bin/true'
|
||||||
|
|
||||||
# If you have configured `pg_basebackup_options`
|
# If you have configured "pg_basebackup_options"
|
||||||
# in `repmgr.conf` to include the setting `--xlog-method=fetch` (from
|
# in "repmgr.conf" to include the setting "--xlog-method=fetch" (from
|
||||||
# PostgreSQL 10 `--wal-method=fetch`), *and* you have not set
|
# PostgreSQL 10 "--wal-method=fetch"), *and* you have not set
|
||||||
# `restore_command` in `repmgr.conf`to fetch WAL files from another
|
# "restore_command" in "repmgr.conf"to fetch WAL files from another
|
||||||
# source such as Barman, you'll need to set `wal_keep_segments` to a
|
# source such as Barman, you'll need to set "wal_keep_segments" to a
|
||||||
# high enough value to ensure that all WAL files generated while
|
# high enough value to ensure that all WAL files generated while
|
||||||
# the standby is being cloned are retained until the standby starts up.
|
# the standby is being cloned are retained until the standby starts up.
|
||||||
#
|
#
|
||||||
@@ -116,6 +121,11 @@
|
|||||||
<command>include 'postgresql.replication.conf</command>.
|
<command>include 'postgresql.replication.conf</command>.
|
||||||
</simpara>
|
</simpara>
|
||||||
</tip>
|
</tip>
|
||||||
|
<para>
|
||||||
|
Additionally, if you are intending to use <application>pg_rewind</application>,
|
||||||
|
and the cluster was not initialised using data checksums, you may want to consider enabling
|
||||||
|
<varname>wal_log_hints</varname>; for more details see <xref linkend="repmgr-node-rejoin-pg-rewind">.
|
||||||
|
</para>
|
||||||
</sect1>
|
</sect1>
|
||||||
|
|
||||||
<sect1 id="quickstart-repmgr-user-database">
|
<sect1 id="quickstart-repmgr-user-database">
|
||||||
@@ -224,17 +234,45 @@
|
|||||||
<para>
|
<para>
|
||||||
<filename>repmgr.conf</filename> should not be stored inside the PostgreSQL data directory,
|
<filename>repmgr.conf</filename> should not be stored inside the PostgreSQL data directory,
|
||||||
as it could be overwritten when setting up or reinitialising the PostgreSQL
|
as it could be overwritten when setting up or reinitialising the PostgreSQL
|
||||||
server. See sections on <xref linkend="configuration-file"> and <xref linkend="configuration-file-settings">
|
server. See sections <xref linkend="configuration"> and <xref linkend="configuration-file">
|
||||||
for further details about <filename>repmgr.conf</filename>.
|
for further details about <filename>repmgr.conf</filename>.
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
&repmgr; only uses <option>pg_bindir</option> when it executes
|
||||||
|
PostgreSQL binaries directly.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
For user-defined scripts such as <option>promote_command</option> and the
|
||||||
|
various <option>service_*_command</option>s, you <emphasis>must</emphasis>
|
||||||
|
always explicitly provide the full path to the binary or script being
|
||||||
|
executed, even if it is &repmgr; itself.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
This is because these options can contain user-defined scripts in arbitrary
|
||||||
|
locations, so prepending <option>pg_bindir</option> may break them.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
<tip>
|
<tip>
|
||||||
<simpara>
|
<simpara>
|
||||||
For Debian-based distributions we recommend explictly setting
|
For Debian-based distributions we recommend explictly setting
|
||||||
<literal>pg_bindir</literal> to the directory where <command>pg_ctl</command> and other binaries
|
<option>pg_bindir</option> to the directory where <command>pg_ctl</command> and other binaries
|
||||||
not in the standard path are located. For PostgreSQL 9.6 this would be <filename>/usr/lib/postgresql/9.6/bin/</filename>.
|
not in the standard path are located. For PostgreSQL 9.6 this would be <filename>/usr/lib/postgresql/9.6/bin/</filename>.
|
||||||
</simpara>
|
</simpara>
|
||||||
</tip>
|
</tip>
|
||||||
|
|
||||||
|
<tip>
|
||||||
|
<simpara>
|
||||||
|
If your distribution places the &repmgr; binaries in a location other than the
|
||||||
|
PostgreSQL installation directory, specify this with <option>repmgr_bindir</option>
|
||||||
|
to enable &repmgr; to perform operations (e.g.
|
||||||
|
<command><link linkend="repmgr-cluster-crosscheck">repmgr cluster crosscheck</link></command>)
|
||||||
|
on other nodes.
|
||||||
|
</simpara>
|
||||||
|
</tip>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
See the file
|
See the file
|
||||||
<ulink url="https://raw.githubusercontent.com/2ndQuadrant/repmgr/master/repmgr.conf.sample">repmgr.conf.sample</>
|
<ulink url="https://raw.githubusercontent.com/2ndQuadrant/repmgr/master/repmgr.conf.sample">repmgr.conf.sample</>
|
||||||
@@ -286,7 +324,7 @@
|
|||||||
slot_name |
|
slot_name |
|
||||||
config_file | /etc/repmgr.conf</programlisting>
|
config_file | /etc/repmgr.conf</programlisting>
|
||||||
<para>
|
<para>
|
||||||
Each server in the replication cluster will have its own record. If <command>repmgrd</command>
|
Each server in the replication cluster will have its own record. If <application>repmgrd</application>
|
||||||
is in use, the fields <literal>upstream_node_id</literal>, <literal>active</literal> and
|
is in use, the fields <literal>upstream_node_id</literal>, <literal>active</literal> and
|
||||||
<literal>type</literal> will be updated when the node's status or role changes.
|
<literal>type</literal> will be updated when the node's status or role changes.
|
||||||
</para>
|
</para>
|
||||||
@@ -301,11 +339,10 @@
|
|||||||
(and possibly <literal>data_directory</literal>) adjusted accordingly, e.g.:
|
(and possibly <literal>data_directory</literal>) adjusted accordingly, e.g.:
|
||||||
</para>
|
</para>
|
||||||
<programlisting>
|
<programlisting>
|
||||||
node=2
|
node_id=2
|
||||||
node_name=node2
|
node_name=node2
|
||||||
conninfo='host=node2 user=repmgr dbname=repmgr connect_timeout=2'
|
conninfo='host=node2 user=repmgr dbname=repmgr connect_timeout=2'
|
||||||
data_directory='/var/lib/postgresql/data'
|
data_directory='/var/lib/postgresql/data'</programlisting>
|
||||||
</programlisting>
|
|
||||||
<para>
|
<para>
|
||||||
Use the <command>--dry-run</command> option to check the standby can be cloned:
|
Use the <command>--dry-run</command> option to check the standby can be cloned:
|
||||||
</para>
|
</para>
|
||||||
|
|||||||
@@ -1,23 +1,77 @@
|
|||||||
<chapter id="repmgr-cluster-cleanup" xreflabel="repmgr cluster cleanup">
|
<refentry id="repmgr-cluster-cleanup">
|
||||||
<indexterm>
|
<indexterm>
|
||||||
<primary>repmgr cluster cleanup</primary>
|
<primary>repmgr cluster cleanup</primary>
|
||||||
</indexterm>
|
</indexterm>
|
||||||
<title>repmgr cluster cleanup</title>
|
<refmeta>
|
||||||
<para>
|
<refentrytitle>repmgr cluster cleanup</refentrytitle>
|
||||||
Purges monitoring history from the <literal>repmgr.monitoring_history</literal> table to
|
</refmeta>
|
||||||
prevent excessive table growth. Use the <literal>-k/--keep-history</literal> to specify the
|
|
||||||
number of days of monitoring history to retain. This command can be used
|
<refnamediv>
|
||||||
manually or as a cronjob.
|
<refname>repmgr cluster cleanup</refname>
|
||||||
</para>
|
<refpurpose>purge monitoring history</refpurpose>
|
||||||
<para>
|
</refnamediv>
|
||||||
This command requires a valid <filename>repmgr.conf</filename> file for the node on which it is
|
|
||||||
executed; no additional arguments are required.
|
<refsect1>
|
||||||
</para>
|
<title>Description</title>
|
||||||
<note>
|
<para>
|
||||||
<simpara>
|
Purges monitoring history from the <literal>repmgr.monitoring_history</literal> table to
|
||||||
Monitoring history will only be written if <command>repmgrd</command> is active, and
|
prevent excessive table growth.
|
||||||
<varname>monitoring_history</varname> is set to <literal>true</literal> in
|
</para>
|
||||||
<filename>repmgr.conf</filename>.
|
<para>
|
||||||
</simpara>
|
By default <emphasis>all</emphasis> data will be removed; Use the <option>-k/--keep-history</option>
|
||||||
</note>
|
option to specify the number of days of monitoring history to retain.
|
||||||
</chapter>
|
</para>
|
||||||
|
<para>
|
||||||
|
This command can be executed manually or as a cronjob.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Usage</title>
|
||||||
|
<para>
|
||||||
|
This command requires a valid <filename>repmgr.conf</filename> file for the node on which it is
|
||||||
|
executed; no additional arguments are required.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Notes</title>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
Monitoring history will only be written if <application>repmgrd</application> is active, and
|
||||||
|
<varname>monitoring_history</varname> is set to <literal>true</literal> in
|
||||||
|
<filename>repmgr.conf</filename>.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1 id="repmgr-cluster-cleanup-events">
|
||||||
|
<title>Event notifications</title>
|
||||||
|
<para>
|
||||||
|
A <literal>cluster_cleanup</literal> <link linkend="event-notifications">event notification</link> will be generated.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Options</title>
|
||||||
|
<variablelist>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--node-id</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Only delete monitoring records for the specified node.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
</variablelist>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>See also</title>
|
||||||
|
<para>
|
||||||
|
For more details see the sections <xref linkend="repmgrd-monitoring"> and
|
||||||
|
<xref linkend="repmgrd-monitoring-configuration">.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
</refentry>
|
||||||
|
|||||||
@@ -1,15 +1,27 @@
|
|||||||
<chapter id="repmgr-cluster-crosscheck" xreflabel="repmgr cluster crosscheck">
|
<refentry id="repmgr-cluster-crosscheck">
|
||||||
<indexterm>
|
<indexterm>
|
||||||
<primary>repmgr cluster crosscheck</primary>
|
<primary>repmgr cluster crosscheck</primary>
|
||||||
</indexterm>
|
</indexterm>
|
||||||
<title>repmgr cluster crosscheck</title>
|
|
||||||
<para>
|
|
||||||
<command>repmgr cluster crosscheck</command> is similar to <xref linkend="repmgr-cluster-matrix">,
|
<refmeta>
|
||||||
but cross-checks connections between each combination of nodes. In "Example 3" in
|
<refentrytitle>repmgr cluster crosscheck</refentrytitle>
|
||||||
<xref linkend="repmgr-cluster-matrix"> we have no information about the state of <literal>node3</literal>.
|
</refmeta>
|
||||||
However by running <command>repmgr cluster crosscheck</command> it's possible to get a better
|
|
||||||
overview of the cluster situation:
|
<refnamediv>
|
||||||
<programlisting>
|
<refname>repmgr cluster crosscheck</refname>
|
||||||
|
<refpurpose>cross-checks connections between each combination of nodes</refpurpose>
|
||||||
|
</refnamediv>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Description</title>
|
||||||
|
<para>
|
||||||
|
<command>repmgr cluster crosscheck</command> is similar to <xref linkend="repmgr-cluster-matrix">,
|
||||||
|
but cross-checks connections between each combination of nodes. In "Example 3" in
|
||||||
|
<xref linkend="repmgr-cluster-matrix"> we have no information about the state of <literal>node3</literal>.
|
||||||
|
However by running <command>repmgr cluster crosscheck</command> it's possible to get a better
|
||||||
|
overview of the cluster situation:
|
||||||
|
<programlisting>
|
||||||
$ repmgr -f /etc/repmgr.conf cluster crosscheck
|
$ repmgr -f /etc/repmgr.conf cluster crosscheck
|
||||||
|
|
||||||
Name | Id | 1 | 2 | 3
|
Name | Id | 1 | 2 | 3
|
||||||
@@ -17,12 +29,68 @@
|
|||||||
node1 | 1 | * | * | x
|
node1 | 1 | * | * | x
|
||||||
node2 | 2 | * | * | *
|
node2 | 2 | * | * | *
|
||||||
node3 | 3 | * | * | *</programlisting>
|
node3 | 3 | * | * | *</programlisting>
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
What happened is that <command>repmgr cluster crosscheck</command> merged its own
|
What happened is that <command>repmgr cluster crosscheck</command> merged its own
|
||||||
<command>repmgr cluster matrix</command> with the <command>repmgr cluster matrix</command>
|
<command><link linkend="repmgr-cluster-matrix">repmgr cluster matrix</link></command> with the
|
||||||
output from <literal>node2</literal>; the latter is able to connect to <literal>node3</literal>
|
<command>repmgr cluster matrix</command> output from <literal>node2</literal>; the latter is
|
||||||
and therefore determine the state of outbound connections from that node.
|
able to connect to <literal>node3</literal>
|
||||||
</para>
|
and therefore determine the state of outbound connections from that node.
|
||||||
</chapter>
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Exit codes</title>
|
||||||
|
<para>
|
||||||
|
Following exit codes can be emitted by <command>repmgr cluster crosscheck</command>:
|
||||||
|
</para>
|
||||||
|
<variablelist>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>SUCCESS (0)</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
The check completed successfully and all nodes are reachable.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>ERR_BAD_SSH (12)</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
One or more nodes could not be accessed via SSH.
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<simpara>
|
||||||
|
This only applies to nodes unreachable from the node where
|
||||||
|
this command is executed.
|
||||||
|
</simpara>
|
||||||
|
<simpara>
|
||||||
|
It's also possible that the crosscheck establishes that
|
||||||
|
connections between PostgreSQL on all nodes are functioning,
|
||||||
|
even if SSH access between some nodes is not possible.
|
||||||
|
</simpara>
|
||||||
|
</note>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>ERR_NODE_STATUS (25)</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
PostgreSQL on one or more nodes could not be reached.
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<simpara>
|
||||||
|
This error code overrides <option>ERR_BAD_SSH</option>.
|
||||||
|
</simpara>
|
||||||
|
</note>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
</variablelist>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
</refentry>
|
||||||
|
|
||||||
|
|||||||
@@ -1,37 +1,79 @@
|
|||||||
<chapter id="repmgr-cluster-event" xreflabel="repmgr cluster event">
|
<refentry id="repmgr-cluster-event">
|
||||||
<indexterm>
|
<indexterm>
|
||||||
<primary>repmgr cluster event</primary>
|
<primary>repmgr cluster event</primary>
|
||||||
</indexterm>
|
</indexterm>
|
||||||
<title>repmgr cluster event</title>
|
|
||||||
<para>
|
<refmeta>
|
||||||
This outputs a formatted list of cluster events, as stored in the
|
<refentrytitle>repmgr cluster event</refentrytitle>
|
||||||
<literal>repmgr.events</literal> table. Output is in reverse chronological order, and
|
</refmeta>
|
||||||
can be filtered with the following options:
|
|
||||||
<itemizedlist spacing="compact" mark="bullet">
|
<refnamediv>
|
||||||
<listitem>
|
<refname>repmgr cluster event</refname>
|
||||||
<simpara><literal>--all</literal>: outputs all entries</simpara>
|
<refpurpose>output a formatted list of cluster events</refpurpose>
|
||||||
</listitem>
|
</refnamediv>
|
||||||
<listitem>
|
|
||||||
<simpara><literal>--limit</literal>: set the maximum number of entries to output (default: 20)</simpara>
|
<refsect1>
|
||||||
</listitem>
|
<title>Description</title>
|
||||||
<listitem>
|
|
||||||
<simpara><literal>--node-id</literal>: restrict entries to node with this ID</simpara>
|
<para>
|
||||||
</listitem>
|
Outputs a formatted list of cluster events, as stored in the <literal>repmgr.events</literal> table.
|
||||||
<listitem>
|
</para>
|
||||||
<simpara><literal>--node-name</literal>: restrict entries to node with this name</simpara>
|
</refsect1>
|
||||||
</listitem>
|
|
||||||
<listitem>
|
<refsect1>
|
||||||
<simpara><literal>--event</literal>: filter specific event</simpara>
|
<title>Usage</title>
|
||||||
</listitem>
|
|
||||||
</itemizedlist>
|
<para>
|
||||||
</para>
|
Output is in reverse chronological order, and
|
||||||
<para>
|
can be filtered with the following options:
|
||||||
Example:
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
<programlisting>
|
<listitem>
|
||||||
|
<simpara><literal>--all</literal>: outputs all entries</simpara>
|
||||||
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal>--limit</literal>: set the maximum number of entries to output (default: 20)</simpara>
|
||||||
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal>--node-id</literal>: restrict entries to node with this ID</simpara>
|
||||||
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal>--node-name</literal>: restrict entries to node with this name</simpara>
|
||||||
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal>--event</literal>: filter specific event (see <xref linkend="event-notifications"> for a full list)</simpara>
|
||||||
|
</listitem>
|
||||||
|
</itemizedlist>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
The "Details" column can be omitted by providing <literal>--terse</literal>.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Output format</title>
|
||||||
|
<para>
|
||||||
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<literal>--csv</literal>: generate output in CSV format. Note that the <literal>Details</literal>
|
||||||
|
column will currently not be emitted in CSV format.
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
</itemizedlist>
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Example</title>
|
||||||
|
<para>
|
||||||
|
<programlisting>
|
||||||
$ repmgr -f /etc/repmgr.conf cluster event --event=standby_register
|
$ repmgr -f /etc/repmgr.conf cluster event --event=standby_register
|
||||||
Node ID | Name | Event | OK | Timestamp | Details
|
Node ID | Name | Event | OK | Timestamp | Details
|
||||||
---------+-------+------------------+----+---------------------+--------------------------------
|
---------+-------+------------------+----+---------------------+--------------------------------
|
||||||
3 | node3 | standby_register | t | 2017-08-17 10:28:55 | standby registration succeeded
|
3 | node3 | standby_register | t | 2017-08-17 10:28:55 | standby registration succeeded
|
||||||
2 | node2 | standby_register | t | 2017-08-17 10:28:53 | standby registration succeeded</programlisting>
|
2 | node2 | standby_register | t | 2017-08-17 10:28:53 | standby registration succeeded</programlisting>
|
||||||
</para>
|
</para>
|
||||||
</chapter>
|
</refsect1>
|
||||||
|
</refentry>
|
||||||
|
|||||||
@@ -1,27 +1,44 @@
|
|||||||
<chapter id="repmgr-cluster-matrix" xreflabel="repmgr cluster matrix">
|
<refentry id="repmgr-cluster-matrix">
|
||||||
<indexterm>
|
<indexterm>
|
||||||
<primary>repmgr cluster matrix</primary>
|
<primary>repmgr cluster matrix</primary>
|
||||||
</indexterm>
|
</indexterm>
|
||||||
<title>repmgr cluster matrix</title>
|
|
||||||
<para>
|
<refmeta>
|
||||||
<command>repmgr cluster matrix</command> runs <command>repmgr cluster show</command> on each
|
<refentrytitle>repmgr cluster matrix</refentrytitle>
|
||||||
node and arranges the results in a matrix, recording success or failure.
|
</refmeta>
|
||||||
</para>
|
|
||||||
<para>
|
<refnamediv>
|
||||||
<command>repmgr cluster matrix</command> requires a valid <filename>repmgr.conf</filename>
|
<refname>repmgr cluster matrix</refname>
|
||||||
file on each node. Additionally passwordless `ssh` connections are required between
|
<refpurpose>
|
||||||
all nodes.
|
runs repmgr cluster show on each node and summarizes output
|
||||||
</para>
|
</refpurpose>
|
||||||
<para>
|
</refnamediv>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Description</title>
|
||||||
|
<para>
|
||||||
|
<command>repmgr cluster matrix</command> runs <command><link linkend="repmgr-cluster-show">repmgr cluster show</link></command> on each
|
||||||
|
node and arranges the results in a matrix, recording success or failure.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
<command>repmgr cluster matrix</command> requires a valid <filename>repmgr.conf</filename>
|
||||||
|
file on each node. Additionally, passwordless <command>ssh</command> connections are required between
|
||||||
|
all nodes.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Example</title>
|
||||||
|
<para>
|
||||||
Example 1 (all nodes up):
|
Example 1 (all nodes up):
|
||||||
<programlisting>
|
<programlisting>
|
||||||
$ repmgr -f /etc/repmgr.conf cluster matrix
|
$ repmgr -f /etc/repmgr.conf cluster matrix
|
||||||
|
|
||||||
Name | Id | 1 | 2 | 3
|
Name | Id | 1 | 2 | 3
|
||||||
-------+----+----+----+----
|
-------+----+----+----+----
|
||||||
node1 | 1 | * | * | *
|
node1 | 1 | * | * | *
|
||||||
node2 | 2 | * | * | *
|
node2 | 2 | * | * | *
|
||||||
node3 | 3 | * | * | *</programlisting>
|
node3 | 3 | * | * | *</programlisting>
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
Example 2 (<literal>node1</literal> and <literal>node2</literal> up, <literal>node3</literal> down):
|
Example 2 (<literal>node1</literal> and <literal>node2</literal> up, <literal>node3</literal> down):
|
||||||
@@ -46,7 +63,7 @@
|
|||||||
<para>
|
<para>
|
||||||
The other two nodes are up; the corresponding rows have <literal>x</literal> in the
|
The other two nodes are up; the corresponding rows have <literal>x</literal> in the
|
||||||
column corresponding to <literal>node3</literal>, meaning that inbound connections to
|
column corresponding to <literal>node3</literal>, meaning that inbound connections to
|
||||||
that node have failed, and `*` in the columns corresponding to
|
that node have failed, and <literal>*</literal> in the columns corresponding to
|
||||||
<literal>node1</literal> and <literal>node2</literal>, meaning that inbound connections
|
<literal>node1</literal> and <literal>node2</literal>, meaning that inbound connections
|
||||||
to these nodes have succeeded.
|
to these nodes have succeeded.
|
||||||
</para>
|
</para>
|
||||||
@@ -79,5 +96,50 @@
|
|||||||
In this case, the <xref linkend="repmgr-cluster-crosscheck"> command will produce a more
|
In this case, the <xref linkend="repmgr-cluster-crosscheck"> command will produce a more
|
||||||
useful result.
|
useful result.
|
||||||
</para>
|
</para>
|
||||||
</chapter>
|
</refsect1>
|
||||||
|
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Exit codes</title>
|
||||||
|
<para>
|
||||||
|
Following exit codes can be emitted by <command>repmgr cluster matrix</command>:
|
||||||
|
</para>
|
||||||
|
<variablelist>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>SUCCESS (0)</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
The check completed successfully and all nodes are reachable.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>ERR_BAD_SSH (12)</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
One or more nodes could not be accessed via SSH.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>ERR_NODE_STATUS (25)</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
PostgreSQL on one or more nodes could not be reached.
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<simpara>
|
||||||
|
This error code overrides <option>ERR_BAD_SSH</option>.
|
||||||
|
</simpara>
|
||||||
|
</note>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
</variablelist>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
</refentry>
|
||||||
|
|
||||||
|
|||||||
@@ -1,22 +1,46 @@
|
|||||||
<chapter id="repmgr-cluster-show" xreflabel="repmgr cluster show">
|
<refentry id="repmgr-cluster-show">
|
||||||
<indexterm>
|
<indexterm>
|
||||||
<primary>repmgr cluster show</primary>
|
<primary>repmgr cluster show</primary>
|
||||||
</indexterm>
|
</indexterm>
|
||||||
<title>repmgr cluster show</title>
|
|
||||||
<para>
|
|
||||||
Displays information about each active node in the replication cluster. This
|
|
||||||
command polls each registered server and shows its role (<literal>primary</literal> /
|
|
||||||
<literal>standby</literal> / <literal>bdr</literal>) and status. It polls each server
|
|
||||||
directly and can be run on any node in the cluster; this is also useful when analyzing
|
|
||||||
connectivity from a particular node.
|
|
||||||
</para>
|
|
||||||
<para>
|
|
||||||
This command requires either a valid <filename>repmgr.conf</filename> file or a database
|
|
||||||
connection string to one of the registered nodes; no additional arguments are needed.
|
|
||||||
</para>
|
|
||||||
|
|
||||||
<para>
|
<refmeta>
|
||||||
Example:
|
<refentrytitle>repmgr cluster show</refentrytitle>
|
||||||
|
</refmeta>
|
||||||
|
|
||||||
|
<refnamediv>
|
||||||
|
<refname>repmgr cluster show</refname>
|
||||||
|
<refpurpose>display information about each registered node in the replication cluster</refpurpose>
|
||||||
|
</refnamediv>
|
||||||
|
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Description</title>
|
||||||
|
<para>
|
||||||
|
Displays information about each registered node in the replication cluster. This
|
||||||
|
command polls each registered server and shows its role (<literal>primary</literal> /
|
||||||
|
<literal>standby</literal> / <literal>bdr</literal>) and status. It polls each server
|
||||||
|
directly and can be run on any node in the cluster; this is also useful when analyzing
|
||||||
|
connectivity from a particular node.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Execution</title>
|
||||||
|
<para>
|
||||||
|
This command requires either a valid <filename>repmgr.conf</filename> file or a database
|
||||||
|
connection string to one of the registered nodes; no additional arguments are needed.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
To show database connection errors when polling nodes, run the command in
|
||||||
|
<literal>--verbose</literal> mode.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Example</title>
|
||||||
|
<para>
|
||||||
<programlisting>
|
<programlisting>
|
||||||
$ repmgr -f /etc/repmgr.conf cluster show
|
$ repmgr -f /etc/repmgr.conf cluster show
|
||||||
|
|
||||||
@@ -26,42 +50,123 @@
|
|||||||
2 | node2 | standby | running | node1 | default | host=db_node2 dbname=repmgr user=repmgr
|
2 | node2 | standby | running | node1 | default | host=db_node2 dbname=repmgr user=repmgr
|
||||||
3 | node3 | standby | running | node1 | default | host=db_node3 dbname=repmgr user=repmgr</programlisting>
|
3 | node3 | standby | running | node1 | default | host=db_node3 dbname=repmgr user=repmgr</programlisting>
|
||||||
</para>
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
<refsect1>
|
||||||
|
<title>Notes</title>
|
||||||
|
<para>
|
||||||
|
The column <literal>Role</literal> shows the expected server role according to the
|
||||||
|
&repmgr; metadata. <literal>Status</literal> shows whether the server is running or unreachable.
|
||||||
|
If the node has an unexpected role not reflected in the &repmgr; metadata, e.g. a node was manually
|
||||||
|
promoted to primary, this will be highlighted with an exclamation mark, e.g.:
|
||||||
|
<programlisting>
|
||||||
|
$ repmgr -f /etc/repmgr.conf cluster show
|
||||||
|
|
||||||
<para>
|
ID | Name | Role | Status | Upstream | Location | Connection string
|
||||||
To show database connection errors when polling nodes, run the command in
|
----+-------+---------+----------------------+----------+----------+-----------------------------------------
|
||||||
<literal>--verbose</literal> mode.
|
1 | node1 | primary | ? unreachable | | default | host=db_node1 dbname=repmgr user=repmgr
|
||||||
</para>
|
2 | node2 | standby | ! running as primary | node1 | default | host=db_node2 dbname=repmgr user=repmgr
|
||||||
<para>
|
3 | node3 | standby | running | node1 | default | host=db_node3 dbname=repmgr user=repmgr
|
||||||
The `cluster show` command accepts an optional parameter <literal>--csv</literal>, which
|
|
||||||
outputs the replication cluster's status in a simple CSV format, suitable for
|
WARNING: following issues were detected
|
||||||
parsing by scripts:
|
node "node1" (ID: 1) is registered as an active primary but is unreachable
|
||||||
<programlisting>
|
node "node2" (ID: 2) is registered as standby but running as primary</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Node availability is tested by connecting from the node where
|
||||||
|
<command>repmgr cluster show</command> is executed, and does not necessarily imply the node
|
||||||
|
is down. See <xref linkend="repmgr-cluster-matrix"> and <xref linkend="repmgr-cluster-crosscheck"> to get
|
||||||
|
a better overviews of connections between nodes.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Options</title>
|
||||||
|
|
||||||
|
<variablelist>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--csv</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
<command>repmgr cluster show</command> accepts an optional parameter <literal>--csv</literal>, which
|
||||||
|
outputs the replication cluster's status in a simple CSV format, suitable for
|
||||||
|
parsing by scripts, e.g.:
|
||||||
|
<programlisting>
|
||||||
$ repmgr -f /etc/repmgr.conf cluster show --csv
|
$ repmgr -f /etc/repmgr.conf cluster show --csv
|
||||||
1,-1,-1
|
1,-1,-1
|
||||||
2,0,0
|
2,0,0
|
||||||
3,0,1</programlisting>
|
3,0,1</programlisting>
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
The columns have following meanings:
|
The columns have following meanings:
|
||||||
<itemizedlist spacing="compact" mark="bullet">
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara>
|
<simpara>
|
||||||
node ID
|
node ID
|
||||||
</simpara>
|
</simpara>
|
||||||
<simpara>
|
</listitem>
|
||||||
availability (0 = available, -1 = unavailable)
|
<listitem>
|
||||||
</simpara>
|
<simpara>
|
||||||
<simpara>
|
availability (0 = available, -1 = unavailable)
|
||||||
recovery state (0 = not in recovery, 1 = in recovery, -1 = unknown)
|
</simpara>
|
||||||
</simpara>
|
</listitem>
|
||||||
</listitem>
|
<listitem>
|
||||||
</itemizedlist>
|
<simpara>
|
||||||
</para>
|
recovery state (0 = not in recovery, 1 = in recovery, -1 = unknown)
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
</itemizedlist>
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
<para>
|
<varlistentry>
|
||||||
Note that the availability is tested by connecting from the node where
|
<term><option>--verbose</option></term>
|
||||||
<command>repmgr cluster show</command> is executed, and does not necessarily imply the node
|
<listitem>
|
||||||
is down. See <xref linkend="repmgr-cluster-matrix"> and <xref linkend="repmgr-cluster-crosscheck"> to get
|
<para>
|
||||||
a better overviews of connections between nodes.
|
Display the full text of any database connection error messages
|
||||||
</para>
|
</para>
|
||||||
</chapter>
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
</variablelist>
|
||||||
|
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Exit codes</title>
|
||||||
|
<para>
|
||||||
|
Following exit codes can be emitted by <command>repmgr cluster show</command>:
|
||||||
|
</para>
|
||||||
|
<variablelist>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>SUCCESS (0)</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
No issues were detected.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>ERR_NODE_STATUS (25)</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
One or more issues were detected.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
</variablelist>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>See also</title>
|
||||||
|
<para>
|
||||||
|
<xref linkend="repmgr-node-status">, <xref linkend="repmgr-node-check">, <xref linkend="repmgr-daemon-status">
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
</refentry>
|
||||||
|
|||||||
109
doc/repmgr-daemon-pause.sgml
Normal file
109
doc/repmgr-daemon-pause.sgml
Normal file
@@ -0,0 +1,109 @@
|
|||||||
|
<refentry id="repmgr-daemon-pause">
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgr daemon pause</primary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<refmeta>
|
||||||
|
<refentrytitle>repmgr daemon pause</refentrytitle>
|
||||||
|
</refmeta>
|
||||||
|
|
||||||
|
<refnamediv>
|
||||||
|
<refname>repmgr daemon pause</refname>
|
||||||
|
<refpurpose>Instruct all <application>repmgrd</application> instances in the replication cluster to pause failover operations</refpurpose>
|
||||||
|
</refnamediv>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Description</title>
|
||||||
|
<para>
|
||||||
|
This command can be run on any active node in the replication cluster to instruct all
|
||||||
|
running <application>repmgrd</application> instances to "pause" themselves, i.e. take no
|
||||||
|
action (such as promoting themselves or following a new primary) if a failover event is detected.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
This functionality is useful for performing maintenance operations, such as switchovers
|
||||||
|
or upgrades, which might otherwise trigger a failover if <application>repmgrd</application>
|
||||||
|
is running normally.
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
It's important to wait a few seconds after restarting PostgreSQL on any node before running
|
||||||
|
<command>repmgr daemon pause</command>, as the <application>repmgrd</application> instance
|
||||||
|
on the restarted node will take a second or two before it has updated its status.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
<para>
|
||||||
|
<xref linkend="repmgr-daemon-unpause"> will instruct all previously paused <application>repmgrd</application>
|
||||||
|
instances to resume normal failover operation.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Execution</title>
|
||||||
|
<para>
|
||||||
|
<command>repmgr daemon pause</command> can be executed on any active node in the
|
||||||
|
replication cluster. A valid <filename>repmgr.conf</filename> file is required.
|
||||||
|
It will have no effect on previously paused nodes.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Example</title>
|
||||||
|
<para>
|
||||||
|
<programlisting>
|
||||||
|
$ repmgr -f /etc/repmgr.conf daemon pause
|
||||||
|
NOTICE: node 1 (node1) paused
|
||||||
|
NOTICE: node 2 (node2) paused
|
||||||
|
NOTICE: node 3 (node3) paused</programlisting>
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Options</title>
|
||||||
|
<variablelist>
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--dry-run</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Check if nodes are reachable but don't pause <application>repmgrd</application>.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
</variablelist>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Exit codes</title>
|
||||||
|
<para>
|
||||||
|
Following exit codes can be emitted by <command>repmgr daemon unpause</command>:
|
||||||
|
</para>
|
||||||
|
<variablelist>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>SUCCESS (0)</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
<application>repmgrd</application> could be paused on all nodes.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>ERR_REPMGRD_PAUSE (26)</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
<application>repmgrd</application> could not be paused on one or mode nodes.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
</variablelist>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>See also</title>
|
||||||
|
<para>
|
||||||
|
<xref linkend="repmgr-daemon-unpause">, <xref linkend="repmgr-daemon-status">
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
</refentry>
|
||||||
|
|
||||||
165
doc/repmgr-daemon-status.sgml
Normal file
165
doc/repmgr-daemon-status.sgml
Normal file
@@ -0,0 +1,165 @@
|
|||||||
|
<refentry id="repmgr-daemon-status">
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgr daemon status</primary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<refmeta>
|
||||||
|
<refentrytitle>repmgr daemon status</refentrytitle>
|
||||||
|
</refmeta>
|
||||||
|
|
||||||
|
<refnamediv>
|
||||||
|
<refname>repmgr daemon status</refname>
|
||||||
|
<refpurpose>display information about the status of <application>repmgrd</application> on each node in the cluster</refpurpose>
|
||||||
|
</refnamediv>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Description</title>
|
||||||
|
<para>
|
||||||
|
This command provides an overview over all active nodes in the cluster and the state
|
||||||
|
of each node's <application>repmgrd</application> instance. It can be used to check
|
||||||
|
the result of <xref linkend="repmgr-daemon-pause"> and <xref linkend="repmgr-daemon-unpause">
|
||||||
|
operations.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Execution</title>
|
||||||
|
<para>
|
||||||
|
<command>repmgr daemon status</command> can be executed on any active node in the
|
||||||
|
replication cluster. A valid <filename>repmgr.conf</filename> file is required.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
After restarting PostgreSQL on any node, the <application>repmgrd</application> instance
|
||||||
|
will take a second or two before it is able to update its status. Until then,
|
||||||
|
<application>repmgrd</application> will be shown as not running.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Examples</title>
|
||||||
|
<para>
|
||||||
|
<application>repmgrd</application> running normally on all nodes:
|
||||||
|
<programlisting>$ repmgr -f /etc/repmgr.conf daemon status
|
||||||
|
ID | Name | Role | Status | repmgrd | PID | Paused?
|
||||||
|
----+-------+---------+---------+---------+------+---------
|
||||||
|
1 | node1 | primary | running | running | 7851 | no
|
||||||
|
2 | node2 | standby | running | running | 7889 | no
|
||||||
|
3 | node3 | standby | running | running | 7918 | no</programlisting>
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
<application>repmgrd</application> paused on all nodes (using <xref linkend="repmgr-daemon-pause">):
|
||||||
|
<programlisting>$ repmgr -f /etc/repmgr.conf daemon status
|
||||||
|
ID | Name | Role | Status | repmgrd | PID | Paused?
|
||||||
|
----+-------+---------+---------+---------+------+---------
|
||||||
|
1 | node1 | primary | running | running | 7851 | yes
|
||||||
|
2 | node2 | standby | running | running | 7889 | yes
|
||||||
|
3 | node3 | standby | running | running | 7918 | yes</programlisting>
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
<application>repmgrd</application> not running on one node:
|
||||||
|
<programlisting>$ repmgr -f /etc/repmgr.conf daemon status
|
||||||
|
ID | Name | Role | Status | repmgrd | PID | Paused?
|
||||||
|
----+-------+---------+---------+-------------+------+---------
|
||||||
|
1 | node1 | primary | running | running | 7851 | yes
|
||||||
|
2 | node2 | standby | running | not running | n/a | n/a
|
||||||
|
3 | node3 | standby | running | running | 7918 | yes</programlisting>
|
||||||
|
</para>
|
||||||
|
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Options</title>
|
||||||
|
|
||||||
|
<variablelist>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--csv</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
<command>repmgr daemon status</command> accepts an optional parameter <literal>--csv</literal>, which
|
||||||
|
outputs the replication cluster's status in a simple CSV format, suitable for
|
||||||
|
parsing by scripts, e.g.:
|
||||||
|
<programlisting>
|
||||||
|
$ repmgr -f /etc/repmgr.conf daemon status --csv
|
||||||
|
1,node1,primary,1,1,10204,1
|
||||||
|
2,node2,standby,1,0,-1,1
|
||||||
|
3,node3,standby,1,1,10225,1</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
The columns have following meanings:
|
||||||
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
node ID
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
node name
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
node type (primary or standby)
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
PostgreSQL server running
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<application>repmgrd</application> running (1 = running, 0 = not running)
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<application>repmgrd</application> PID (-1 if not running)
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<application>repmgrd</application> paused (1 = paused, 0 = not paused)
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
</itemizedlist>
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--verbose</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Display the full text of any database connection error messages
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
</variablelist>
|
||||||
|
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>See also</title>
|
||||||
|
<para>
|
||||||
|
<xref linkend="repmgr-daemon-pause">, <xref linkend="repmgr-daemon-unpause">, <xref linkend="repmgr-cluster-show">
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
</refentry>
|
||||||
103
doc/repmgr-daemon-unpause.sgml
Normal file
103
doc/repmgr-daemon-unpause.sgml
Normal file
@@ -0,0 +1,103 @@
|
|||||||
|
<refentry id="repmgr-daemon-unpause">
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgr daemon unpause</primary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<refmeta>
|
||||||
|
<refentrytitle>repmgr daemon unpause</refentrytitle>
|
||||||
|
</refmeta>
|
||||||
|
|
||||||
|
<refnamediv>
|
||||||
|
<refname>repmgr daemon unpause</refname>
|
||||||
|
<refpurpose>Instruct all <application>repmgrd</application> instances in the replication cluster to resume failover operations</refpurpose>
|
||||||
|
</refnamediv>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Description</title>
|
||||||
|
<para>
|
||||||
|
This command can be run on any active node in the replication cluster to instruct all
|
||||||
|
running <application>repmgrd</application> instances to "unpause"
|
||||||
|
(following a previous execution of <xref linkend="repmgr-daemon-pause">)
|
||||||
|
and resume normal failover/monitoring operation.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
It's important to wait a few seconds after restarting PostgreSQL on any node before running
|
||||||
|
<command>repmgr daemon pause</command>, as the <application>repmgrd</application> instance
|
||||||
|
on the restarted node will take a second or two before it has updated its status.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Execution</title>
|
||||||
|
<para>
|
||||||
|
<command>repmgr daemon unpause</command> can be executed on any active node in the
|
||||||
|
replication cluster. A valid <filename>repmgr.conf</filename> file is required.
|
||||||
|
It will have no effect on nodes which are not already paused.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Example</title>
|
||||||
|
<para>
|
||||||
|
<programlisting>
|
||||||
|
$ repmgr -f /etc/repmgr.conf daemon unpause
|
||||||
|
NOTICE: node 1 (node1) unpaused
|
||||||
|
NOTICE: node 2 (node2) unpaused
|
||||||
|
NOTICE: node 3 (node3) unpaused</programlisting>
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Options</title>
|
||||||
|
<variablelist>
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--dry-run</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Check if nodes are reachable but don't unpause <application>repmgrd</application>.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
</variablelist>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Exit codes</title>
|
||||||
|
<para>
|
||||||
|
Following exit codes can be emitted by <command>repmgr daemon unpause</command>:
|
||||||
|
</para>
|
||||||
|
<variablelist>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>SUCCESS (0)</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
<application>repmgrd</application> could be unpaused on all nodes.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>ERR_REPMGRD_PAUSE (26)</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
<application>repmgrd</application> could not be unpaused on one or mode nodes.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
</variablelist>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>See also</title>
|
||||||
|
<para>
|
||||||
|
<xref linkend="repmgr-daemon-pause">, <xref linkend="repmgr-daemon-status">
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
</refentry>
|
||||||
|
|
||||||
@@ -1,32 +1,49 @@
|
|||||||
<chapter id="repmgr-node-check" xreflabel="repmgr node check">
|
<refentry id="repmgr-node-check">
|
||||||
<indexterm>
|
<indexterm>
|
||||||
<primary>repmgr node check</primary>
|
<primary>repmgr node check</primary>
|
||||||
</indexterm>
|
</indexterm>
|
||||||
<title>repmgr node check</title>
|
|
||||||
<para>
|
<refmeta>
|
||||||
Performs some health checks on a node from a replication perspective.
|
<refentrytitle>repmgr node check</refentrytitle>
|
||||||
This command must be run on the local node.
|
</refmeta>
|
||||||
</para>
|
|
||||||
<para>
|
<refnamediv>
|
||||||
Sample output (execute <command>repmgr node check</command>):
|
<refname>repmgr node check</refname>
|
||||||
<programlisting>
|
<refpurpose>performs some health checks on a node from a replication perspective</refpurpose>
|
||||||
|
</refnamediv>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Description</title>
|
||||||
|
<para>
|
||||||
|
Performs some health checks on a node from a replication perspective.
|
||||||
|
This command must be run on the local node.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Example</title>
|
||||||
|
<para>
|
||||||
|
<programlisting>
|
||||||
|
$ repmgr -f /etc/repmgr.conf node check
|
||||||
Node "node1":
|
Node "node1":
|
||||||
Server role: OK (node is primary)
|
Server role: OK (node is primary)
|
||||||
Replication lag: OK (N/A - node is primary)
|
Replication lag: OK (N/A - node is primary)
|
||||||
WAL archiving: OK (0 pending files)
|
WAL archiving: OK (0 pending files)
|
||||||
Downstream servers: OK (2 of 2 downstream nodes attached)
|
Downstream servers: OK (2 of 2 downstream nodes attached)
|
||||||
Replication slots: OK (node has no replication slots)
|
Replication slots: OK (node has no replication slots)
|
||||||
</programlisting>
|
Missing replication slots: OK (node has no missing replication slots)</programlisting>
|
||||||
</para>
|
</para>
|
||||||
<para>
|
</refsect1>
|
||||||
Additionally each check can be performed individually by supplying
|
<refsect1>
|
||||||
an additional command line parameter, e.g.:
|
<title>Individual checks</title>
|
||||||
<programlisting>
|
<para>
|
||||||
$ repmgr node check --role
|
Each check can be performed individually by supplying
|
||||||
OK (node is primary)
|
an additional command line parameter, e.g.:
|
||||||
</programlisting>
|
<programlisting>
|
||||||
</para>
|
$ repmgr node check --role
|
||||||
<para>
|
OK (node is primary)</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
Parameters for individual checks are as follows:
|
Parameters for individual checks are as follows:
|
||||||
<itemizedlist spacing="compact" mark="bullet">
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
|
|
||||||
@@ -45,7 +62,9 @@
|
|||||||
|
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara>
|
<simpara>
|
||||||
<literal>--archive-ready</literal>: checks for WAL files which have not yet been archived
|
<literal>--archive-ready</literal>: checks for WAL files which have not yet been archived,
|
||||||
|
and returns <literal>WARNING</literal> or <literal>CRITICAL</literal> if the number
|
||||||
|
exceeds <varname>archive_ready_warning</varname> or <varname>archive_ready_critical</varname> respectively.
|
||||||
</simpara>
|
</simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
|
|
||||||
@@ -61,10 +80,110 @@
|
|||||||
</simpara>
|
</simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<literal>--missing-slots</literal>: checks there are no missing replication slots
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
</itemizedlist>
|
</itemizedlist>
|
||||||
</para>
|
</para>
|
||||||
<para>
|
</refsect1>
|
||||||
Individual checks can also be output in a Nagios-compatible format by additionally
|
|
||||||
providing the option <literal>--nagios</literal>.
|
<refsect1>
|
||||||
</para>
|
<title>Output format</title>
|
||||||
</chapter>
|
<para>
|
||||||
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<literal>--csv</literal>: generate output in CSV format (not available
|
||||||
|
for individual checks)
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<literal>--nagios</literal>: generate output in a Nagios-compatible format
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
</itemizedlist>
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Exit codes</title>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
When executing <command>repmgr node check</command> with one of the individual
|
||||||
|
checks listed above, &repmgr; will emit one of the following Nagios-style exit codes
|
||||||
|
(even if <literal>--nagios</literal> is not supplied):
|
||||||
|
|
||||||
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<literal>0</literal>: OK
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<literal>1</literal>: WARNING
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<literal>2</literal>: ERROR
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<literal>3</literal>: UNKNOWN
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
</itemizedlist>
|
||||||
|
</para>
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
<para>
|
||||||
|
Following exit codes can be emitted by <command>repmgr status check</command>
|
||||||
|
if no individual check was specified.
|
||||||
|
</para>
|
||||||
|
<variablelist>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>SUCCESS (0)</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
No issues were detected.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>ERR_NODE_STATUS (25)</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
One or more issues were detected.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
</variablelist>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>See also</title>
|
||||||
|
<para>
|
||||||
|
<xref linkend="repmgr-node-status">, <xref linkend="repmgr-cluster-show">
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
</refentry>
|
||||||
|
|||||||
@@ -1,13 +1,264 @@
|
|||||||
<chapter id="repmgr-node-rejoin" xreflabel="repmgr node rejoin">
|
<refentry id="repmgr-node-rejoin">
|
||||||
|
|
||||||
<indexterm>
|
<indexterm>
|
||||||
<primary>repmgr node rejoin</primary>
|
<primary>repmgr node rejoin</primary>
|
||||||
</indexterm>
|
</indexterm>
|
||||||
<title>repmgr node rejoin</title>
|
|
||||||
<para>
|
<refmeta>
|
||||||
Enables a dormant (stopped) node to be rejoined to the replication cluster.
|
<refentrytitle>repmgr node rejoin</refentrytitle>
|
||||||
</para>
|
</refmeta>
|
||||||
<para>
|
|
||||||
This can optionally use <command>pg_rewind</command> to re-integrate a node which has diverged
|
<refnamediv>
|
||||||
from the rest of the cluster, typically a failed primary.
|
<refname>repmgr node rejoin</refname>
|
||||||
</para>
|
<refpurpose>rejoin a dormant (stopped) node to the replication cluster</refpurpose>
|
||||||
</chapter>
|
</refnamediv>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Description</title>
|
||||||
|
<para>
|
||||||
|
Enables a dormant (stopped) node to be rejoined to the replication cluster.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
This can optionally use <application>pg_rewind</application> to re-integrate
|
||||||
|
a node which has diverged from the rest of the cluster, typically a failed primary.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<tip>
|
||||||
|
<para>
|
||||||
|
If the node is running and needs to be attached to the current primary, use
|
||||||
|
<xref linkend="repmgr-standby-follow">.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Note <xref linkend="repmgr-standby-follow"> can only be used for standbys which have not diverged
|
||||||
|
from the rest of the cluster.
|
||||||
|
</para>
|
||||||
|
</tip>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Usage</title>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
<programlisting>
|
||||||
|
repmgr node rejoin -d '$conninfo'</programlisting>
|
||||||
|
|
||||||
|
where <literal>$conninfo</literal> is the conninfo string of any reachable node in the cluster.
|
||||||
|
<filename>repmgr.conf</filename> for the stopped node *must* be supplied explicitly if not
|
||||||
|
otherwise available.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
|
||||||
|
<title>Options</title>
|
||||||
|
<variablelist>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--dry-run</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Check prerequisites but don't actually execute the rejoin.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--force-rewind[=/path/to/pg_rewind]</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Execute <application>pg_rewind</application>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
It is only necessary to provide the <application>pg_rewind</application> path
|
||||||
|
if using PostgreSQL 9.3 or 9.4, and <application>pg_rewind</application>
|
||||||
|
is not installed in the PostgreSQL <filename>bin</filename> directory.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--config-files</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
comma-separated list of configuration files to retain after
|
||||||
|
executing <application>pg_rewind</application>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Currently <application>pg_rewind</application> will overwrite
|
||||||
|
the local node's configuration files with the files from the source node,
|
||||||
|
so it's advisable to use this option to ensure they are kept.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--config-archive-dir</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Directory to temporarily store configuration files specified with
|
||||||
|
<option>--config-files</option>; default: <filename>/tmp</filename>.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>-W/--no-wait</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Don't wait for the node to rejoin cluster.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
If this option is supplied, &repmgr; will restart the node but
|
||||||
|
not wait for it to connect to the primary.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
</variablelist>
|
||||||
|
</refsect1>
|
||||||
|
<refsect1>
|
||||||
|
<title>Configuration file settings</title>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<literal>node_rejoin_timeout</literal>:
|
||||||
|
the maximum length of time (in seconds) to wait for
|
||||||
|
the node to reconnect to the replication cluster (defaults to
|
||||||
|
the value set in <literal>standby_reconnect_timeout</literal>,
|
||||||
|
60 seconds).
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
</itemizedlist>
|
||||||
|
</para>
|
||||||
|
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1 id="repmgr-node-rejoin-events">
|
||||||
|
<title>Event notifications</title>
|
||||||
|
<para>
|
||||||
|
A <literal>node_rejoin</literal> <link linkend="event-notifications">event notification</link> will be generated.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Notes</title>
|
||||||
|
<para>
|
||||||
|
Currently <command>repmgr node rejoin</command> can only be used to attach
|
||||||
|
a standby to the current primary, not another standby.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
The node must have been shut down cleanly; if this was not the case, it will
|
||||||
|
need to be manually started (remove any existing <filename>recovery.conf</filename> file first)
|
||||||
|
until it has reached a consistent recovery point, then shut down cleanly.
|
||||||
|
</para>
|
||||||
|
<tip>
|
||||||
|
<para>
|
||||||
|
If <application>PostgreSQL</application> is started in single-user mode and
|
||||||
|
input is directed from <filename>/dev/null/</filename>, it will perform recovery
|
||||||
|
then immediately quit, and will then be in a state suitable for use by
|
||||||
|
<application>pg_rewind</application>.
|
||||||
|
<programlisting>
|
||||||
|
rm -f /var/lib/pgsql/data/recovery.conf
|
||||||
|
postgres --single -D /var/lib/pgsql/data/ < /dev/null</programlisting>
|
||||||
|
</para>
|
||||||
|
</tip>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1 id="repmgr-node-rejoin-pg-rewind" xreflabel="Using pg_rewind">
|
||||||
|
|
||||||
|
<indexterm>
|
||||||
|
<primary>pg_rewind</primary>
|
||||||
|
<secondary>using with "repmgr node rejoin"</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<title>Using <command>pg_rewind</command></title>
|
||||||
|
<para>
|
||||||
|
<command>repmgr node rejoin</command> can optionally use <command>pg_rewind</command> to re-integrate a
|
||||||
|
node which has diverged from the rest of the cluster, typically a failed primary.
|
||||||
|
<command>pg_rewind</command> is available in PostgreSQL 9.5 and later as part of the core distribution,
|
||||||
|
and can be installed from external sources for PostgreSQL 9.3 and 9.4.
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
<command>pg_rewind</command> <emphasis>requires</emphasis> that either
|
||||||
|
<varname>wal_log_hints</varname> is enabled, or that
|
||||||
|
data checksums were enabled when the cluster was initialized. See the
|
||||||
|
<ulink url="https://www.postgresql.org/docs/current/static/app-pgrewind.html"><command>pg_rewind</command> documentation</ulink> for details.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
To have <command>repmgr node rejoin</command> use <command>pg_rewind</command>,
|
||||||
|
pass the command line option <literal>--force-rewind</literal>, which will tell &repmgr;
|
||||||
|
to execute <command>pg_rewind</command> to ensure the node can be rejoined successfully.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
Be aware that if <command>pg_rewind</command> is executed and actually performs a
|
||||||
|
rewind operation, any configuration files in the PostgreSQL data directory will be
|
||||||
|
overwritten with those from the source server.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
To prevent this happening, provide a comma-separated list of files to retain
|
||||||
|
using the <literal>--config-file</literal> command line option; the specified files
|
||||||
|
will be archived in a temporary directory (whose parent directory can be specified with
|
||||||
|
<literal>--config-archive-dir</literal>) and restored once the rewind operation is
|
||||||
|
complete.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
Example, first using <literal>--dry-run</literal>, then actually executing the
|
||||||
|
<literal>node rejoin command</literal>.
|
||||||
|
<programlisting>
|
||||||
|
$ repmgr node rejoin -f /etc/repmgr.conf -d 'host=node1 dbname=repmgr user=repmgr' \
|
||||||
|
--force-rewind --config-files=postgresql.local.conf,postgresql.conf --verbose --dry-run
|
||||||
|
NOTICE: using provided configuration file "/etc/repmgr.conf"
|
||||||
|
INFO: prerequisites for using pg_rewind are met
|
||||||
|
INFO: file "postgresql.local.conf" would be copied to "/tmp/repmgr-config-archive-node1/postgresql.local.conf"
|
||||||
|
INFO: file "postgresql.conf" would be copied to "/tmp/repmgr-config-archive-node1/postgresql.local.conf"
|
||||||
|
INFO: 2 files would have been copied to "/tmp/repmgr-config-archive-node1"
|
||||||
|
INFO: directory "/tmp/repmgr-config-archive-node1" deleted
|
||||||
|
INFO: pg_rewind would now be executed
|
||||||
|
DETAIL: pg_rewind command is:
|
||||||
|
pg_rewind -D '/var/lib/postgresql/data' --source-server='host=node1 dbname=repmgr user=repmgr'</programlisting>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
If <option>--force-rewind</option> is used with the <option>--dry-run</option> option,
|
||||||
|
this checks the prerequisites for using <application>pg_rewind</application>, but cannot
|
||||||
|
predict the outcome of actually executing <application>pg_rewind</application>.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
<programlisting>
|
||||||
|
$ repmgr node rejoin -f /etc/repmgr.conf -d 'host=node1 dbname=repmgr user=repmgr' \
|
||||||
|
--force-rewind --config-files=postgresql.local.conf,postgresql.conf --verbose
|
||||||
|
NOTICE: using provided configuration file "/etc/repmgr.conf"
|
||||||
|
INFO: prerequisites for using pg_rewind are met
|
||||||
|
INFO: 2 files copied to "/tmp/repmgr-config-archive-node1"
|
||||||
|
NOTICE: executing pg_rewind
|
||||||
|
NOTICE: 2 files copied to /var/lib/pgsql/data
|
||||||
|
INFO: directory "/tmp/repmgr-config-archive-node1" deleted
|
||||||
|
INFO: deleting "recovery.done"
|
||||||
|
INFO: setting node 1's primary to node 2
|
||||||
|
NOTICE: starting server using "pg_ctl-l /var/log/postgres/startup.log -w -D '/var/lib/pgsql/data' start"
|
||||||
|
waiting for server to start.... done
|
||||||
|
server started
|
||||||
|
NOTICE: NODE REJOIN successful
|
||||||
|
DETAIL: node 1 is now attached to node 2</programlisting>
|
||||||
|
</para>
|
||||||
|
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>See also</title>
|
||||||
|
<para>
|
||||||
|
<xref linkend="repmgr-standby-follow">
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
</refentry>
|
||||||
|
|||||||
@@ -1,16 +1,30 @@
|
|||||||
|
<refentry id="repmgr-node-status">
|
||||||
<chapter id="repmgr-node-status" xreflabel="repmgr node status">
|
|
||||||
<indexterm>
|
<indexterm>
|
||||||
<primary>repmgr node status</primary>
|
<primary>repmgr node status</primary>
|
||||||
</indexterm>
|
</indexterm>
|
||||||
<title>repmgr node status</title>
|
|
||||||
<para>
|
<refmeta>
|
||||||
Displays an overview of a node's basic information and replication
|
<refentrytitle>repmgr node status</refentrytitle>
|
||||||
status. This command must be run on the local node.
|
</refmeta>
|
||||||
</para>
|
|
||||||
<para>
|
<refnamediv>
|
||||||
Sample output (execute <command>repmgr node status</command>):
|
<refname>repmgr node status</refname>
|
||||||
<programlisting>
|
<refpurpose>show overview of a node's basic information and replication status</refpurpose>
|
||||||
|
</refnamediv>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Description</title>
|
||||||
|
<para>
|
||||||
|
Displays an overview of a node's basic information and replication
|
||||||
|
status. This command must be run on the local node.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Example</title>
|
||||||
|
<para>
|
||||||
|
<programlisting>
|
||||||
|
$ repmgr -f /etc/repmgr.conf node status
|
||||||
Node "node1":
|
Node "node1":
|
||||||
PostgreSQL version: 10beta1
|
PostgreSQL version: 10beta1
|
||||||
Total data size: 30 MB
|
Total data size: 30 MB
|
||||||
@@ -20,10 +34,58 @@
|
|||||||
Archive command: (none)
|
Archive command: (none)
|
||||||
Replication connections: 2 (of maximal 10)
|
Replication connections: 2 (of maximal 10)
|
||||||
Replication slots: 0 (of maximal 10)
|
Replication slots: 0 (of maximal 10)
|
||||||
Replication lag: n/a
|
Replication lag: n/a</programlisting>
|
||||||
</programlisting>
|
</para>
|
||||||
</para>
|
</refsect1>
|
||||||
<para>
|
|
||||||
See <xref linkend="repmgr-node-check"> to diagnose issues.
|
<refsect1>
|
||||||
</para>
|
<title>Output format</title>
|
||||||
</chapter>
|
<para>
|
||||||
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<literal>--csv</literal>: generate output in CSV format
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
</itemizedlist>
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Exit codes</title>
|
||||||
|
<para>
|
||||||
|
Following exit codes can be emitted by <command>repmgr node status</command>:
|
||||||
|
</para>
|
||||||
|
<variablelist>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>SUCCESS (0)</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
No issues were detected.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>ERR_NODE_STATUS (25)</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
One or more issues were detected.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
</variablelist>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>See also</title>
|
||||||
|
<para>
|
||||||
|
See <xref linkend="repmgr-node-check"> to diagnose issues and <xref linkend="repmgr-cluster-show">
|
||||||
|
for an overview of all nodes in the cluster.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
</refentry>
|
||||||
|
|||||||
@@ -1,18 +1,93 @@
|
|||||||
<chapter id="repmgr-primary-register" xreflabel="repmgr primary register">
|
<refentry id="repmgr-primary-register">
|
||||||
<indexterm><primary>repmgr primary register</primary></indexterm>
|
<indexterm>
|
||||||
<title>repmgr primary register</title>
|
<primary>repmgr primary register</primary>
|
||||||
<para>
|
</indexterm>
|
||||||
<command>repmgr primary register</command> registers a primary node in a
|
|
||||||
streaming replication cluster, and configures it for use with repmgr, including
|
<refmeta>
|
||||||
installing the &repmgr; extension. This command needs to be executed before any
|
<refentrytitle>repmgr primary register</refentrytitle>
|
||||||
standby nodes are registered.
|
</refmeta>
|
||||||
</para>
|
|
||||||
<para>
|
<refnamediv>
|
||||||
Execute with the <literal>--dry-run</literal> option to check what would happen without
|
<refname>repmgr primary register</refname>
|
||||||
actually registering the primary.
|
<refpurpose>initialise a repmgr installation and register the primary node</refpurpose>
|
||||||
</para>
|
</refnamediv>
|
||||||
<para>
|
|
||||||
<command>repmgr master register</command> can be used as an alias for
|
|
||||||
<command>repmgr primary register</command>.
|
<refsect1>
|
||||||
</para>
|
<title>Description</title>
|
||||||
</chapter>
|
<para>
|
||||||
|
<command>repmgr primary register</command> registers a primary node in a
|
||||||
|
streaming replication cluster, and configures it for use with &repmgr;, including
|
||||||
|
installing the &repmgr; extension. This command needs to be executed before any
|
||||||
|
standby nodes are registered.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Execution</title>
|
||||||
|
<para>
|
||||||
|
Execute with the <option>--dry-run</option> option to check what would happen without
|
||||||
|
actually registering the primary.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
<command>repmgr master register</command> can be used as an alias for
|
||||||
|
<command>repmgr primary register</command>.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
If providing the configuration file location with <option>-f/--config-file</option>,
|
||||||
|
avoid using a relative path, as &repmgr; stores the configuration file location
|
||||||
|
in the repmgr metadata for use when &repmgr; is executed remotely (e.g. during
|
||||||
|
<xref linkend="repmgr-standby-switchover">). &repmgr; will attempt to convert the
|
||||||
|
a relative path into an absolute one, but this may not be the same as the path you
|
||||||
|
would explicitly provide (e.g. <filename>./repmgr.conf</filename> might be converted
|
||||||
|
to <filename>/path/to/./repmgr.conf</filename>, whereas you'd normally write
|
||||||
|
<filename>/path/to/repmgr.conf</filename>).
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
|
||||||
|
<title>Options</title>
|
||||||
|
<variablelist>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--dry-run</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Check prerequisites but don't actually register the primary.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>-F</option>, <option>--force</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Overwrite an existing node record
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
</variablelist>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
|
||||||
|
<refsect1 id="repmgr-primary-register-events">
|
||||||
|
<title>Event notifications</title>
|
||||||
|
<para>
|
||||||
|
Following <link linkend="event-notifications">event notifications</link> will be generated:
|
||||||
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal>cluster_created</literal></simpara>
|
||||||
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara><literal>primary_register</literal></simpara>
|
||||||
|
</listitem>
|
||||||
|
</itemizedlist>
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
</refentry>
|
||||||
|
|||||||
@@ -1,18 +1,74 @@
|
|||||||
<chapter id="repmgr-primary-unregister" xreflabel="repmgr primary unregister">
|
<refentry id="repmgr-primary-unregister">
|
||||||
<indexterm><primary>repmgr primary unregister</primary></indexterm>
|
<indexterm>
|
||||||
<title>repmgr primary unregister</title>
|
<primary>repmgr primary unregister</primary>
|
||||||
<para>
|
</indexterm>
|
||||||
<command>repmgr primary register</command> unregisters an inactive primary node
|
<refmeta>
|
||||||
from the &repmgr; metadata. This is typically when the primary has failed and is
|
<refentrytitle>repmgr primary unregister</refentrytitle>
|
||||||
being removed from the cluster after a new primary has been promoted.
|
</refmeta>
|
||||||
</para>
|
<refnamediv>
|
||||||
<para>
|
<refname>repmgr primary unregister</refname>
|
||||||
Execute with the <literal>--dry-run</literal> option to check what would happen without
|
<refpurpose>unregister an inactive primary node</refpurpose>
|
||||||
actually unregistering the node.
|
</refnamediv>
|
||||||
</para>
|
|
||||||
|
|
||||||
<para>
|
<refsect1>
|
||||||
<command>repmgr master unregister</command> can be used as an alias for
|
<title>Description</title>
|
||||||
<command>repmgr primary unregister</command>/
|
<para>
|
||||||
</para>
|
<command>repmgr primary unregister</command> unregisters an inactive primary node
|
||||||
</chapter>
|
from the &repmgr; metadata. This is typically when the primary has failed and is
|
||||||
|
being removed from the cluster after a new primary has been promoted.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Execution</title>
|
||||||
|
<para>
|
||||||
|
<command>repmgr primary unregister</command> can be run on any active &repmgr; node,
|
||||||
|
with the ID of the node to unregister passed as <option>--node-id</option>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Execute with the <literal>--dry-run</literal> option to check what would happen without
|
||||||
|
actually unregistering the node.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
<command>repmgr master unregister</command> can be used as an alias for
|
||||||
|
<command>repmgr primary unregister</command>.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
|
||||||
|
<title>Options</title>
|
||||||
|
|
||||||
|
<variablelist>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--dry-run</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Check prerequisites but don't actually unregister the primary.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--node-id</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
ID of the inactive primary to be unregistered.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
</variablelist>
|
||||||
|
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1 id="repmgr-primary-unregister-events">
|
||||||
|
<title>Event notifications</title>
|
||||||
|
<para>
|
||||||
|
A <literal>primary_unregister</literal> <link linkend="event-notifications">event notification</link> will be generated.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
</refentry>
|
||||||
|
|||||||
@@ -1,25 +1,39 @@
|
|||||||
<chapter id="repmgr-standby-clone" xreflabel="repmgr standby clone">
|
<refentry id="repmgr-standby-clone">
|
||||||
<indexterm>
|
<indexterm>
|
||||||
<primary>repmgr standby clone</primary>
|
<primary>repmgr standby clone</primary>
|
||||||
<seealso>cloning</seealso>
|
<seealso>cloning</seealso>
|
||||||
</indexterm>
|
</indexterm>
|
||||||
<title>repmgr standby clone</title>
|
|
||||||
<para>
|
<refmeta>
|
||||||
<command>repmgr standby clone</command> clones a PostgreSQL node from another
|
<refentrytitle>repmgr standby clone</refentrytitle>
|
||||||
PostgreSQL node, typically the primary, but optionally from any other node in
|
</refmeta>
|
||||||
the cluster or from Barman. It creates the <filename>recovery.conf</filename> file required
|
|
||||||
to attach the cloned node to the primary node (or another standby, if cascading replication
|
<refnamediv>
|
||||||
is in use).
|
<refname>repmgr standby clone</refname>
|
||||||
</para>
|
<refpurpose>clone a PostgreSQL standby node from another PostgreSQL node</refpurpose>
|
||||||
<note>
|
</refnamediv>
|
||||||
<simpara>
|
|
||||||
<command>repmgr standby clone</command> does not start the standby, and after cloning
|
<refsect1>
|
||||||
<command>repmgr standby register</command> must be executed to notify &repmgr; of its presence.
|
<title>Description</title>
|
||||||
</simpara>
|
<para>
|
||||||
</note>
|
<command>repmgr standby clone</command> clones a PostgreSQL node from another
|
||||||
|
PostgreSQL node, typically the primary, but optionally from any other node in
|
||||||
|
the cluster or from Barman. It creates the <filename>recovery.conf</filename> file required
|
||||||
|
to attach the cloned node to the primary node (or another standby, if cascading replication
|
||||||
|
is in use).
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<simpara>
|
||||||
|
<command>repmgr standby clone</command> does not start the standby, and after cloning
|
||||||
|
a standby, the command <command>repmgr standby register</command> must be executed to
|
||||||
|
notify &repmgr; of its existence.
|
||||||
|
</simpara>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
|
||||||
<sect1 id="repmgr-standby-clone-config-file-copying" xreflabel="Copying configuration files">
|
<refsect1 id="repmgr-standby-clone-config-file-copying" xreflabel="Copying configuration files">
|
||||||
<title>Handling configuration files</title>
|
<title>Handling configuration files</title>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
@@ -35,7 +49,7 @@
|
|||||||
not be copied by default. &repmgr; can copy these files, either to the same
|
not be copied by default. &repmgr; can copy these files, either to the same
|
||||||
location on the standby server (provided appropriate directory and file permissions
|
location on the standby server (provided appropriate directory and file permissions
|
||||||
are available), or into the standby's data directory. This requires passwordless
|
are available), or into the standby's data directory. This requires passwordless
|
||||||
SSH access to the primary server. Add the option <literal>--copy-external-config-files</literal>
|
SSH access to the primary server. Add the option <option>--copy-external-config-files</option>
|
||||||
to the <command>repmgr standby clone</command> command; by default files will be copied to
|
to the <command>repmgr standby clone</command> command; by default files will be copied to
|
||||||
the same path as on the upstream server. Note that the user executing <command>repmgr</command>
|
the same path as on the upstream server. Note that the user executing <command>repmgr</command>
|
||||||
must have write access to those directories.
|
must have write access to those directories.
|
||||||
@@ -45,20 +59,101 @@
|
|||||||
<literal>--copy-external-config-files=pgdata</literal>, but note that
|
<literal>--copy-external-config-files=pgdata</literal>, but note that
|
||||||
any include directives in the copied files may need to be updated.
|
any include directives in the copied files may need to be updated.
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
When executing <command>repmgr standby clone</command> with the
|
||||||
|
<option>--copy-external-config-files</option> aand <option>--dry-run</option>
|
||||||
|
options, &repmgr; will check the SSH connection to the source node, but
|
||||||
|
will not verify whether the files can actually be copied.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
During the actual clone operation, a check will be made before the database itself
|
||||||
|
is cloned to determine whether the files can actually be copied; if any problems are
|
||||||
|
encountered, the clone operation will be aborted, enabling the user to fix
|
||||||
|
any issues before retrying the clone operation.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
<tip>
|
<tip>
|
||||||
<simpara>
|
<simpara>
|
||||||
For reliable configuration file management we recommend using a
|
For reliable configuration file management we recommend using a
|
||||||
configuration management tool such as Ansible, Chef, Puppet or Salt.
|
configuration management tool such as Ansible, Chef, Puppet or Salt.
|
||||||
</simpara>
|
</simpara>
|
||||||
</tip>
|
</tip>
|
||||||
</sect1>
|
|
||||||
|
|
||||||
<sect1 id="repmgr-standby-clone-wal-management" xreflabel="Managing WAL during the cloning process">
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1 id="repmgr-standby-clone-recovery-conf">
|
||||||
|
<indexterm>
|
||||||
|
<primary>recovery.conf</primary>
|
||||||
|
<secondary>customising with "repmgr standby clone"</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<title>Customising recovery.conf</title>
|
||||||
|
<para>
|
||||||
|
By default, &repmgr; will create a minimal <filename>recovery.conf</filename>
|
||||||
|
containing following parameters:
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara><varname>standby_mode</varname> (always <literal>'on'</literal>)</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara><varname>recovery_target_timeline</varname> (always <literal>'latest'</literal>)</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara><varname>primary_conninfo</varname></simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara><varname>primary_slot_name</varname> (if replication slots in use)</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
</itemizedlist>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
The following additional parameters can be specified in <filename>repmgr.conf</filename>
|
||||||
|
for inclusion in <filename>recovery.conf</filename>:
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara><varname>restore_command</varname></simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara><varname>archive_cleanup_command</varname></simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara><varname>recovery_min_apply_delay</varname></simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
</itemizedlist>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
We recommend using <ulink url="https://www.pgbarman.org/">Barman</ulink> to manage
|
||||||
|
WAL file archiving. For more details on combining &repmgr; and <application>Barman</application>,
|
||||||
|
in particular using <varname>restore_command</varname> to configure Barman as a backup source of
|
||||||
|
WAL files, see <xref linkend="cloning-from-barman">.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1 id="repmgr-standby-clone-wal-management">
|
||||||
<title>Managing WAL during the cloning process</title>
|
<title>Managing WAL during the cloning process</title>
|
||||||
<para>
|
<para>
|
||||||
When initially cloning a standby, you will need to ensure
|
When initially cloning a standby, you will need to ensure
|
||||||
that all required WAL files remain available while the cloning is taking
|
that all required WAL files remain available while the cloning is taking
|
||||||
place. To ensure this happens when using the default `pg_basebackup` method,
|
place. To ensure this happens when using the default <command>pg_basebackup</command> method,
|
||||||
&repmgr; will set <command>pg_basebackup</command>'s <literal>--xlog-method</literal>
|
&repmgr; will set <command>pg_basebackup</command>'s <literal>--xlog-method</literal>
|
||||||
parameter to <literal>stream</literal>,
|
parameter to <literal>stream</literal>,
|
||||||
which will ensure all WAL files generated during the cloning process are
|
which will ensure all WAL files generated during the cloning process are
|
||||||
@@ -86,6 +181,187 @@
|
|||||||
<literal>--wal-method</literal>.
|
<literal>--wal-method</literal>.
|
||||||
</simpara>
|
</simpara>
|
||||||
</note>
|
</note>
|
||||||
</sect1>
|
</refsect1>
|
||||||
</chapter>
|
|
||||||
|
|
||||||
|
<refsect1 id="repmgr-standby-create-recovery-conf">
|
||||||
|
|
||||||
|
<indexterm>
|
||||||
|
<primary>recovery.conf</primary>
|
||||||
|
<secondary>generating for a standby cloned by another method</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<title>Using a standby cloned by another method</title>
|
||||||
|
<para>
|
||||||
|
&repmgr; supports standbys cloned by another method (e.g. using <application>barman</application>'s
|
||||||
|
<command><ulink url="http://docs.pgbarman.org/release/2.4/#recover">barman recover</ulink></command> command).
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
To integrate the standby as a &repmgr; node, ensure the <filename>repmgr.conf</filename>
|
||||||
|
file is created for the node, and that it has been registered using
|
||||||
|
<command><link linkend="repmgr-standby-register">repmgr standby register</link></command>.
|
||||||
|
Then execute the command <command>repmgr standby clone --recovery-conf-only</command>.
|
||||||
|
This will create the <filename>recovery.conf</filename> file needed to attach
|
||||||
|
the node to its upstream, and will also create a replication slot on the
|
||||||
|
upstream node if required.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Note that the upstream node must be running. An existing
|
||||||
|
<filename>recovery.conf</filename> will not be overwritten unless the
|
||||||
|
<option>-F/--force</option> option is provided.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Execute <command>repmgr standby clone --recovery-conf-only --dry-run</command>
|
||||||
|
to check the prerequisites for creating the <filename>recovery.conf</filename> file,
|
||||||
|
and display the contents of the file without actually creating it.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
<option>--recovery-conf-only</option> was introduced in &repmgr; <link linkend="release-4.0.4">4.0.4</link>.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
|
||||||
|
<title>Options</title>
|
||||||
|
|
||||||
|
<variablelist>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>-d, --dbname=CONNINFO</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Connection string of the upstream node to use for cloning.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--dry-run</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Check prerequisites but don't actually clone the standby.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
If <option>--recovery-conf-only</option> specified, the contents of
|
||||||
|
the generated <filename>recovery.conf</filename> file will be displayed
|
||||||
|
but the file itself not written.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>-c, --fast-checkpoint</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Force fast checkpoint (not effective when cloning from Barman).
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--copy-external-config-files[={samepath|pgdata}]</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Copy configuration files located outside the data directory on the source
|
||||||
|
node to the same path on the standby (default) or to the
|
||||||
|
PostgreSQL data directory.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--no-upstream-connection</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
When using Barman, do not connect to upstream node.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>-R, --remote-user=USERNAME</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Remote system username for SSH operations (default: current local system username).
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option> --recovery-conf-only</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Create <filename>recovery.conf</filename> file for a previously cloned instance. &repmgr 4.0.4 and later.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--replication-user</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
User to make replication connections with (optional, not usually required).
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--superuser</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
If the &repmgr; user is not a superuser, the name of a valid superuser must
|
||||||
|
be provided with this option.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--upstream-conninfo</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
<literal>primary_conninfo</literal> value to write in recovery.conf
|
||||||
|
when the intended upstream server does not yet exist.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--upstream-node-id</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
ID of the upstream node to replicate from (optional, defaults to primary node)
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--without-barman </option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Do not use Barman even if configured.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
</variablelist>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1 id="repmgr-standby-clone-events">
|
||||||
|
<title>Event notifications</title>
|
||||||
|
<para>
|
||||||
|
A <literal>standby_clone</literal> <link linkend="event-notifications">event notification</link> will be generated.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>See also</title>
|
||||||
|
<para>
|
||||||
|
See <xref linkend="cloning-standbys"> for details about various aspects of cloning.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
</refentry>
|
||||||
|
|
||||||
|
|||||||
@@ -1,21 +1,116 @@
|
|||||||
<chapter id="repmgr-standby-follow" xreflabel="repmgr standby follow">
|
<refentry id="repmgr-standby-follow">
|
||||||
<indexterm>
|
<indexterm>
|
||||||
<primary>repmgr standby follow</primary>
|
<primary>repmgr standby follow</primary>
|
||||||
</indexterm>
|
</indexterm>
|
||||||
<title>repmgr standby follow</title>
|
|
||||||
<para>
|
<refmeta>
|
||||||
Attaches the standby to a new primary. This command requires a valid
|
<refentrytitle>repmgr standby follow</refentrytitle>
|
||||||
<filename>repmgr.conf</filename> file for the standby, either specified
|
</refmeta>
|
||||||
explicitly with <literal>-f/--config-file</literal> or located in a
|
|
||||||
default location; no additional arguments are required.
|
<refnamediv>
|
||||||
</para>
|
<refname>repmgr standby follow</refname>
|
||||||
<para>
|
<refpurpose>attach a standby to a new primary</refpurpose>
|
||||||
This command will force a restart of the standby server, which must be
|
</refnamediv>
|
||||||
running. It can only be used to attach a standby to a new primary node.
|
|
||||||
</para>
|
<refsect1>
|
||||||
<para>
|
<title>Description</title>
|
||||||
To re-add an inactive node to the replication cluster, see
|
|
||||||
<xref linkend="repmgr-node-rejoin">
|
<para>
|
||||||
</para>
|
Attaches the standby to a new primary. This command requires a valid
|
||||||
</chapter>
|
<filename>repmgr.conf</filename> file for the standby, either specified
|
||||||
|
explicitly with <literal>-f/--config-file</literal> or located in a
|
||||||
|
default location; no additional arguments are required.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
This command will force a restart of the standby server, which must be
|
||||||
|
running. It can only be used to attach an active standby to the current primary node
|
||||||
|
(and not to another standby).
|
||||||
|
</para>
|
||||||
|
<tip>
|
||||||
|
<para>
|
||||||
|
To re-add an inactive node to the replication cluster, use
|
||||||
|
<xref linkend="repmgr-node-rejoin">.
|
||||||
|
</para>
|
||||||
|
</tip>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
<command>repmgr standby follow</command> will wait up to
|
||||||
|
<varname>standby_follow_timeout</varname> seconds (default: <literal>30</literal>)
|
||||||
|
to verify the standby has actually connected to the new primary.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Example</title>
|
||||||
|
<para>
|
||||||
|
<programlisting>
|
||||||
|
$ repmgr -f /etc/repmgr.conf standby follow
|
||||||
|
INFO: setting node 3's primary to node 2
|
||||||
|
NOTICE: restarting server using "pg_ctl -l /var/log/postgres/startup.log -w -D '/var/lib/postgres/data' restart"
|
||||||
|
waiting for server to shut down........ done
|
||||||
|
server stopped
|
||||||
|
waiting for server to start.... done
|
||||||
|
server started
|
||||||
|
NOTICE: STANDBY FOLLOW successful
|
||||||
|
DETAIL: node 3 is now attached to node 2</programlisting>
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Options</title>
|
||||||
|
<variablelist>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--dry-run</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Check prerequisites but don't actually follow a new standby.
|
||||||
|
</para>
|
||||||
|
<important>
|
||||||
|
<para>
|
||||||
|
This does not guarantee the standby can follow the primary; in
|
||||||
|
particular, whether the primary and standby timelines have diverged,
|
||||||
|
can currently only be determined by actually attempting to
|
||||||
|
attach the standby to the primary.
|
||||||
|
</para>
|
||||||
|
</important>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>-w</option></term>
|
||||||
|
<term><option>--wait</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Wait for a primary to appear. &repmgr; will wait for up to
|
||||||
|
<varname>primary_follow_timeout</varname> seconds
|
||||||
|
(default: 60 seconds) to verify that the standby is following the new primary.
|
||||||
|
This value can be defined in <filename>repmgr.conf</filename>.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
</variablelist>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1 id="repmgr-standby-follow-events">
|
||||||
|
<title>Event notifications</title>
|
||||||
|
<para>
|
||||||
|
A <literal>standby_follow</literal> <link linkend="event-notifications">event notification</link> will be generated.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
If provided, &repmgr; will substitute the placeholders <literal>%p</literal> with the node ID of the primary
|
||||||
|
being followed, <literal>%c</literal> with its <literal>conninfo</literal> string, and
|
||||||
|
<literal>%a</literal> with its node name.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>See also</title>
|
||||||
|
<para>
|
||||||
|
<xref linkend="repmgr-node-rejoin">
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
</refentry>
|
||||||
|
|
||||||
|
|||||||
@@ -1,18 +1,60 @@
|
|||||||
<chapter id="repmgr-standby-promote" xreflabel="repmgr standby promote">
|
<refentry id="repmgr-standby-promote">
|
||||||
<indexterm>
|
<indexterm>
|
||||||
<primary>repmgr standby promote</primary>
|
<primary>repmgr standby promote</primary>
|
||||||
</indexterm>
|
</indexterm>
|
||||||
<title>repmgr standby promote</title>
|
|
||||||
<para>
|
<refmeta>
|
||||||
Promotes a standby to a primary if the current primary has failed. This
|
<refentrytitle>repmgr standby promote</refentrytitle>
|
||||||
command requires a valid <filename>repmgr.conf</filename> file for the standby, either
|
</refmeta>
|
||||||
specified explicitly with <literal>-f/--config-file</literal> or located in a
|
|
||||||
default location; no additional arguments are required.
|
<refnamediv>
|
||||||
</para>
|
<refname>repmgr standby promote</refname>
|
||||||
<para>
|
<refpurpose>promote a standby to a primary</refpurpose>
|
||||||
If the standby promotion succeeds, the server will not need to be
|
</refnamediv>
|
||||||
restarted. However any other standbys will need to follow the new server,
|
|
||||||
by using <xref linkend="repmgr-standby-follow">; if <command>repmgrd</command>
|
<refsect1>
|
||||||
is active, it will handle this automatically.
|
<title>Description</title>
|
||||||
</para>
|
<para>
|
||||||
</chapter>
|
Promotes a standby to a primary if the current primary has failed. This
|
||||||
|
command requires a valid <filename>repmgr.conf</filename> file for the standby, either
|
||||||
|
specified explicitly with <literal>-f/--config-file</literal> or located in a
|
||||||
|
default location; no additional arguments are required.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
If the standby promotion succeeds, the server will not need to be
|
||||||
|
restarted. However any other standbys will need to follow the new server,
|
||||||
|
by using <xref linkend="repmgr-standby-follow">; if <application>repmgrd</application>
|
||||||
|
is active, it will handle this automatically.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Note that &repmgr; will wait for up to <varname>promote_check_timeout</varname> seconds
|
||||||
|
(default: 60 seconds) to verify that the standby has been promoted, and will
|
||||||
|
check the promotion every <varname>promote_check_interval</varname> seconds (default: 1 second).
|
||||||
|
Both values can be defined in <filename>repmgr.conf</filename>.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Example</title>
|
||||||
|
<para>
|
||||||
|
<programlisting>
|
||||||
|
$ repmgr -f /etc/repmgr.conf standby promote
|
||||||
|
NOTICE: promoting standby to primary
|
||||||
|
DETAIL: promoting server "node2" (ID: 2) using "pg_ctl -l /var/log/postgres/startup.log -w -D '/var/lib/postgres/data' promote"
|
||||||
|
server promoting
|
||||||
|
DEBUG: setting node 2 as primary and marking existing primary as failed
|
||||||
|
NOTICE: STANDBY PROMOTE successful
|
||||||
|
DETAIL: server "node2" (ID: 2) was successfully promoted to primary</programlisting>
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
|
||||||
|
<refsect1 id="repmgr-standby-promote-events">
|
||||||
|
<title>Event notifications</title>
|
||||||
|
<para>
|
||||||
|
A <literal>standby_promote</literal> <link linkend="event-notifications">event notification</link> will be generated.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
</refentry>
|
||||||
|
|||||||
@@ -1,50 +1,183 @@
|
|||||||
<chapter id="repmgr-standby-register" xreflabel="repmgr standby register">
|
<refentry id="repmgr-standby-register" xreflabel="repmgr standby register">
|
||||||
<indexterm><primary>repmgr standby register</primary></indexterm>
|
<indexterm>
|
||||||
<title>repmgr standby register</title>
|
<primary>repmgr standby register</primary>
|
||||||
<para>
|
</indexterm>
|
||||||
<command>repmgr standby register</command> adds a standby's information to
|
|
||||||
the &repmgr; metadata. This command needs to be executed to enable
|
|
||||||
promote/follow operations and to allow <command>repmgrd</command> to work with the node.
|
|
||||||
An existing standby can be registered using this command. Execute with the
|
|
||||||
<literal>--dry-run</literal> option to check what would happen without actually registering the
|
|
||||||
standby.
|
|
||||||
</para>
|
|
||||||
|
|
||||||
<sect1 id="repmgr-standby-register-wait" xreflabel="repmgr standby register --wait">
|
<refmeta>
|
||||||
|
<refentrytitle>repmgr standby register</refentrytitle>
|
||||||
|
</refmeta>
|
||||||
|
|
||||||
|
<refnamediv>
|
||||||
|
<refname>repmgr standby register</refname>
|
||||||
|
<refpurpose>add a standby's information to the &repmgr; metadata</refpurpose>
|
||||||
|
</refnamediv>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Description</title>
|
||||||
|
<para>
|
||||||
|
<command>repmgr standby register</command> adds a standby's information to
|
||||||
|
the &repmgr; metadata. This command needs to be executed to enable
|
||||||
|
promote/follow operations and to allow <application>repmgrd</application> to work with the node.
|
||||||
|
An existing standby can be registered using this command. Execute with the
|
||||||
|
<literal>--dry-run</literal> option to check what would happen without actually registering the
|
||||||
|
standby.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
If providing the configuration file location with <literal>-f/--config-file</literal>,
|
||||||
|
avoid using a relative path, as &repmgr; stores the configuration file location
|
||||||
|
in the repmgr metadata for use when &repmgr; is executed remotely (e.g. during
|
||||||
|
<xref linkend="repmgr-standby-switchover">). &repmgr; will attempt to convert the
|
||||||
|
a relative path into an absolute one, but this may not be the same as the path you
|
||||||
|
would explicitly provide (e.g. <filename>./repmgr.conf</filename> might be converted
|
||||||
|
to <filename>/path/to/./repmgr.conf</filename>, whereas you'd normally write
|
||||||
|
<filename>/path/to/repmgr.conf</filename>).
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1 id="repmgr-standby-register-wait-start" xreflabel="repmgr standby register --wait-start">
|
||||||
|
<title>Waiting for the the standby to start</title>
|
||||||
|
<para>
|
||||||
|
By default, &repmgr; will wait 30 seconds for the standby to become available before
|
||||||
|
aborting with a connection error. This is useful when setting up a standby from a script,
|
||||||
|
as the standby may not have fully started up by the time <command>repmgr standby register</command>
|
||||||
|
is executed.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
To change the timeout, pass the desired value with the <literal>--wait-start</literal> option.
|
||||||
|
A value of <literal>0</literal> will disable the timeout.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
The timeout will be ignored if <literal>-F/--force</literal> was provided.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1 id="repmgr-standby-register-wait-sync" xreflabel="repmgr standby register --wait-sync">
|
||||||
<title>Waiting for the registration to propagate to the standby</title>
|
<title>Waiting for the registration to propagate to the standby</title>
|
||||||
<para>
|
<para>
|
||||||
Depending on your environment and workload, it may take some time for
|
Depending on your environment and workload, it may take some time for the standby's node record
|
||||||
the standby's node record to propagate from the primary to the standby. Some
|
to propagate from the primary to the standby. Some actions (such as starting
|
||||||
actions (such as starting <command>repmgrd</command>) require that the standby's node record
|
<application>repmgrd</application>) require that the standby's node record
|
||||||
is present and up-to-date to function correctly.
|
is present and up-to-date to function correctly.
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
By providing the option <literal>--wait-sync</literal> to the
|
By providing the option <option>--wait-sync</option> to the
|
||||||
<command>repmgr standby register</command> command, &repmgr; will wait
|
<command>repmgr standby register</command> command, &repmgr; will wait
|
||||||
until the record is synchronised before exiting. An optional timeout (in
|
until the record is synchronised before exiting. An optional timeout (in
|
||||||
seconds) can be added to this option (e.g. <literal>--wait-sync=60</literal>).
|
seconds) can be added to this option (e.g. <option>--wait-sync=60</option>).
|
||||||
</para>
|
</para>
|
||||||
</sect1>
|
</refsect1>
|
||||||
|
|
||||||
<sect1 id="rempgr-standby-register-inactive-node" xreflabel="Registering an inactive node">
|
<refsect1 id="repmgr-standby-register-inactive-node" xreflabel="Registering an inactive node">
|
||||||
<title>Registering an inactive node</title>
|
<title>Registering an inactive node</title>
|
||||||
<para>
|
<para>
|
||||||
Under some circumstances you may wish to register a standby which is not
|
Under some circumstances you may wish to register a standby which is not
|
||||||
yet running; this can be the case when using provisioning tools to create
|
yet running; this can be the case when using provisioning tools to create
|
||||||
a complex replication cluster. In this case, by using the <literal>-F/--force</literal>
|
a complex replication cluster. In this case, by using the <option>-F/--force</option>
|
||||||
option and providing the connection parameters to the primary server,
|
option and providing the connection parameters to the primary server,
|
||||||
the standby can be registered.
|
the standby can be registered.
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
Similarly, with cascading replication it may be necessary to register
|
Similarly, with cascading replication it may be necessary to register
|
||||||
a standby whose upstream node has not yet been registered - in this case,
|
a standby whose upstream node has not yet been registered - in this case,
|
||||||
using <literal>-F/--force</literal> will result in the creation of an inactive placeholder
|
using <option>-F/--force</option> will result in the creation of an inactive placeholder
|
||||||
record for the upstream node, which will however later need to be registered
|
record for the upstream node, which will however later need to be registered
|
||||||
with the <literal>-F/--force</literal> option too.
|
with the <option>-F/--force</option> option too.
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
When used with <command>repmgr standby register</command>, care should be taken that use of the
|
When used with <command>repmgr standby register</command>, care should be taken that use of the
|
||||||
<literal>-F/--force</literal> option does not result in an incorrectly configured cluster.
|
<option>-F/--force</option> option does not result in an incorrectly configured cluster.
|
||||||
</para>
|
</para>
|
||||||
</sect1>
|
</refsect1>
|
||||||
</chapter>
|
|
||||||
|
<refsect1 id="repmgr-standby-register-node-cloned-other-source">
|
||||||
|
<title>Registering a node not cloned by repmgr</title>
|
||||||
|
<para>
|
||||||
|
If you've cloned a standby using another method (e.g. <application>barman</application>'s
|
||||||
|
<command>barman recover</command> command), first execute
|
||||||
|
<link linkend="repmgr-standby-create-recovery-conf">repmgr standby clone --recovery-conf-only</link>
|
||||||
|
to add the <filename>recovery.conf</filename> file, then register the standby as usual.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
|
||||||
|
<title>Options</title>
|
||||||
|
|
||||||
|
<variablelist>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--dry-run</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Check prerequisites but don't actually register the standby.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>-F</option><option>--force</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Overwrite an existing node record
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--upstream-node-id</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
ID of the upstream node to replicate from (optional)
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--wait-start</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
wait for the standby to start (timeout in seconds, default 30 seconds)
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--wait-sync</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
wait for the node record to synchronise to the standby (optional timeout in seconds)
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
|
||||||
|
</variablelist>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1 id="repmgr-standby-register-events">
|
||||||
|
<title>Event notifications</title>
|
||||||
|
<para>
|
||||||
|
A <literal>standby_register</literal> <link linkend="event-notifications">event notification</link>
|
||||||
|
will be generated immediately after the node record is updated on the primary.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
If the <option>--wait-sync</option> option is provided, a <literal>standby_register_sync</literal>
|
||||||
|
event notification will be generated immediately after the node record has synchronised to the
|
||||||
|
standby.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
If provided, &repmgr; will substitute the placeholders <literal>%p</literal> with the node ID of the
|
||||||
|
primary node, <literal>%c</literal> with its <literal>conninfo</literal> string, and
|
||||||
|
<literal>%a</literal> with its node name.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
</refentry>
|
||||||
|
|||||||
@@ -1,27 +1,289 @@
|
|||||||
<chapter id="repmgr-standby-switchover" xreflabel="repmgr standby switchover">
|
<refentry id="repmgr-standby-switchover">
|
||||||
<indexterm>
|
<indexterm>
|
||||||
<primary>repmgr standby switchover</primary>
|
<primary>repmgr standby switchover</primary>
|
||||||
</indexterm>
|
</indexterm>
|
||||||
<title>repmgr standby switchover</title>
|
|
||||||
<para>
|
<refmeta>
|
||||||
Promotes a standby to primary and demotes the existing primary to a standby.
|
<refentrytitle>repmgr standby switchover</refentrytitle>
|
||||||
This command must be run on the standby to be promoted, and requires a
|
</refmeta>
|
||||||
passwordless SSH connection to the current primary.
|
|
||||||
</para>
|
<refnamediv>
|
||||||
<para>
|
<refname>repmgr standby switchover</refname>
|
||||||
If other standbys are connected to the demotion candidate, &repmgr; can instruct
|
<refpurpose>promote a standby to primary and demote the existing primary to a standby</refpurpose>
|
||||||
these to follow the new primary if the option <literal>--siblings-follow</literal>
|
</refnamediv>
|
||||||
is specified.
|
|
||||||
</para>
|
|
||||||
<para>
|
<refsect1>
|
||||||
Execute with the <literal>--dry-run</literal> option to test the switchover as far as
|
<title>Description</title>
|
||||||
possible without actually changing the status of either node.
|
|
||||||
</para>
|
<para>
|
||||||
<para>
|
Promotes a standby to primary and demotes the existing primary to a standby.
|
||||||
<command>repmgrd</command> should not be active on any nodes while a switchover is being
|
This command must be run on the standby to be promoted, and requires a
|
||||||
executed. This restriction may be lifted in a later version.
|
passwordless SSH connection to the current primary.
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
For more details see the section <xref linkend="performing-switchover">.
|
If other standbys are connected to the demotion candidate, &repmgr; can instruct
|
||||||
</para>
|
these to follow the new primary if the option <literal>--siblings-follow</literal>
|
||||||
</chapter>
|
is specified. This requires a passwordless SSH connection between the promotion
|
||||||
|
candidate (new primary) and the standbys attached to the demotion candidate
|
||||||
|
(existing primary).
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
Performing a switchover is a non-trivial operation. In particular it
|
||||||
|
relies on the current primary being able to shut down cleanly and quickly.
|
||||||
|
&repmgr; will attempt to check for potential issues but cannot guarantee
|
||||||
|
a successful switchover.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
&repmgr; will refuse to perform the switchover if an exclusive backup is running on
|
||||||
|
the current primary.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
<para>
|
||||||
|
For more details on performing a switchover, including preparation and configuration,
|
||||||
|
see section <xref linkend="performing-switchover">.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
From <link linkend="release-4.2">repmgr 4.2</link>, &repmgr; will instruct any running
|
||||||
|
<application>repmgrd</application> instances to pause operations while the switchover
|
||||||
|
is being carried out, to prevent <application>repmgrd</application> from
|
||||||
|
unintentionally promoting a node. For more details, see <xref linkend="repmgrd-pausing">.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Users of &repmgr; versions prior to 4.2 should ensure that <application>repmgrd</application>
|
||||||
|
is not running on any nodes while a switchover is being executed.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Options</title>
|
||||||
|
<variablelist>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--always-promote</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Promote standby to primary, even if it is behind or has diverged
|
||||||
|
from the original primary. The original primary will be shut down in any case,
|
||||||
|
and will need to be manually reintegrated into the replication cluster.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--dry-run</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Check prerequisites but don't actually execute a switchover.
|
||||||
|
</para>
|
||||||
|
<important>
|
||||||
|
<para>
|
||||||
|
Success of <option>--dry-run</option> does not imply the switchover will
|
||||||
|
complete successfully, only that
|
||||||
|
the prerequisites for performing the operation are met.
|
||||||
|
</para>
|
||||||
|
</important>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>-F</option></term>
|
||||||
|
<term><option>--force</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Ignore warnings and continue anyway.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Specifically, if a problem is encountered when shutting down the current primary,
|
||||||
|
using <option>-F/--force</option> will cause &repmgr; to continue by promoting
|
||||||
|
the standby to be the new primary, and if <option>--siblings-follow</option> is
|
||||||
|
specified, attach any other standbys to the new primary.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--force-rewind[=/path/to/pg_rewind]</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Use <application>pg_rewind</application> to reintegrate the old primary if necessary
|
||||||
|
(and the prerequisites for using <application>pg_rewind</application> are met).
|
||||||
|
If using PostgreSQL 9.3 or 9.4, and the <application>pg_rewind</application>
|
||||||
|
binary is not installed in the PostgreSQL <filename>bin</filename> directory,
|
||||||
|
provide its full path. For more details see also <xref linkend="switchover-pg-rewind">.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>-R</option></term>
|
||||||
|
<term><option>--remote-user</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
System username for remote SSH operations (defaults to local system user).
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--repmgrd-no-pause</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Don't pause <application>repmgrd</application> while executing a switchover.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
This option should not be used unless you take steps by other means
|
||||||
|
to ensure <application>repmgrd</application> is paused or not
|
||||||
|
running on all nodes.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--siblings-follow</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Have standbys attached to the old primary follow the new primary.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
</variablelist>
|
||||||
|
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Configuration file settings</title>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
Note that following parameters in <filename>repmgr.conf</filename> are relevant to the
|
||||||
|
switchover operation:
|
||||||
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<literal>replication_lag_critical</literal>:
|
||||||
|
if replication lag (in seconds) on the standby exceeds this value, the
|
||||||
|
switchover will be aborted (unless the <literal>-F/--force</literal> option
|
||||||
|
is provided)
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<literal>shutdown_check_timeout</literal>: maximum number of seconds to wait for the
|
||||||
|
demotion candidate (current primary) to shut down, before aborting the switchover.
|
||||||
|
</simpara>
|
||||||
|
<simpara>
|
||||||
|
Note that this parameter is set on the node where <command>repmgr standby switchover</command>
|
||||||
|
is executed (promotion candidate); setting it on the demotion candidate (former primary) will
|
||||||
|
have no effect.
|
||||||
|
</simpara>
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
In versions prior to <link linkend="release-4.2">&repmgr; 4.2</link>, <command>repmgr standby switchover</command> would
|
||||||
|
use the values defined in <literal>reconnect_attempts</literal> and <literal>reconnect_interval</literal>
|
||||||
|
to determine the timeout for demotion candidate shutdown.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<literal>standby_reconnect_timeout</literal>:
|
||||||
|
maximum number of seconds to attempt to wait for the demotion candidate (former primary)
|
||||||
|
to reconnect to the promoted primary (default: 60 seconds)
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
</itemizedlist>
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Execution</title>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
Execute with the <literal>--dry-run</literal> option to test the switchover as far as
|
||||||
|
possible without actually changing the status of either node.
|
||||||
|
</para>
|
||||||
|
<important>
|
||||||
|
<para>
|
||||||
|
<application>repmgrd</application> must be shut down on all nodes while a switchover is being
|
||||||
|
executed. This restriction will be removed in a future &repmgr; version.
|
||||||
|
</para>
|
||||||
|
</important>
|
||||||
|
<para>
|
||||||
|
External database connections, e.g. from an application, should not be permitted while
|
||||||
|
the switchover is taking place. In particular, active transactions on the primary
|
||||||
|
can potentially disrupt the shutdown process.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1 id="repmgr-standby-switchover-events">
|
||||||
|
<title>Event notifications</title>
|
||||||
|
<para>
|
||||||
|
<literal>standby_switchover</literal> and <literal>standby_promote</literal>
|
||||||
|
<link linkend="event-notifications">event notifications</link> will be generated for the new primary,
|
||||||
|
and a <literal>node_rejoin</literal> event notification for the former primary (new standby).
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
If using an event notification script, <literal>standby_switchover</literal>
|
||||||
|
will populate the placeholder parameter <literal>%p</literal> with the node ID of
|
||||||
|
the former primary.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Exit codes</title>
|
||||||
|
<para>
|
||||||
|
Following exit codes can be emitted by <command>repmgr standby switchover</command>:
|
||||||
|
</para>
|
||||||
|
<variablelist>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>SUCCESS (0)</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
The switchover completed successfully.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>ERR_SWITCHOVER_FAIL (18)</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
The switchover could not be executed.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>ERR_SWITCHOVER_INCOMPLETE (22)</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
The switchover was executed but a problem was encountered.
|
||||||
|
Typically this means the former primary could not be reattached
|
||||||
|
as a standby. Check preceding log messages for more information.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
</variablelist>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>See also</title>
|
||||||
|
<para>
|
||||||
|
For more details see the section <xref linkend="performing-switchover">.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
</refentry>
|
||||||
|
|||||||
@@ -1,29 +1,70 @@
|
|||||||
<chapter id="repmgr-standby-unregister" xreflabel="repmgr standby unregister">
|
<refentry id="repmgr-standby-unregister">
|
||||||
<indexterm><primary>repmgr standby unregister</primary></indexterm>
|
<indexterm>
|
||||||
<title>repmgr standby unregister</title>
|
<primary>repmgr standby unregister</primary>
|
||||||
<para>
|
</indexterm>
|
||||||
Unregisters a standby with `repmgr`. This command does not affect the actual
|
|
||||||
replication, just removes the standby's entry from the &repmgr; metadata.
|
<refmeta>
|
||||||
</para>
|
<refentrytitle>repmgr standby unregister</refentrytitle>
|
||||||
<para>
|
</refmeta>
|
||||||
To unregister a running standby, execute:
|
|
||||||
<programlisting>
|
<refnamediv>
|
||||||
repmgr standby unregister -f /etc/repmgr.conf</programlisting>
|
<refname>repmgr standby unregister</refname>
|
||||||
</para>
|
<refpurpose>remove a standby's information from the &repmgr; metadata</refpurpose>
|
||||||
<para>
|
</refnamediv>
|
||||||
This will remove the standby record from &repmgr;'s internal metadata
|
|
||||||
table (<literal>repmgr.nodes</literal>). A <literal>standby_unregister</literal>
|
<refsect1>
|
||||||
event notification will be recorded in the <literal>repmgr.events</literal> table.
|
<title>Description</title>
|
||||||
</para>
|
<para>
|
||||||
<para>
|
Unregisters a standby with &repmgr;. This command does not affect the actual
|
||||||
If the standby is not running, the command can be executed on another
|
replication, just removes the standby's entry from the &repmgr; metadata.
|
||||||
node by providing the id of the node to be unregistered using
|
</para>
|
||||||
the command line parameter <literal>--node-id</literal>, e.g. executing the following
|
</refsect1>
|
||||||
command on the master server will unregister the standby with
|
|
||||||
id <literal>3</literal>:
|
<refsect1>
|
||||||
<programlisting>
|
<title>Execution</title>
|
||||||
repmgr standby unregister -f /etc/repmgr.conf --node-id=3
|
<para>
|
||||||
</programlisting>
|
To unregister a running standby, execute:
|
||||||
</para>
|
<programlisting>
|
||||||
</chapter>
|
repmgr standby unregister -f /etc/repmgr.conf</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
This will remove the standby record from &repmgr;'s internal metadata
|
||||||
|
table (<literal>repmgr.nodes</literal>). A <literal>standby_unregister</literal>
|
||||||
|
event notification will be recorded in the <literal>repmgr.events</literal> table.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
If the standby is not running, the command can be executed on another
|
||||||
|
node by providing the id of the node to be unregistered using
|
||||||
|
the command line parameter <literal>--node-id</literal>, e.g. executing the following
|
||||||
|
command on the primary server will unregister the standby with
|
||||||
|
id <literal>3</literal>:
|
||||||
|
<programlisting>
|
||||||
|
repmgr standby unregister -f /etc/repmgr.conf --node-id=3</programlisting>
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Options</title>
|
||||||
|
<variablelist>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--node-id</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
<varname>node_id</varname> of the node to unregister (optional)
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
</variablelist>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1 id="repmgr-standby-unregister-events">
|
||||||
|
<title>Event notifications</title>
|
||||||
|
<para>
|
||||||
|
A <literal>standby_unregister</literal> <link linkend="event-notifications">event notification</link> will be generated.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
</refentry>
|
||||||
|
|
||||||
|
|||||||
60
doc/repmgr-witness-register.sgml
Normal file
60
doc/repmgr-witness-register.sgml
Normal file
@@ -0,0 +1,60 @@
|
|||||||
|
<refentry id="repmgr-witness-register">
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgr witness register</primary>
|
||||||
|
<seealso>witness server</seealso>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<refmeta>
|
||||||
|
<refentrytitle>repmgr witness register</refentrytitle>
|
||||||
|
</refmeta>
|
||||||
|
|
||||||
|
<refnamediv>
|
||||||
|
<refname>repmgr witness register</refname>
|
||||||
|
<refpurpose>add a witness node's information to the &repmgr; metadata</refpurpose>
|
||||||
|
</refnamediv>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Description</title>
|
||||||
|
<para>
|
||||||
|
<command>repmgr witness register</command> adds a witness server's node
|
||||||
|
record to the &repmgr; metadata, and if necessary initialises the witness
|
||||||
|
node by installing the &repmgr; extension and copying the &repmgr; metadata
|
||||||
|
to the witness server. This command needs to be executed to enable
|
||||||
|
use of the witness server with <application>repmgrd</application>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
When executing <command>repmgr witness register</command>, connection information
|
||||||
|
for the cluster primary server must also be provided. &repmgr; will automatically
|
||||||
|
use the <varname>user</varname> and <varname>dbname</varname> values defined
|
||||||
|
in the <varname>conninfo</varname> string defined in the witness node's
|
||||||
|
<filename>repmgr.conf</filename>, if these are not explicitly provided.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Execute with the <literal>--dry-run</literal> option to check what would happen
|
||||||
|
without actually registering the witness server.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
<refsect1>
|
||||||
|
<title>Example</title>
|
||||||
|
<para>
|
||||||
|
<programlisting>
|
||||||
|
$ repmgr -f /etc/repmgr.conf witness register -h node1
|
||||||
|
INFO: connecting to witness node "node3" (ID: 3)
|
||||||
|
INFO: connecting to primary node
|
||||||
|
NOTICE: attempting to install extension "repmgr"
|
||||||
|
NOTICE: "repmgr" extension successfully installed
|
||||||
|
INFO: witness registration complete
|
||||||
|
NOTICE: witness node "node3" (ID: 3) successfully registered
|
||||||
|
</programlisting>
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
|
||||||
|
<refsect1 id="repmgr-witness-register-events">
|
||||||
|
<title>Event notifications</title>
|
||||||
|
<para>
|
||||||
|
A <literal>witness_register</literal> <link linkend="event-notifications">event notification</link> will be generated.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
</refentry>
|
||||||
102
doc/repmgr-witness-unregister.sgml
Normal file
102
doc/repmgr-witness-unregister.sgml
Normal file
@@ -0,0 +1,102 @@
|
|||||||
|
<refentry id="repmgr-witness-unregister" xreflabel="repmgr witness unregister">
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgr witness unregister</primary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<refmeta>
|
||||||
|
<refentrytitle>repmgr witness unregister</refentrytitle>
|
||||||
|
</refmeta>
|
||||||
|
|
||||||
|
<refnamediv>
|
||||||
|
<refname>repmgr witness unregister</refname>
|
||||||
|
<refpurpose>remove a witness node's information to the &repmgr; metadata</refpurpose>
|
||||||
|
</refnamediv>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Description</title>
|
||||||
|
<para>
|
||||||
|
<command>repmgr witness unregister</command> removes a witness server's node
|
||||||
|
record from the &repmgr; metadata.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
The node does not have to be running to be unregistered, however if this is the
|
||||||
|
case then either provide connection information for the primary server, or
|
||||||
|
execute <command>repmgr witness unregister</command> on a running node and
|
||||||
|
provide the parameter <option>--node-id</option> with the node ID of the
|
||||||
|
witness server.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Execute with the <literal>--dry-run</literal> option to check what would happen
|
||||||
|
without actually registering the witness server.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
<refsect1>
|
||||||
|
<title>Examples</title>
|
||||||
|
<para>
|
||||||
|
Unregistering a running witness node:
|
||||||
|
<programlisting>
|
||||||
|
$ repmgr -f /etc/repmgr.conf witness unregister
|
||||||
|
INFO: connecting to witness node "node3" (ID: 3)
|
||||||
|
INFO: unregistering witness node 3
|
||||||
|
INFO: witness unregistration complete
|
||||||
|
DETAIL: witness node with UD 3 successfully unregistered</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Unregistering a non-running witness node:
|
||||||
|
<programlisting>
|
||||||
|
$ repmgr -f /etc/repmgr.conf witness unregister -h node1 -p 5501 -F
|
||||||
|
INFO: connecting to node "node3" (ID: 3)
|
||||||
|
NOTICE: unable to connect to node "node3" (ID: 3), removing node record on cluster primary only
|
||||||
|
INFO: unregistering witness node 3
|
||||||
|
INFO: witness unregistration complete
|
||||||
|
DETAIL: witness node with id ID 3 successfully unregistered</programlisting>
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
<title>Notes</title>
|
||||||
|
<para>
|
||||||
|
This command will not make any changes to the witness node itself and will neither
|
||||||
|
remove any data from the witness database nor stop the PostgreSQL instance.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
A witness node which has been unregistered, can be re-registered with
|
||||||
|
<link linkend="repmgr-witness-register">repmgr witness register --force</link>.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
<refsect1>
|
||||||
|
|
||||||
|
<title>Options</title>
|
||||||
|
<variablelist>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--dry-run</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Check prerequisites but don't actually unregister the witness.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>--node-id</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
Unregister witness server with the specified node ID.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
</variablelist>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
|
||||||
|
<refsect1 id="repmgr-witness-unregister-events">
|
||||||
|
<title>Event notifications</title>
|
||||||
|
<para>
|
||||||
|
A <literal>witness_unregister</literal> <link linkend="event-notifications">event notification</link> will be generated.
|
||||||
|
</para>
|
||||||
|
</refsect1>
|
||||||
|
|
||||||
|
</refentry>
|
||||||
@@ -23,13 +23,13 @@
|
|||||||
|
|
||||||
<abstract>
|
<abstract>
|
||||||
<para>
|
<para>
|
||||||
Thisis the official documentation of &repmgr; &repmgrversion; for
|
This is the official documentation of &repmgr; &repmgrversion; for
|
||||||
use with PostgreSQL 9.3 - PostgreSQL 10.
|
use with PostgreSQL 9.3 - PostgreSQL 10.
|
||||||
It describes the functionality supported by the current version of &repmgr;.
|
It describes the functionality supported by the current version of &repmgr;.
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
repmgr was developed by
|
&repmgr; was developed by
|
||||||
<ulink url="https://2ndquadrant.com">2ndQuadrant</ulink>
|
<ulink url="https://2ndquadrant.com">2ndQuadrant</ulink>
|
||||||
along with contributions from other individuals and companies.
|
along with contributions from other individuals and companies.
|
||||||
Contributions from the community are appreciated and welcome - get
|
Contributions from the community are appreciated and welcome - get
|
||||||
@@ -73,6 +73,7 @@
|
|||||||
&promoting-standby;
|
&promoting-standby;
|
||||||
&follow-new-primary;
|
&follow-new-primary;
|
||||||
&switchover;
|
&switchover;
|
||||||
|
&configuring-witness-server;
|
||||||
&event-notifications;
|
&event-notifications;
|
||||||
&upgrading-repmgr;
|
&upgrading-repmgr;
|
||||||
</part>
|
</part>
|
||||||
@@ -84,8 +85,11 @@
|
|||||||
&repmgrd-demonstration;
|
&repmgrd-demonstration;
|
||||||
&repmgrd-cascading-replication;
|
&repmgrd-cascading-replication;
|
||||||
&repmgrd-network-split;
|
&repmgrd-network-split;
|
||||||
|
&repmgrd-witness-server;
|
||||||
|
&repmgrd-pausing;
|
||||||
&repmgrd-degraded-monitoring;
|
&repmgrd-degraded-monitoring;
|
||||||
&repmgrd-monitoring;
|
&repmgrd-monitoring;
|
||||||
|
&repmgrd-bdr;
|
||||||
</part>
|
</part>
|
||||||
|
|
||||||
<part id="repmgr-command-reference">
|
<part id="repmgr-command-reference">
|
||||||
@@ -99,6 +103,8 @@
|
|||||||
&repmgr-standby-promote;
|
&repmgr-standby-promote;
|
||||||
&repmgr-standby-follow;
|
&repmgr-standby-follow;
|
||||||
&repmgr-standby-switchover;
|
&repmgr-standby-switchover;
|
||||||
|
&repmgr-witness-register;
|
||||||
|
&repmgr-witness-unregister;
|
||||||
&repmgr-node-status;
|
&repmgr-node-status;
|
||||||
&repmgr-node-check;
|
&repmgr-node-check;
|
||||||
&repmgr-node-rejoin;
|
&repmgr-node-rejoin;
|
||||||
@@ -107,9 +113,15 @@
|
|||||||
&repmgr-cluster-crosscheck;
|
&repmgr-cluster-crosscheck;
|
||||||
&repmgr-cluster-event;
|
&repmgr-cluster-event;
|
||||||
&repmgr-cluster-cleanup;
|
&repmgr-cluster-cleanup;
|
||||||
|
&repmgr-daemon-status;
|
||||||
|
&repmgr-daemon-pause;
|
||||||
|
&repmgr-daemon-unpause;
|
||||||
</part>
|
</part>
|
||||||
|
|
||||||
|
&appendix-release-notes;
|
||||||
&appendix-signatures;
|
&appendix-signatures;
|
||||||
|
&appendix-faq;
|
||||||
|
&appendix-packages;
|
||||||
|
|
||||||
<![%include-index;[&bookindex;]]>
|
<![%include-index;[&bookindex;]]>
|
||||||
<![%include-xslt-index;[<index id="bookindex"></index>]]>
|
<![%include-xslt-index;[<index id="bookindex"></index>]]>
|
||||||
|
|||||||
@@ -1,8 +1,13 @@
|
|||||||
<chapter id="repmgrd-automatic-failover" xreflabel="Automatic failover with repmgrd">
|
<chapter id="repmgrd-automatic-failover" xreflabel="Automatic failover with repmgrd">
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgrd</primary>
|
||||||
|
<secondary>automatic failover</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
<title>Automatic failover with repmgrd</title>
|
<title>Automatic failover with repmgrd</title>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
<command>repmgrd</command> is a management and monitoring daemon which runs
|
<application>repmgrd</application> is a management and monitoring daemon which runs
|
||||||
on each node in a replication cluster. It can automate actions such as
|
on each node in a replication cluster. It can automate actions such as
|
||||||
failover and updating standbys to follow the new primary, as well as
|
failover and updating standbys to follow the new primary, as well as
|
||||||
providing monitoring information about the state of each standby.
|
providing monitoring information about the state of each standby.
|
||||||
|
|||||||
415
doc/repmgrd-bdr.sgml
Normal file
415
doc/repmgrd-bdr.sgml
Normal file
@@ -0,0 +1,415 @@
|
|||||||
|
<chapter id="repmgrd-bdr">
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgrd</primary>
|
||||||
|
<secondary>BDR</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<indexterm>
|
||||||
|
<primary>BDR</primary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<title>BDR failover with repmgrd</title>
|
||||||
|
<para>
|
||||||
|
&repmgr; 4.x provides support for monitoring BDR nodes and taking action in
|
||||||
|
case one of the nodes fails.
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<simpara>
|
||||||
|
Due to the nature of BDR 1.x/2.x, it's only safe to use this solution for
|
||||||
|
a two-node scenario. Introducing additional nodes will create an inherent
|
||||||
|
risk of node desynchronisation if a node goes down without being cleanly
|
||||||
|
removed from the cluster.
|
||||||
|
</simpara>
|
||||||
|
</note>
|
||||||
|
<para>
|
||||||
|
In contrast to streaming replication, there's no concept of "promoting" a new
|
||||||
|
primary node with BDR. Instead, "failover" involves monitoring both nodes
|
||||||
|
with <application>repmgrd</application> and redirecting queries from the failed node to the remaining
|
||||||
|
active node. This can be done by using an
|
||||||
|
<link linkend="event-notifications">event notification</link> script
|
||||||
|
which is called by <application>repmgrd</application> to dynamically
|
||||||
|
reconfigure a proxy server/connection pooler such as <application>PgBouncer</application>.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<sect1 id="bdr-prerequisites" xreflabel="BDR prequisites">
|
||||||
|
<title>Prerequisites</title>
|
||||||
|
<para>
|
||||||
|
&repmgr; 4 requires PostgreSQL 9.4 or 9.6 with the BDR 2 extension
|
||||||
|
enabled and configured for a two-node BDR network. &repmgr; 4 packages
|
||||||
|
must be installed on each node before attempting to configure
|
||||||
|
<application>repmgr</application>.
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<simpara>
|
||||||
|
&repmgr; 4 will refuse to install if it detects more than two BDR nodes.
|
||||||
|
</simpara>
|
||||||
|
</note>
|
||||||
|
<para>
|
||||||
|
Application database connections *must* be passed through a proxy server/
|
||||||
|
connection pooler such as <application>PgBouncer</application>, and it must be possible to dynamically
|
||||||
|
reconfigure that from <application>repmgrd</application>. The example demonstrated in this document
|
||||||
|
will use <application>PgBouncer</application>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
The proxy server / connection poolers must <emphasis>not</emphasis>
|
||||||
|
be installed on the database servers.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
For this example, it's assumed password-less SSH connections are available
|
||||||
|
from the PostgreSQL servers to the servers where <application>PgBouncer</application>
|
||||||
|
runs, and that the user on those servers has permission to alter the
|
||||||
|
<application>PgBouncer</application> configuration files.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
PostgreSQL connections must be possible between each node, and each node
|
||||||
|
must be able to connect to each PgBouncer instance.
|
||||||
|
</para>
|
||||||
|
</sect1>
|
||||||
|
|
||||||
|
<sect1 id="bdr-configuration" xreflabel="BDR configuration">
|
||||||
|
<title>Configuration</title>
|
||||||
|
<para>
|
||||||
|
A sample configuration for <filename>repmgr.conf</filename> on each
|
||||||
|
BDR node would look like this:
|
||||||
|
<programlisting>
|
||||||
|
# Node information
|
||||||
|
node_id=1
|
||||||
|
node_name='node1'
|
||||||
|
conninfo='host=node1 dbname=bdrtest user=repmgr connect_timeout=2'
|
||||||
|
data_directory='/var/lib/postgresql/data'
|
||||||
|
replication_type='bdr'
|
||||||
|
|
||||||
|
# Event notification configuration
|
||||||
|
event_notifications=bdr_failover
|
||||||
|
event_notification_command='/path/to/bdr-pgbouncer.sh %n %e %s "%c" "%a" >> /tmp/bdr-failover.log 2>&1'
|
||||||
|
|
||||||
|
# repmgrd options
|
||||||
|
monitor_interval_secs=5
|
||||||
|
reconnect_attempts=6
|
||||||
|
reconnect_interval=5</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Adjust settings as appropriate; copy and adjust for the second node (particularly
|
||||||
|
the values <varname>node_id</varname>, <varname>node_name</varname>
|
||||||
|
and <varname>conninfo</varname>).
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Note that the values provided for the <varname>conninfo</varname> string
|
||||||
|
must be valid for connections from <emphasis>both</emphasis> nodes in the
|
||||||
|
replication cluster. The database must be the BDR-enabled database.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
If defined, the <varname>event_notifications</varname> parameter will restrict
|
||||||
|
execution of the script defined in <varname>event_notification_command</varname>
|
||||||
|
to the specified event(s).
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<simpara>
|
||||||
|
<varname>event_notification_command</varname> is the script which does the actual "heavy lifting"
|
||||||
|
of reconfiguring the proxy server/ connection pooler. It is fully
|
||||||
|
user-definable; see section <xref linkend="bdr-event-notification-command"> for a reference
|
||||||
|
implementation.
|
||||||
|
</simpara>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
</sect1>
|
||||||
|
|
||||||
|
<sect1 id="bdr-repmgr-setup" xreflabel="repmgr setup with BDR">
|
||||||
|
<title>repmgr setup</title>
|
||||||
|
<para>
|
||||||
|
Register both nodes; example on <literal>node1</literal>:
|
||||||
|
<programlisting>
|
||||||
|
$ repmgr -f /etc/repmgr.conf bdr register
|
||||||
|
NOTICE: attempting to install extension "repmgr"
|
||||||
|
NOTICE: "repmgr" extension successfully installed
|
||||||
|
NOTICE: node record created for node 'node1' (ID: 1)
|
||||||
|
NOTICE: BDR node 1 registered (conninfo: host=node1 dbname=bdrtest user=repmgr)</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
and on <literal>node1</literal>:
|
||||||
|
<programlisting>
|
||||||
|
$ repmgr -f /etc/repmgr.conf bdr register
|
||||||
|
NOTICE: node record created for node 'node2' (ID: 2)
|
||||||
|
NOTICE: BDR node 2 registered (conninfo: host=node2 dbname=bdrtest user=repmgr)</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
The <literal>repmgr</literal> extension will be automatically created
|
||||||
|
when the first node is registered, and will be propagated to the second
|
||||||
|
node.
|
||||||
|
</para>
|
||||||
|
<important>
|
||||||
|
<simpara>
|
||||||
|
Ensure the &repmgr; package is available on both nodes before
|
||||||
|
attempting to register the first node.
|
||||||
|
</simpara>
|
||||||
|
</important>
|
||||||
|
<para>
|
||||||
|
At this point the meta data for both nodes has been created; executing
|
||||||
|
<xref linkend="repmgr-cluster-show"> (on either node) should produce output like this:
|
||||||
|
<programlisting>
|
||||||
|
$ repmgr -f /etc/repmgr.conf cluster show
|
||||||
|
ID | Name | Role | Status | Upstream | Location | Connection string
|
||||||
|
----+-------+------+-----------+----------+--------------------------------------------------------
|
||||||
|
1 | node1 | bdr | * running | | default | host=node1 dbname=bdrtest user=repmgr connect_timeout=2
|
||||||
|
2 | node2 | bdr | * running | | default | host=node2 dbname=bdrtest user=repmgr connect_timeout=2</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Additionally it's possible to display log of significant events; executing
|
||||||
|
<xref linkend="repmgr-cluster-event"> (on either node) should produce output like this:
|
||||||
|
<programlisting>
|
||||||
|
$ repmgr -f /etc/repmgr.conf cluster event
|
||||||
|
Node ID | Event | OK | Timestamp | Details
|
||||||
|
---------+--------------+----+---------------------+----------------------------------------------
|
||||||
|
2 | bdr_register | t | 2017-07-27 17:51:48 | node record created for node 'node2' (ID: 2)
|
||||||
|
1 | bdr_register | t | 2017-07-27 17:51:00 | node record created for node 'node1' (ID: 1)
|
||||||
|
</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
At this point there will only be records for the two node registrations (displayed here
|
||||||
|
in reverse chronological order).
|
||||||
|
</para>
|
||||||
|
</sect1>
|
||||||
|
|
||||||
|
<sect1 id="bdr-event-notification-command" xreflabel="Defining the BDR failover "event_notification command"">
|
||||||
|
<title>Defining the BDR failover "event_notification_command"</title>
|
||||||
|
<para>
|
||||||
|
Key to "failover" execution is the <literal>event_notification_command</literal>,
|
||||||
|
which is a user-definable script specified in <filename>repmpgr.conf</filename>
|
||||||
|
and which can use a &repmgr; <link linkend="event-notifications">event notification</link>
|
||||||
|
to reconfigure the proxy server / connection pooler so it points to the other, still-active node.
|
||||||
|
Details of the event will be passed as parameters to the script.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Following parameter placeholders are available for the script definition in <filename>repmpgr.conf</filename>;
|
||||||
|
these will be replaced with the appropriate value when the script is executed:
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<variablelist>
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>%n</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
node ID
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>%e</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
event type
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>%t</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
success (1 or 0)
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>%t</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
timestamp
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>%d</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
details
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>%c</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
conninfo string of the next available node (<varname>bdr_failover</varname> and <varname>bdr_recovery</varname>)
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
<varlistentry>
|
||||||
|
<term><option>%a</option></term>
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
name of the next available node (<varname>bdr_failover</varname> and <varname>bdr_recovery</varname>)
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
</varlistentry>
|
||||||
|
</variablelist>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
Note that <literal>%c</literal> and <literal>%a</literal> are only provided with
|
||||||
|
particular failover events, in this case <varname>bdr_failover</varname>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
The provided sample script
|
||||||
|
(<literal><ulink url="https://raw.githubusercontent.com/2ndQuadrant/repmgr/master/scripts/bdr-pgbouncer.sh">scripts/bdr-pgbouncer.sh</ulink></literal>)
|
||||||
|
is configured as follows:
|
||||||
|
<programlisting>
|
||||||
|
event_notification_command='/path/to/bdr-pgbouncer.sh %n %e %s "%c" "%a"'</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
and parses the placeholder parameters like this:
|
||||||
|
<programlisting>
|
||||||
|
NODE_ID=$1
|
||||||
|
EVENT_TYPE=$2
|
||||||
|
SUCCESS=$3
|
||||||
|
NEXT_CONNINFO=$4
|
||||||
|
NEXT_NODE_NAME=$5</programlisting>
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
The sample script also contains some hard-coded values for the <application>PgBouncer</application>
|
||||||
|
configuration for both nodes; these will need to be adjusted for your local environment
|
||||||
|
(ideally the scripts would be maintained as templates and generated by some
|
||||||
|
kind of provisioning system).
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
The script performs following steps:
|
||||||
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
|
<listitem>
|
||||||
|
<simpara>pauses <application>PgBouncer</application> on all nodes</simpara>
|
||||||
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara>recreates the <application>PgBouncer</application> configuration file on each
|
||||||
|
node using the information provided by <application>repmgrd</application>
|
||||||
|
(primarily the <varname>conninfo</varname> string) to configure
|
||||||
|
<application>PgBouncer</application></simpara>
|
||||||
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara>reloads the <application>PgBouncer</application> configuration</simpara>
|
||||||
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara>executes the <command>RESUME</command> command (in <application>PgBouncer</application>)</simpara>
|
||||||
|
</listitem>
|
||||||
|
</itemizedlist>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Following successful script execution, any connections to PgBouncer on the failed BDR node
|
||||||
|
will be redirected to the active node.
|
||||||
|
</para>
|
||||||
|
</sect1>
|
||||||
|
|
||||||
|
<sect1 id="bdr-monitoring-failover" xreflabel="Node monitoring and failover">
|
||||||
|
<title>Node monitoring and failover</title>
|
||||||
|
<para>
|
||||||
|
At the intervals specified by <varname>monitor_interval_secs</varname>
|
||||||
|
in <filename>repmgr.conf</filename>, <application>repmgrd</application>
|
||||||
|
will ping each node to check if it's available. If a node isn't available,
|
||||||
|
<application>repmgrd</application> will enter failover mode and check <varname>reconnect_attempts</varname>
|
||||||
|
times at intervals of <varname>reconnect_interval</varname> to confirm the node is definitely unreachable.
|
||||||
|
This buffer period is necessary to avoid false positives caused by transient
|
||||||
|
network outages.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
If the node is still unavailable, <application>repmgrd</application> will enter failover mode and execute
|
||||||
|
the script defined in <varname>event_notification_command</varname>; an entry will be logged
|
||||||
|
in the <literal>repmgr.events</literal> table and <application>repmgrd</application> will
|
||||||
|
(unless otherwise configured) resume monitoring of the node in "degraded" mode until it reappears.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
<application>repmgrd</application> logfile output during a failover event will look something like this
|
||||||
|
on one node (usually the node which has failed, here <literal>node2</literal>):
|
||||||
|
<programlisting>
|
||||||
|
...
|
||||||
|
[2017-07-27 21:08:39] [INFO] starting continuous BDR node monitoring
|
||||||
|
[2017-07-27 21:08:39] [INFO] monitoring BDR replication status on node "node2" (ID: 2)
|
||||||
|
[2017-07-27 21:08:55] [INFO] monitoring BDR replication status on node "node2" (ID: 2)
|
||||||
|
[2017-07-27 21:09:11] [INFO] monitoring BDR replication status on node "node2" (ID: 2)
|
||||||
|
[2017-07-27 21:09:23] [WARNING] unable to connect to node node2 (ID 2)
|
||||||
|
[2017-07-27 21:09:23] [INFO] checking state of node 2, 0 of 5 attempts
|
||||||
|
[2017-07-27 21:09:23] [INFO] sleeping 1 seconds until next reconnection attempt
|
||||||
|
[2017-07-27 21:09:24] [INFO] checking state of node 2, 1 of 5 attempts
|
||||||
|
[2017-07-27 21:09:24] [INFO] sleeping 1 seconds until next reconnection attempt
|
||||||
|
[2017-07-27 21:09:25] [INFO] checking state of node 2, 2 of 5 attempts
|
||||||
|
[2017-07-27 21:09:25] [INFO] sleeping 1 seconds until next reconnection attempt
|
||||||
|
[2017-07-27 21:09:26] [INFO] checking state of node 2, 3 of 5 attempts
|
||||||
|
[2017-07-27 21:09:26] [INFO] sleeping 1 seconds until next reconnection attempt
|
||||||
|
[2017-07-27 21:09:27] [INFO] checking state of node 2, 4 of 5 attempts
|
||||||
|
[2017-07-27 21:09:27] [INFO] sleeping 1 seconds until next reconnection attempt
|
||||||
|
[2017-07-27 21:09:28] [WARNING] unable to reconnect to node 2 after 5 attempts
|
||||||
|
[2017-07-27 21:09:28] [NOTICE] setting node record for node 2 to inactive
|
||||||
|
[2017-07-27 21:09:28] [INFO] executing notification command for event "bdr_failover"
|
||||||
|
[2017-07-27 21:09:28] [DETAIL] command is:
|
||||||
|
/path/to/bdr-pgbouncer.sh 2 bdr_failover 1 "host=host=node1 dbname=bdrtest user=repmgr connect_timeout=2" "node1"
|
||||||
|
[2017-07-27 21:09:28] [INFO] node 'node2' (ID: 2) detected as failed; next available node is 'node1' (ID: 1)
|
||||||
|
[2017-07-27 21:09:28] [INFO] monitoring BDR replication status on node "node2" (ID: 2)
|
||||||
|
[2017-07-27 21:09:28] [DETAIL] monitoring node "node2" (ID: 2) in degraded mode
|
||||||
|
...</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Output on the other node (<literal>node1</literal>) during the same event will look like this:
|
||||||
|
<programlisting>
|
||||||
|
...
|
||||||
|
[2017-07-27 21:08:35] [INFO] starting continuous BDR node monitoring
|
||||||
|
[2017-07-27 21:08:35] [INFO] monitoring BDR replication status on node "node1" (ID: 1)
|
||||||
|
[2017-07-27 21:08:51] [INFO] monitoring BDR replication status on node "node1" (ID: 1)
|
||||||
|
[2017-07-27 21:09:07] [INFO] monitoring BDR replication status on node "node1" (ID: 1)
|
||||||
|
[2017-07-27 21:09:23] [WARNING] unable to connect to node node2 (ID 2)
|
||||||
|
[2017-07-27 21:09:23] [INFO] checking state of node 2, 0 of 5 attempts
|
||||||
|
[2017-07-27 21:09:23] [INFO] sleeping 1 seconds until next reconnection attempt
|
||||||
|
[2017-07-27 21:09:24] [INFO] checking state of node 2, 1 of 5 attempts
|
||||||
|
[2017-07-27 21:09:24] [INFO] sleeping 1 seconds until next reconnection attempt
|
||||||
|
[2017-07-27 21:09:25] [INFO] checking state of node 2, 2 of 5 attempts
|
||||||
|
[2017-07-27 21:09:25] [INFO] sleeping 1 seconds until next reconnection attempt
|
||||||
|
[2017-07-27 21:09:26] [INFO] checking state of node 2, 3 of 5 attempts
|
||||||
|
[2017-07-27 21:09:26] [INFO] sleeping 1 seconds until next reconnection attempt
|
||||||
|
[2017-07-27 21:09:27] [INFO] checking state of node 2, 4 of 5 attempts
|
||||||
|
[2017-07-27 21:09:27] [INFO] sleeping 1 seconds until next reconnection attempt
|
||||||
|
[2017-07-27 21:09:28] [WARNING] unable to reconnect to node 2 after 5 attempts
|
||||||
|
[2017-07-27 21:09:28] [NOTICE] other node's repmgrd is handling failover
|
||||||
|
[2017-07-27 21:09:28] [INFO] monitoring BDR replication status on node "node1" (ID: 1)
|
||||||
|
[2017-07-27 21:09:28] [DETAIL] monitoring node "node2" (ID: 2) in degraded mode
|
||||||
|
...</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
This assumes only the PostgreSQL instance on <literal>node2</literal> has failed. In this case the
|
||||||
|
<application>repmgrd</application> instance running on <literal>node2</literal> has performed the failover. However if
|
||||||
|
the entire server becomes unavailable, <application>repmgrd</application> on <literal>node1</literal> will perform
|
||||||
|
the failover.
|
||||||
|
</para>
|
||||||
|
</sect1>
|
||||||
|
<sect1 id="bdr-node-recovery" xreflabel="Node recovery">
|
||||||
|
<title>Node recovery</title>
|
||||||
|
<para>
|
||||||
|
Following failure of a BDR node, if the node subsequently becomes available again,
|
||||||
|
a <varname>bdr_recovery</varname> event will be generated. This could potentially be used to
|
||||||
|
reconfigure PgBouncer automatically to bring the node back into the available pool,
|
||||||
|
however it would be prudent to manually verify the node's status before
|
||||||
|
exposing it to the application.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
If the failed node comes back up and connects correctly, output similar to this
|
||||||
|
will be visible in the <application>repmgrd</application> log:
|
||||||
|
<programlisting>
|
||||||
|
[2017-07-27 21:25:30] [DETAIL] monitoring node "node2" (ID: 2) in degraded mode
|
||||||
|
[2017-07-27 21:25:46] [INFO] monitoring BDR replication status on node "node2" (ID: 2)
|
||||||
|
[2017-07-27 21:25:46] [DETAIL] monitoring node "node2" (ID: 2) in degraded mode
|
||||||
|
[2017-07-27 21:25:55] [INFO] active replication slot for node "node1" found after 1 seconds
|
||||||
|
[2017-07-27 21:25:55] [NOTICE] node "node2" (ID: 2) has recovered after 986 seconds</programlisting>
|
||||||
|
</para>
|
||||||
|
</sect1>
|
||||||
|
|
||||||
|
<sect1 id="bdr-complete-shutdown" xreflabel="Shutdown of both nodes">
|
||||||
|
<title>Shutdown of both nodes</title>
|
||||||
|
<para>
|
||||||
|
If both PostgreSQL instances are shut down, <application>repmgrd</application> will try and handle the
|
||||||
|
situation as gracefully as possible, though with no failover candidates available
|
||||||
|
there's not much it can do. Should this case ever occur, we recommend shutting
|
||||||
|
down <application>repmgrd</application> on both nodes and restarting it once the PostgreSQL instances
|
||||||
|
are running properly.
|
||||||
|
</para>
|
||||||
|
</sect1>
|
||||||
|
</chapter>
|
||||||
|
|
||||||
@@ -1,9 +1,14 @@
|
|||||||
<chapter id="repmgrd-cascading-replication">
|
<chapter id="repmgrd-cascading-replication">
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgrd</primary>
|
||||||
|
<secondary>cascading replication</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
<title>repmgrd and cascading replication</title>
|
<title>repmgrd and cascading replication</title>
|
||||||
<para>
|
<para>
|
||||||
Cascading replication - where a standby can connect to an upstream node and not
|
Cascading replication - where a standby can connect to an upstream node and not
|
||||||
the primary server itself - was introduced in PostgreSQL 9.2. &repmgr; and
|
the primary server itself - was introduced in PostgreSQL 9.2. &repmgr; and
|
||||||
<command>repmgrd</command> support cascading replication by keeping track of the relationship
|
<application>repmgrd</application> support cascading replication by keeping track of the relationship
|
||||||
between standby servers - each node record is stored with the node id of its
|
between standby servers - each node record is stored with the node id of its
|
||||||
upstream ("parent") server (except of course the primary server).
|
upstream ("parent") server (except of course the primary server).
|
||||||
</para>
|
</para>
|
||||||
|
|||||||
@@ -1,54 +1,499 @@
|
|||||||
<chapter id="repmgrd-configuration">
|
<chapter id="repmgrd-configuration">
|
||||||
<title>repmgrd configuration</title>
|
|
||||||
<para>
|
|
||||||
To use <command>repmgrd</command>, its associated function library must be
|
|
||||||
included in <filename>postgresql.conf</filename> with:
|
|
||||||
|
|
||||||
<programlisting>
|
<indexterm>
|
||||||
shared_preload_libraries = 'repmgr'</programlisting>
|
<primary>repmgrd</primary>
|
||||||
</para>
|
<secondary>configuration</secondary>
|
||||||
<para>
|
</indexterm>
|
||||||
Changing this setting requires a restart of PostgreSQL; for more details see
|
|
||||||
the <ulink url="https://www.postgresql.org/docs/current/static/runtime-config-client.html#GUC-SHARED-PRELOAD-LIBRARIES">PostgreSQL documentation</ulink>.
|
<title>repmgrd configuration</title>
|
||||||
</para>
|
|
||||||
<para>
|
<para>
|
||||||
Additionally the following <command>repmgrd</command> options *must* be set in
|
<application>repmgrd</application> is a daemon which runs on each PostgreSQL node,
|
||||||
<filename>repmgr.conf</filename> (adjust configuration file locations as appropriate):
|
monitoring the local node, and (unless it's the primary node) the upstream server
|
||||||
<programlisting>
|
(the primary server or with cascading replication, another standby) which it's
|
||||||
failover=automatic
|
connected to.
|
||||||
promote_command='repmgr standby promote -f /etc/repmgr.conf --log-to-file'
|
</para>
|
||||||
follow_command='repmgr standby follow -f /etc/repmgr.conf --log-to-file --upstream-node-id=%n'</programlisting>
|
<para>
|
||||||
</para>
|
<application>repmgrd</application> can be configured to provide failover
|
||||||
<para>
|
capability in case the primary upstream node becomes unreachable, and/or
|
||||||
Note that the <literal>--log-to-file</literal> option will cause
|
provide monitoring data to the &repmgr; metadatabase.
|
||||||
output generated by the &repmgr; command, when executed by <command>repmgrd</command>,
|
</para>
|
||||||
to be logged to the same destination configured to receive log output for <command>repmgrd</command>.
|
|
||||||
See <filename>repmgr.conf.sample</filename> for further <command>repmgrd</command>-specific settings.
|
<sect1 id="repmgrd-basic-configuration">
|
||||||
</para>
|
<title>repmgrd basic configuration</title>
|
||||||
<para>
|
|
||||||
When <varname>failover</varname> is set to <literal>automatic</literal>, upon detecting failure
|
<para>
|
||||||
of the current primary, <command>repmgrd</command> will execute one of
|
To use <application>repmgrd</application>, its associated function library <emphasis>must</emphasis> be
|
||||||
<varname>promote_command</varname> or <varname>follow_command</varname>,
|
included via <filename>postgresql.conf</filename> with:
|
||||||
depending on whether the current server is to become the new primary, or
|
|
||||||
needs to follow another server which has become the new primary. Note that
|
<programlisting>
|
||||||
these commands can be any valid shell script which results in one of these
|
shared_preload_libraries = 'repmgr'</programlisting>
|
||||||
two actions happening, but if &repmgr;'s <command>standby follow</command> or
|
</para>
|
||||||
<command>standby promote</command>
|
<para>
|
||||||
commands are not executed (either directly as shown here, or from a script which
|
Changing this setting requires a restart of PostgreSQL; for more details see
|
||||||
performs other actions), the &repmgr; metadata will not be updated and
|
the <ulink url="https://www.postgresql.org/docs/current/static/runtime-config-client.html#GUC-SHARED-PRELOAD-LIBRARIES">PostgreSQL documentation</ulink>.
|
||||||
&repmgr; will no longer function reliably.
|
</para>
|
||||||
</para>
|
|
||||||
<para>
|
|
||||||
The <varname>follow_command</varname> should provide the <literal>--upstream-node-id=%n</literal>
|
<sect2 id="repmgrd-automatic-failover-configuration">
|
||||||
option to <command>repmgr standby follow</command>; the <literal>%n</literal> will be replaced by
|
<title>automatic failover configuration</title>
|
||||||
<command>repmgrd</command> with the ID of the new primary node. If this is not provided, &repmgr;
|
<para>
|
||||||
will attempt to determine the new primary by itself, but if the
|
If using automatic failover, the following <application>repmgrd</application> options *must* be set in
|
||||||
original primary comes back online after the new primary is promoted, there is a risk that
|
<filename>repmgr.conf</filename> :
|
||||||
<command>repmgr standby follow</command> will result in the node continuing to follow
|
<programlisting>
|
||||||
the original primary.
|
failover=automatic
|
||||||
</para>
|
promote_command='/usr/bin/repmgr standby promote -f /etc/repmgr.conf --log-to-file'
|
||||||
<sect1 id="repmgrd-connection-settings">
|
follow_command='/usr/bin/repmgr standby follow -f /etc/repmgr.conf --log-to-file --upstream-node-id=%n'</programlisting>
|
||||||
<title>repmgrd connection settings</title>
|
</para>
|
||||||
|
<para>
|
||||||
|
Adjust file paths as appropriate; alway specify the full path to the &repmgr; binary.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
&repmgr; will not apply <option>pg_bindir</option> when executing <option>promote_command</option>
|
||||||
|
or <option>follow_command</option>; these can be user-defined scripts so must always be
|
||||||
|
specified with the full path.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
Note that the <literal>--log-to-file</literal> option will cause
|
||||||
|
output generated by the &repmgr; command, when executed by <application>repmgrd</application>,
|
||||||
|
to be logged to the same destination configured to receive log output for <application>repmgrd</application>.
|
||||||
|
See <filename><ulink url="https://raw.githubusercontent.com/2ndQuadrant/repmgr/master/repmgr.conf.sample">repmgr.conf.sample</ulink></filename>
|
||||||
|
for further <application>repmgrd</application>-specific settings.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
When <varname>failover</varname> is set to <literal>automatic</literal>, upon detecting failure
|
||||||
|
of the current primary, <application>repmgrd</application> will execute one of:
|
||||||
|
</para>
|
||||||
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>promote_command</varname> (if the current server is to become the new primary)
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>follow_command</varname> (if the current server needs to follow another server which has
|
||||||
|
become the new primary)
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
</itemizedlist>
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
These commands can be any valid shell script which results in one of these
|
||||||
|
two actions happening, but if &repmgr;'s <command>standby follow</command> or
|
||||||
|
<command>standby promote</command>
|
||||||
|
commands are not executed (either directly as shown here, or from a script which
|
||||||
|
performs other actions), the &repmgr; metadata will not be updated and
|
||||||
|
&repmgr; will no longer function reliably.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
The <varname>follow_command</varname> should provide the <literal>--upstream-node-id=%n</literal>
|
||||||
|
option to <command>repmgr standby follow</command>; the <literal>%n</literal> will be replaced by
|
||||||
|
<application>repmgrd</application> with the ID of the new primary node. If this is not provided, &repmgr;
|
||||||
|
will attempt to determine the new primary by itself, but if the
|
||||||
|
original primary comes back online after the new primary is promoted, there is a risk that
|
||||||
|
<command>repmgr standby follow</command> will result in the node continuing to follow
|
||||||
|
the original primary.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="repmgrd-service-configuration">
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgrd</primary>
|
||||||
|
<secondary>PostgreSQL service configuration</secondary>
|
||||||
|
</indexterm>
|
||||||
|
<title>PostgreSQL service configuration</title>
|
||||||
|
<para>
|
||||||
|
If using automatic failover, currently <application>repmgrd</application> will need to execute
|
||||||
|
<link linkend="repmgr-standby-follow"><command>repmgr standby follow</command></link>
|
||||||
|
to restart PostgreSQL on standbys to have them follow a new primary.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
To ensure this happens smoothly, it's essential to provide the appropriate system/service restart
|
||||||
|
command appropriate to your operating system via <varname>service_restart_command</varname>
|
||||||
|
in <filename>repmgr.conf</filename>. If you don't do this, <application>repmgrd</application>
|
||||||
|
will default to using <command>pg_ctl</command>, which can result in unexpected problems,
|
||||||
|
particularly on <application>systemd</application>-based systems.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
For more details, see <xref linkend="configuration-file-service-commands">.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="repmgrd-monitoring-configuration" xreflabel="repmgrd monitoring configuration">
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgrd</primary>
|
||||||
|
<secondary>monitoring configuration</secondary>
|
||||||
|
</indexterm>
|
||||||
|
<title>Monitoring configuration</title>
|
||||||
|
<para>
|
||||||
|
To enable monitoring, set:
|
||||||
|
<programlisting>
|
||||||
|
monitoring_history=yes</programlisting>
|
||||||
|
in <filename>repmgr.conf</filename>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
The default monitoring interval is 2 seconds; this value can be explicitly set using:
|
||||||
|
<programlisting>
|
||||||
|
monitor_interval_secs=<seconds></programlisting>
|
||||||
|
in <filename>repmgr.conf</filename>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
For more details on monitoring, see <xref linkend="repmgrd-monitoring">.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="repmgrd-reloading-configuration"xreflabel="reloading repmgrd configuration">
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgrd</primary>
|
||||||
|
<secondary>applying configuration changes</secondary>
|
||||||
|
</indexterm>
|
||||||
|
<title>Applying configuration changes to repmgrd</title>
|
||||||
|
<para>
|
||||||
|
To apply configuration file changes to a running <application>repmgrd</application>
|
||||||
|
daemon, execute the operating system's <application>repmgrd</application> service reload command
|
||||||
|
(see <xref linkend="appendix-packages"> for examples),
|
||||||
|
or for instances which were manually started, execute <command>kill -HUP</command>, e.g.
|
||||||
|
<command>kill -HUP `cat /tmp/repmgrd.pid`</command>.
|
||||||
|
</para>
|
||||||
|
<tip>
|
||||||
|
<para>
|
||||||
|
Check the <application>repmgrd</application> log to see what changes were
|
||||||
|
applied, or if any issues were encountered when reloading the configuration.
|
||||||
|
</para>
|
||||||
|
</tip>
|
||||||
|
<para>
|
||||||
|
Note that only the following subset of configuration file parameters can be changed on a
|
||||||
|
running <application>repmgrd</application> daemon:
|
||||||
|
</para>
|
||||||
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>async_query_timeout</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>bdr_local_monitoring_only</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>bdr_recovery_timeout</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>conninfo</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>degraded_monitoring_timeout</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>event_notification_command</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>event_notifications</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>failover</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>follow_command</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>log_facility</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>log_file</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>log_level</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>log_status_interval</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>monitor_interval_secs</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>monitoring_history</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>primary_notification_timeout</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>promote_command</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>reconnect_attempts</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>reconnect_interval</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>repmgrd_standby_startup_timeout</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
</itemizedlist>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
The following set of configuration file parameters must be updated via
|
||||||
|
<command><link linkend="repmgr-standby-register">repmgr standby register --force</link></command>,
|
||||||
|
as they require changes to the <literal>repmgr.nodes</literal> table so they are visible to
|
||||||
|
all nodes in the replication cluster:
|
||||||
|
</para>
|
||||||
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>node_id</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>node_name</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>data_directory</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>location</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
<varname>priority</varname>
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
</itemizedlist>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
After executing <command><link linkend="repmgr-standby-register">repmgr standby register --force</link></command>,
|
||||||
|
<application>repmgrd</application> <emphasis>must</emphasis> be restarted for the changes to take effect.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
</sect1>
|
||||||
|
|
||||||
|
<sect1 id="repmgrd-daemon">
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgrd</primary>
|
||||||
|
<secondary>starting and stopping</secondary>
|
||||||
|
</indexterm>
|
||||||
|
<title>repmgrd daemon</title>
|
||||||
|
<para>
|
||||||
|
If installed from a package, the <application>repmgrd</application> can be started
|
||||||
|
via the operating system's service command, e.g. in <application>systemd</application>
|
||||||
|
using <command>systemctl</command>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
See appendix <xref linkend="appendix-packages"> for details of service commands
|
||||||
|
for different distributions.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
<application>repmgrd</application> can be started manually like this:
|
||||||
|
<programlisting>
|
||||||
|
repmgrd -f /etc/repmgr.conf --pid-file /tmp/repmgrd.pid</programlisting>
|
||||||
|
and stopped with <command>kill `cat /tmp/repmgrd.pid`</command>. Adjust paths as appropriate.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<sect2 id="repmgrd-pid-file" xreflabel="repmgrd's PID file">
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgrd</primary>
|
||||||
|
<secondary>PID file</secondary>
|
||||||
|
</indexterm>
|
||||||
|
<indexterm>
|
||||||
|
<primary>PID file</primary>
|
||||||
|
<secondary>repmgrd</secondary>
|
||||||
|
</indexterm>
|
||||||
|
<title>repmgrd's PID file</title>
|
||||||
|
<para>
|
||||||
|
<application>repmgrd</application> will generate a PID file by default.
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<simpara>
|
||||||
|
This is a behaviour change from previous versions (earlier than 4.1), where
|
||||||
|
the PID file had to be explicitly specified with the command line
|
||||||
|
parameter <option> --pid-file</option>.
|
||||||
|
</simpara>
|
||||||
|
</note>
|
||||||
|
<para>
|
||||||
|
The PID file can be specified in <filename>repmgr.conf</filename> with the configuration
|
||||||
|
parameter <varname>repmgrd_pid_file</varname>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
It can also be specified on the command line (as in previous versions) with
|
||||||
|
the command line parameter <option>--pid-file</option>. Note this will override
|
||||||
|
any value set in <filename>repmgr.conf</filename> with <varname>repmgrd_pid_file</varname>.
|
||||||
|
<option>--pid-file</option> may be deprecated in future releases.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
If a PID file location was specified by the package maintainer, <application>repmgrd</application>
|
||||||
|
will use that. This only applies if &repmgr; was installed from a package and the package
|
||||||
|
maintainer has specified the PID file location.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
If none of the above apply, <application>repmgrd</application> will create a PID file
|
||||||
|
in the operating system's temporary directory (das etermined by the environment variable
|
||||||
|
<varname>TMPDIR</varname>, or if that is not set, will use <filename>/tmp</filename>).
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
To prevent a PID file being generated at all, provide the command line option
|
||||||
|
<option>--no-pid-file</option>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
To see which PID file <application>repmgrd</application> would use, execute <application>repmgrd</application>
|
||||||
|
with the option <option>--show-pid-file</option>. <application>repmgrd</application>
|
||||||
|
will not start if this option is provided. Note that the value shown is the
|
||||||
|
file <application>repmgrd</application> would use next time it starts, and is
|
||||||
|
not necessarily the PID file currently in use.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="repmgrd-configuration-debian-ubuntu">
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgrd</primary>
|
||||||
|
<secondary>Debian/Ubuntu and daemon configuration</secondary>
|
||||||
|
</indexterm>
|
||||||
|
<indexterm>
|
||||||
|
<primary>Debian/Ubuntu</primary>
|
||||||
|
<secondary>repmgrd daemon configuration</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<title>repmgrd daemon configuration on Debian/Ubuntu</title>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
If &repmgr; was installed from Debian/Ubuntu packages, additional configuration
|
||||||
|
is required before <application>repmgrd</application> is started as a daemon.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
This is done via the file <filename>/etc/default/repmgrd</filename>, which by default
|
||||||
|
looks like this:
|
||||||
|
<programlisting>
|
||||||
|
# default settings for repmgrd. This file is source by /bin/sh from
|
||||||
|
# /etc/init.d/repmgrd
|
||||||
|
|
||||||
|
# disable repmgrd by default so it won't get started upon installation
|
||||||
|
# valid values: yes/no
|
||||||
|
REPMGRD_ENABLED=no
|
||||||
|
|
||||||
|
# configuration file (required)
|
||||||
|
#REPMGRD_CONF="/path/to/repmgr.conf"
|
||||||
|
|
||||||
|
# additional options
|
||||||
|
REPMGRD_OPTS="--daemonize=false"
|
||||||
|
|
||||||
|
# user to run repmgrd as
|
||||||
|
#REPMGRD_USER=postgres
|
||||||
|
|
||||||
|
# repmgrd binary
|
||||||
|
#REPMGRD_BIN=/usr/bin/repmgrd
|
||||||
|
|
||||||
|
# pid file
|
||||||
|
#REPMGRD_PIDFILE=/var/run/repmgrd.pid</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Set <varname>REPMGRD_ENABLED</varname> to <literal>yes</literal>, and <varname>REPMGRD_CONF</varname>
|
||||||
|
to the <filename>repmgr.conf</filename> file you are using.
|
||||||
|
</para>
|
||||||
|
<tip>
|
||||||
|
<para>
|
||||||
|
See <xref linkend="packages-debian-ubuntu"> for details of the Debian/Ubuntu packages and
|
||||||
|
typical file locations (including <filename>repmgr.conf</filename>).
|
||||||
|
</para>
|
||||||
|
</tip>
|
||||||
|
<para>
|
||||||
|
From <application>repmgrd</application> 4.1, ensure <varname>REPMGRD_OPTS</varname> includes
|
||||||
|
<option>--daemonize=false</option>, as daemonization is handled by the service command.
|
||||||
|
We recommend setting <varname>repmgrd_pid_file</varname> in <filename>repmgr.conf</filename> to the
|
||||||
|
same value set in <varname>REPMGRD_PIDFILE</varname> to prevent another <application>repmgrd</application>
|
||||||
|
instance from being started manually.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
If using <application>systemd</application>, you may need to execute <command>systemctl daemon-reload</command>.
|
||||||
|
Also, if you attempted to start <application>repmgrd</application> using <command>systemctl start repmgrd</command>,
|
||||||
|
you'll need to execute <command>systemctl stop repmgrd</command>. Because that's how <application>systemd</application>
|
||||||
|
rolls.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
</sect2>
|
||||||
|
</sect1>
|
||||||
|
|
||||||
|
<sect1 id="repmgrd-connection-settings">
|
||||||
|
<title>repmgrd connection settings</title>
|
||||||
<para>
|
<para>
|
||||||
In addition to the &repmgr; configuration settings, parameters in the
|
In addition to the &repmgr; configuration settings, parameters in the
|
||||||
<varname>conninfo</varname> string influence how &repmgr; makes a network connection to
|
<varname>conninfo</varname> string influence how &repmgr; makes a network connection to
|
||||||
@@ -70,25 +515,43 @@
|
|||||||
<ulink url="https://www.postgresql.org/docs/current/static/libpq-connect.html#LIBPQ-PARAMKEYWORDS">PostgreSQL documentation</ulink>.
|
<ulink url="https://www.postgresql.org/docs/current/static/libpq-connect.html#LIBPQ-PARAMKEYWORDS">PostgreSQL documentation</ulink>.
|
||||||
</para>
|
</para>
|
||||||
</sect1>
|
</sect1>
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
<sect1 id="repmgrd-log-rotation">
|
<sect1 id="repmgrd-log-rotation">
|
||||||
|
<indexterm>
|
||||||
|
<primary>log rotation</primary>
|
||||||
|
<secondary>repmgrd</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgrd</primary>
|
||||||
|
<secondary>log rotation</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
<title>repmgrd log rotation</title>
|
<title>repmgrd log rotation</title>
|
||||||
<para>
|
<para>
|
||||||
To ensure the current <command>repmgrd</command> logfile does not grow
|
To ensure the current <application>repmgrd</application> logfile
|
||||||
indefinitely, configure your system's <command>logrotate</command> to
|
(specified in <filename>repmgr.conf</filename> with the parameter
|
||||||
regularly rotate it.
|
<option>log_file</option>) does not grow indefinitely, configure your
|
||||||
|
system's <command>logrotate</command> to regularly rotate it.
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
Sample configuration to rotate logfiles weekly with retention for
|
Sample configuration to rotate logfiles weekly with retention for
|
||||||
up to 52 weeks and rotation forced if a file grows beyond 100Mb:
|
up to 52 weeks and rotation forced if a file grows beyond 100Mb:
|
||||||
<programlisting>
|
<programlisting>
|
||||||
/var/log/postgresql/repmgr-9.6.log {
|
/var/log/repmgr/repmgrd.log {
|
||||||
missingok
|
missingok
|
||||||
compress
|
compress
|
||||||
rotate 52
|
rotate 52
|
||||||
maxsize 100M
|
maxsize 100M
|
||||||
weekly
|
weekly
|
||||||
create 0600 postgres postgres
|
create 0600 postgres postgres
|
||||||
|
postrotate
|
||||||
|
/usr/bin/killall -HUP repmgrd
|
||||||
|
endscript
|
||||||
}</programlisting>
|
}</programlisting>
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
</sect1>
|
</sect1>
|
||||||
</chapter>
|
</chapter>
|
||||||
|
|||||||
@@ -1,9 +1,14 @@
|
|||||||
<chapter id="repmgrd-degraded-monitoring">
|
<chapter id="repmgrd-degraded-monitoring" xreflabel="repmgrd degraded monitoring">
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgrd</primary>
|
||||||
|
<secondary>degraded monitoring</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
<title>"degraded monitoring" mode</title>
|
<title>"degraded monitoring" mode</title>
|
||||||
<para>
|
<para>
|
||||||
In certain circumstances, <command>repmgrd</command> is not able to fulfill its primary mission
|
In certain circumstances, <application>repmgrd</application> is not able to fulfill its primary mission
|
||||||
of monitoring the nodes' upstream server. In these cases it enters "degraded
|
of monitoring the node's upstream server. In these cases it enters "degraded monitoring"
|
||||||
monitoring" mode, where <command>repmgrd</command> remains active but is waiting for the situation
|
mode, where <application>repmgrd</application> remains active but is waiting for the situation
|
||||||
to be resolved.
|
to be resolved.
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
@@ -35,7 +40,7 @@
|
|||||||
</listitem>
|
</listitem>
|
||||||
|
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara>repmgrd is monitoring the primary node, but it is not available</simpara>
|
<simpara>repmgrd is monitoring the primary node, but it is not available (and no other node has been promoted as primary)</simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
</itemizedlist>
|
</itemizedlist>
|
||||||
</para>
|
</para>
|
||||||
@@ -63,8 +68,16 @@
|
|||||||
<para>
|
<para>
|
||||||
By default, <literal>repmgrd</literal> will continue in degraded monitoring mode indefinitely.
|
By default, <literal>repmgrd</literal> will continue in degraded monitoring mode indefinitely.
|
||||||
However a timeout (in seconds) can be set with <varname>degraded_monitoring_timeout</varname>,
|
However a timeout (in seconds) can be set with <varname>degraded_monitoring_timeout</varname>,
|
||||||
after which <command>repmgrd</command> will terminate.
|
after which <application>repmgrd</application> will terminate.
|
||||||
|
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
If <application>repmgrd</application> is monitoring a primary mode which has been stopped
|
||||||
|
and manually restarted as a standby attached to a new primary, it will automatically detect
|
||||||
|
the status change and update the node record to reflect the node's new status
|
||||||
|
as an active standby. It will then resume monitoring the node as a standby.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
</chapter>
|
</chapter>
|
||||||
|
|||||||
@@ -10,19 +10,19 @@
|
|||||||
----+-------+---------+-----------+----------+----------+--------------------------------------
|
----+-------+---------+-----------+----------+----------+--------------------------------------
|
||||||
1 | node1 | primary | * running | | default | host=node1 dbname=repmgr user=repmgr
|
1 | node1 | primary | * running | | default | host=node1 dbname=repmgr user=repmgr
|
||||||
2 | node2 | standby | running | node1 | default | host=node2 dbname=repmgr user=repmgr
|
2 | node2 | standby | running | node1 | default | host=node2 dbname=repmgr user=repmgr
|
||||||
3 | node3 | standby | running | node1 | default | host=node3 dbname=repmgr user=repmgr </programlisting>
|
3 | node3 | standby | running | node1 | default | host=node3 dbname=repmgr user=repmgr</programlisting>
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
Start <command>repmgrd</command> on each standby and verify that it's running by examining the
|
Start <application>repmgrd</application> on each standby and verify that it's running by examining the
|
||||||
log output, which at log level <literal>INFO</literal> will look like this:
|
log output, which at log level <literal>INFO</literal> will look like this:
|
||||||
<programlisting>
|
<programlisting>
|
||||||
[2017-08-24 17:31:00] [NOTICE] using configuration file "/etc/repmgr.conf"
|
[2017-08-24 17:31:00] [NOTICE] using configuration file "/etc/repmgr.conf"
|
||||||
[2017-08-24 17:31:00] [INFO] connecting to database "host=node2 dbname=repmgr user=repmgr"
|
[2017-08-24 17:31:00] [INFO] connecting to database "host=node2 dbname=repmgr user=repmgr"
|
||||||
[2017-08-24 17:31:00] [NOTICE] starting monitoring of node <literal>node2</literal> (ID: 2)
|
[2017-08-24 17:31:00] [NOTICE] starting monitoring of node <literal>node2</literal> (ID: 2)
|
||||||
[2017-08-24 17:31:00] [INFO] monitoring connection to upstream node "node1" (node ID: 1) </programlisting>
|
[2017-08-24 17:31:00] [INFO] monitoring connection to upstream node "node1" (node ID: 1)</programlisting>
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
Each <command>repmgrd</command> should also have recorded its successful startup as an event:
|
Each <application>repmgrd</application> should also have recorded its successful startup as an event:
|
||||||
<programlisting>
|
<programlisting>
|
||||||
$ repmgr -f /etc/repmgr.conf cluster event --event=repmgrd_start
|
$ repmgr -f /etc/repmgr.conf cluster event --event=repmgrd_start
|
||||||
Node ID | Name | Event | OK | Timestamp | Details
|
Node ID | Name | Event | OK | Timestamp | Details
|
||||||
@@ -38,8 +38,8 @@
|
|||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
This will force the primary to shut down straight away, aborting all processes
|
This will force the primary to shut down straight away, aborting all processes
|
||||||
and transactions. This will cause a flurry of activity in the <command>repmgrd</command> log
|
and transactions. This will cause a flurry of activity in the <application>repmgrd</application> log
|
||||||
files as each <command>repmgrd</command> detects the failure of the primary and a failover
|
files as each <application>repmgrd</application> detects the failure of the primary and a failover
|
||||||
decision is made. This is an extract from the log of a standby server (<literal>node2</literal>)
|
decision is made. This is an extract from the log of a standby server (<literal>node2</literal>)
|
||||||
which has promoted to new primary after failure of the original primary (<literal>node1</literal>).
|
which has promoted to new primary after failure of the original primary (<literal>node1</literal>).
|
||||||
<programlisting>
|
<programlisting>
|
||||||
@@ -61,7 +61,7 @@
|
|||||||
[2017-08-24 23:32:12] [NOTICE] this node is the winner, will now promote self and inform other nodes
|
[2017-08-24 23:32:12] [NOTICE] this node is the winner, will now promote self and inform other nodes
|
||||||
INFO: connecting to standby database
|
INFO: connecting to standby database
|
||||||
NOTICE: promoting standby
|
NOTICE: promoting standby
|
||||||
DETAIL: promoting server using '/home/barwick/devel/builds/HEAD/bin/pg_ctl -l /tmp/postgres.5602.log -w -D '/tmp/repmgr-test/node_2/data' promote'
|
DETAIL: promoting server using 'pg_ctl -l /var/log/postgres/startup.log -w -D '/var/lib/pgsql/data' promote'
|
||||||
INFO: reconnecting to promoted server
|
INFO: reconnecting to promoted server
|
||||||
NOTICE: STANDBY PROMOTE successful
|
NOTICE: STANDBY PROMOTE successful
|
||||||
DETAIL: node 2 was successfully promoted to primary
|
DETAIL: node 2 was successfully promoted to primary
|
||||||
|
|||||||
@@ -1,7 +1,16 @@
|
|||||||
<chapter id="repmgrd-monitoring">
|
<chapter id="repmgrd-monitoring" xreflabel="Monitoring with repmgrd">
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgrd</primary>
|
||||||
|
<secondary>monitoring</secondary>
|
||||||
|
</indexterm>
|
||||||
|
<indexterm>
|
||||||
|
<primary>monitoring</primary>
|
||||||
|
<secondary>with repmgrd</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
<title>Monitoring with repmgrd</title>
|
<title>Monitoring with repmgrd</title>
|
||||||
<para>
|
<para>
|
||||||
When `repmgrd` is running with the option <literal>monitoring_history=true</literal>,
|
When <application>repmgrd</application> is running with the option <literal>monitoring_history=true</literal>,
|
||||||
it will constantly write standby node status information to the
|
it will constantly write standby node status information to the
|
||||||
<varname>monitoring_history</varname> table, providing a near-real time
|
<varname>monitoring_history</varname> table, providing a near-real time
|
||||||
overview of replication status on all nodes
|
overview of replication status on all nodes
|
||||||
@@ -39,7 +48,7 @@
|
|||||||
specify how many day's worth of data should be retained.
|
specify how many day's worth of data should be retained.
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
It's possible to use <command>repmgrd</command> to run in monitoring
|
It's possible to use <application>repmgrd</application> to run in monitoring
|
||||||
mode only (without automatic failover capability) for some or all
|
mode only (without automatic failover capability) for some or all
|
||||||
nodes by setting <literal>failover=manual</literal> in the node's
|
nodes by setting <literal>failover=manual</literal> in the node's
|
||||||
<filename>repmgr.conf</filename> file. In the event of the node's upstream failing,
|
<filename>repmgr.conf</filename> file. In the event of the node's upstream failing,
|
||||||
|
|||||||
@@ -1,4 +1,9 @@
|
|||||||
<chapter id="repmgrd-network-split">
|
<chapter id="repmgrd-network-split" xreflabel="Handling network splits with repmgrd">
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgrd</primary>
|
||||||
|
<secondary>network splits</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
<title>Handling network splits with repmgrd</title>
|
<title>Handling network splits with repmgrd</title>
|
||||||
<para>
|
<para>
|
||||||
A common pattern for replication cluster setups is to spread servers over
|
A common pattern for replication cluster setups is to spread servers over
|
||||||
@@ -10,7 +15,7 @@
|
|||||||
in the main data centre and promoted a standby among themselves.
|
in the main data centre and promoted a standby among themselves.
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
Previous &repmgr; versions used the concept of a "witness server" to
|
&repmgr; enables provision of "<xref linkend="witness-server">" to
|
||||||
artificially create a quorum of servers in a particular location, ensuring
|
artificially create a quorum of servers in a particular location, ensuring
|
||||||
that nodes in another location will not elect a new primary if they
|
that nodes in another location will not elect a new primary if they
|
||||||
are unable to see the majority of nodes. However this approach does not
|
are unable to see the majority of nodes. However this approach does not
|
||||||
@@ -32,11 +37,11 @@
|
|||||||
location='dc1'</programlisting>
|
location='dc1'</programlisting>
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
In a failover situation, <command>repmgrd</command> will check if any servers in the
|
In a failover situation, <application>repmgrd</application> will check if any servers in the
|
||||||
same location as the current primary node are visible. If not, <command>repmgrd</command>
|
same location as the current primary node are visible. If not, <application>repmgrd</application>
|
||||||
will assume a network interruption and not promote any node in any
|
will assume a network interruption and not promote any node in any
|
||||||
other location (it will however enter <xref linkend="repmgrd-degraded-monitoring"> mode until
|
other location (it will however enter <link linkend="repmgrd-degraded-monitoring">degraded monitoring</link>
|
||||||
a primary becomes visible).
|
mode until a primary becomes visible).
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
</chapter>
|
</chapter>
|
||||||
|
|||||||
169
doc/repmgrd-pausing.sgml
Normal file
169
doc/repmgrd-pausing.sgml
Normal file
@@ -0,0 +1,169 @@
|
|||||||
|
<chapter id="repmgrd-pausing" xreflabel="Pausing repmgrd">
|
||||||
|
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgrd</primary>
|
||||||
|
<secondary>pausing</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<indexterm>
|
||||||
|
<primary>pausing repmgrd</primary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<title>Pausing repmgrd</title>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
In normal operation, <application>repmgrd</application> monitors the state of the
|
||||||
|
PostgreSQL node it is running on, and will take appropriate action if problems
|
||||||
|
are detected, e.g. (if so configured) promote the node to primary, if the existing
|
||||||
|
primary has been determined as failed.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
However, <application>repmgrd</application> is unable to distinguish between
|
||||||
|
planned outages (such as performing a <link linkend="performing-switchover">switchover</link>
|
||||||
|
or upgrading a server), and an actual server outage. In versions prior to &repmgr; 4.2
|
||||||
|
it was necessary to stop <application>repmgrd</application> on all nodes (or at least
|
||||||
|
on all nodes where <application>repmgrd</application> is
|
||||||
|
<link linkend="repmgrd-automatic-failover">configured for automatic failover</link>)
|
||||||
|
to prevent <application>repmgrd</application> from making changes to the
|
||||||
|
replication cluster.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
From <link linkend="release-4.2">&repmgr; 4.2</link>, <application>repmgrd</application>
|
||||||
|
can now be "paused", i.e. instructed not to take any action such as performing a failover.
|
||||||
|
This can be done from any node in the cluster, removing the need to stop/restart
|
||||||
|
each <application>repmgrd</application> individually.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<sect1 id="repmgrd-pausing-prerequisites">
|
||||||
|
<title>Prerequisites for pausing <application>repmgrd</application></title>
|
||||||
|
<para>
|
||||||
|
In order to be able to pause/unpause <application>repmgrd</application>, following
|
||||||
|
prerequisites must be met:
|
||||||
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara><link linkend="release-4.2">&repmgr; 4.2</link> or later must be installed on all nodes.</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>The same major &repmgr; version (e.g. 4.2) must be installed on all nodes (and preferably the same minor version).</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
PostgreSQL on all nodes must be accessible from the node where the
|
||||||
|
<literal>pause</literal>/<literal>unpause</literal> operation is executed, using the
|
||||||
|
<varname>conninfo</varname> string shown by <link linkend="repmgr-cluster-show"><command>repmgr cluster show</command></link>.
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
</itemizedlist>
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
These conditions are required for normal &repmgr; operation in any case.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
</sect1>
|
||||||
|
|
||||||
|
<sect1 id="repmgrd-pausing-execution">
|
||||||
|
<title>Pausing/unpausing <application>repmgrd</application></title>
|
||||||
|
<para>
|
||||||
|
To pause <application>repmgrd</application>, execute <link linkend="repmgr-daemon-pause"><command>repmgr daemon pause</command></link>, e.g.:
|
||||||
|
<programlisting>
|
||||||
|
$ repmgr -f /etc/repmgr.conf daemon pause
|
||||||
|
NOTICE: node 1 (node1) paused
|
||||||
|
NOTICE: node 2 (node2) paused
|
||||||
|
NOTICE: node 3 (node3) paused</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
The state of <application>repmgrd</application> on each node can be checked with
|
||||||
|
<link linkend="repmgr-daemon-status"><command>repmgr daemon status</command></link>, e.g.:
|
||||||
|
<programlisting>$ repmgr -f /etc/repmgr.conf daemon status
|
||||||
|
ID | Name | Role | Status | repmgrd | PID | Paused?
|
||||||
|
----+-------+---------+---------+---------+------+---------
|
||||||
|
1 | node1 | primary | running | running | 7851 | yes
|
||||||
|
2 | node2 | standby | running | running | 7889 | yes
|
||||||
|
3 | node3 | standby | running | running | 7918 | yes</programlisting>
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
If executing a switchover with <link linkend="repmgr-standby-switchover"><command>repmgr standby switchover</command></link>,
|
||||||
|
&repmgr; will automatically pause/unpause <application>repmgrd</application> as part of the switchover process.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
If the primary (in this example, <literal>node1</literal>) is stopped, <application>repmgrd</application>
|
||||||
|
running on one of the standbys (here: <literal>node2</literal>) will react like this:
|
||||||
|
<programlisting>
|
||||||
|
[2018-09-20 12:22:21] [WARNING] unable to connect to upstream node "node1" (node ID: 1)
|
||||||
|
[2018-09-20 12:22:21] [INFO] checking state of node 1, 1 of 5 attempts
|
||||||
|
[2018-09-20 12:22:21] [INFO] sleeping 1 seconds until next reconnection attempt
|
||||||
|
...
|
||||||
|
[2018-09-20 12:22:24] [INFO] sleeping 1 seconds until next reconnection attempt
|
||||||
|
[2018-09-20 12:22:25] [INFO] checking state of node 1, 5 of 5 attempts
|
||||||
|
[2018-09-20 12:22:25] [WARNING] unable to reconnect to node 1 after 5 attempts
|
||||||
|
[2018-09-20 12:22:25] [NOTICE] node is paused
|
||||||
|
[2018-09-20 12:22:33] [INFO] node "node2" (node ID: 2) monitoring upstream node "node1" (node ID: 1) in degraded state
|
||||||
|
[2018-09-20 12:22:33] [DETAIL] repmgrd paused by administrator
|
||||||
|
[2018-09-20 12:22:33] [HINT] execute "repmgr daemon unpause" to resume normal failover mode</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
If the primary becomes available again (e.g. following a software upgrade), <application>repmgrd</application>
|
||||||
|
will automatically reconnect, e.g.:
|
||||||
|
<programlisting>
|
||||||
|
[2018-09-20 13:12:41] [NOTICE] reconnected to upstream node 1 after 8 seconds, resuming monitoring</programlisting>
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
To unpause <application>repmgrd</application>, execute <link linkend="repmgr-daemon-unpause"><command>repmgr daemon unpause</command></link>, e.g.:
|
||||||
|
<programlisting>
|
||||||
|
$ repmgr -f /etc/repmgr.conf daemon pause
|
||||||
|
NOTICE: node 1 (node1) unpaused
|
||||||
|
NOTICE: node 2 (node2) unpaused
|
||||||
|
NOTICE: node 3 (node3) unpaused</programlisting>
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
If the previous primary is no longer accessible when <application>repmgrd</application>
|
||||||
|
is unpaused, no failover action will be taken. Instead, a new primary must be manually promoted using
|
||||||
|
<link linkend="repmgr-standby-promote"><command>repmgr standby promote</command></link>,
|
||||||
|
and any standbys attached to the new primary with
|
||||||
|
<link linkend="repmgr-standby-follow"><command>repmgr standby follow</command></link>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
This is to prevent <link linkend="repmgr-daemon-unpause"><command>repmgr daemon unpause</command></link>
|
||||||
|
resulting in the automatic promotion of a new primary, which may be a problem particularly
|
||||||
|
in larger clusters, where <application>repmgrd</application> could select a different promotion
|
||||||
|
candidate to the one intended by the administrator.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
<sect2 id="repmgrd-pausing-details">
|
||||||
|
<title>Details on the <application>repmgrd</application> pausing mechanism</title>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
The pause state of each node will be stored over a PostgreSQL restart.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
<link linkend="repmgr-daemon-pause"><command>repmgr daemon pause</command></link> and
|
||||||
|
<link linkend="repmgr-daemon-unpause"><command>repmgr daemon unpause</command></link> can be
|
||||||
|
executed even if <application>repmgrd</application> is not running; in this case,
|
||||||
|
<application>repmgrd</application> will start up in whichever pause state has been set.
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
<link linkend="repmgr-daemon-pause"><command>repmgr daemon pause</command></link> and
|
||||||
|
<link linkend="repmgr-daemon-unpause"><command>repmgr daemon unpause</command></link>
|
||||||
|
<emphasis>do not</emphasis> stop/start <application>repmgrd</application>.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
</sect2>
|
||||||
|
</sect1>
|
||||||
|
</chapter>
|
||||||
|
|
||||||
31
doc/repmgrd-witness-server.sgml
Normal file
31
doc/repmgrd-witness-server.sgml
Normal file
@@ -0,0 +1,31 @@
|
|||||||
|
<chapter id="repmgrd-witness-server" xreflabel="Using a witness server with repmgrd">
|
||||||
|
<indexterm>
|
||||||
|
<primary>repmgrd</primary>
|
||||||
|
<secondary>witness server</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<title>Using a witness server with repmgrd</title>
|
||||||
|
<para>
|
||||||
|
In a situation caused e.g. by a network interruption between two
|
||||||
|
data centres, it's important to avoid a "split-brain" situation where
|
||||||
|
both sides of the network assume they are the active segment and the
|
||||||
|
side without an active primary unilaterally promotes one of its standbys.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
To prevent this situation happening, it's essential to ensure that one
|
||||||
|
network segment has a "voting majority", so other segments will know
|
||||||
|
they're in the minority and not attempt to promote a new primary. Where
|
||||||
|
an odd number of servers exists, this is not an issue. However, if each
|
||||||
|
network has an even number of nodes, it's necessary to provide some way
|
||||||
|
of ensuring a majority, which is where the witness server becomes useful.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
This is not a fully-fledged standby node and is not integrated into
|
||||||
|
replication, but it effectively represents the "casting vote" when
|
||||||
|
deciding which network segment has a majority. A witness server can
|
||||||
|
be set up using <xref linkend="repmgr-witness-register">. Note that it only
|
||||||
|
makes sense to create a witness server in conjunction with running
|
||||||
|
<application>repmgrd</application>; the witness server will require its own
|
||||||
|
<application>repmgrd</application> instance.
|
||||||
|
</para>
|
||||||
|
</chapter>
|
||||||
@@ -1,4 +1,9 @@
|
|||||||
<chapter id="performing-switchover" xreflabel="Performing a switchover with repmgr">
|
<chapter id="performing-switchover" xreflabel="Performing a switchover with repmgr">
|
||||||
|
|
||||||
|
<indexterm>
|
||||||
|
<primary>switchover</primary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
<title>Performing a switchover with repmgr</title>
|
<title>Performing a switchover with repmgr</title>
|
||||||
<para>
|
<para>
|
||||||
A typical use-case for replication is a combination of primary and standby
|
A typical use-case for replication is a combination of primary and standby
|
||||||
@@ -14,9 +19,10 @@
|
|||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
<command>repmgr standby switchover</command> differs from other &repmgr;
|
<command>repmgr standby switchover</command> differs from other &repmgr;
|
||||||
actions in that it lso performs actions on another server (the demotion
|
actions in that it also performs actions on other servers (the demotion
|
||||||
candidate), which means passwordless SSH access is required to that server
|
candidate, and optionally any other servers which are to follow the new primary),
|
||||||
from the one where <command>repmgr standby switchover</command> is executed.
|
which means passwordless SSH access is required to those servers from the one where
|
||||||
|
<command>repmgr standby switchover</command> is executed.
|
||||||
</para>
|
</para>
|
||||||
<note>
|
<note>
|
||||||
<simpara>
|
<simpara>
|
||||||
@@ -39,7 +45,7 @@
|
|||||||
</simpara>
|
</simpara>
|
||||||
<simpara>
|
<simpara>
|
||||||
Please also read carefully the sections <xref linkend="preparing-for-switchover"> and
|
Please also read carefully the sections <xref linkend="preparing-for-switchover"> and
|
||||||
`Caveats` below.
|
<xref linkend="switchover-caveats"> below.
|
||||||
</simpara>
|
</simpara>
|
||||||
</note>
|
</note>
|
||||||
|
|
||||||
@@ -49,45 +55,119 @@
|
|||||||
<secondary>preparation</secondary>
|
<secondary>preparation</secondary>
|
||||||
</indexterm>
|
</indexterm>
|
||||||
<title>Preparing for switchover</title>
|
<title>Preparing for switchover</title>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
As mentioned above, success of the switchover operation depends on &repmgr;
|
As mentioned in the previous section, success of the switchover operation depends on
|
||||||
being able to shut down the current primary server quickly and cleanly.
|
&repmgr; being able to shut down the current primary server quickly and cleanly.
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
Ensure that the promotion candidate has sufficient free walsenders available
|
||||||
|
(PostgreSQL configuration item <varname>max_wal_senders</varname>), and if replication
|
||||||
|
slots are in use, at least one free slot is available for the demotion candidate (
|
||||||
|
PostgreSQL configuration item <varname>max_replication_slots</varname>).
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
Ensure that a passwordless SSH connection is possible from the promotion candidate
|
||||||
|
(standby) to the demotion candidate (current primary). If <literal>--siblings-follow</literal>
|
||||||
|
will be used, ensure that passwordless SSH connections are possible from the
|
||||||
|
promotion candidate to all standbys attached to the demotion candidate.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<simpara>
|
||||||
|
&repmgr; expects to find the &repmgr; binary in the same path on the remote
|
||||||
|
server as on the local server.
|
||||||
|
</simpara>
|
||||||
|
</note>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
Double-check which commands will be used to stop/start/restart the current
|
Double-check which commands will be used to stop/start/restart the current
|
||||||
primary; on the primary execute:
|
primary; on the current primary execute:
|
||||||
<programlisting>
|
<programlisting>
|
||||||
repmgr -f /etc./repmgr.conf node service --list --action=stop
|
repmgr -f /etc/repmgr.conf node service --list --action=stop
|
||||||
repmgr -f /etc./repmgr.conf node service --list --action=start
|
repmgr -f /etc/repmgr.conf node service --list --action=start
|
||||||
repmgr -f /etc./repmgr.conf node service --list --action=restart
|
repmgr -f /etc/repmgr.conf node service --list --action=restart</programlisting>
|
||||||
</programlisting>
|
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
These commands can be defined in <filename>repmgr.conf</filename> with
|
||||||
|
<option>service_start_command</option>, <option>service_stop_command</option>
|
||||||
|
and <option>service_restart_command</option>.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<important>
|
||||||
|
<para>
|
||||||
|
If &repmgr; is installed from a package. you should set these commands
|
||||||
|
to use the appropriate service commands defined by the package/operating
|
||||||
|
system as these will ensure PostgreSQL is stopped/started properly
|
||||||
|
taking into account configuration and log file locations etc.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
If the <option>service_*_command</option> options aren't defined, &repmgr; will
|
||||||
|
fall back to using <application>pg_ctl</application> to stop/start/restart
|
||||||
|
PostgreSQL, which may not work properly, particularly when executed on a remote
|
||||||
|
server.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
For more details, see <xref linkend="configuration-file-service-commands">.
|
||||||
|
</para>
|
||||||
|
</important>
|
||||||
|
|
||||||
<note>
|
<note>
|
||||||
<simpara>
|
<simpara>
|
||||||
On <literal>systemd</literal> systems we strongly recommend using the appropriate
|
On <literal>systemd</literal> systems we strongly recommend using the appropriate
|
||||||
<command>systemctl</command> commands (typically run via <command>sudo</command>) to ensure
|
<command>systemctl</command> commands (typically run via <command>sudo</command>) to ensure
|
||||||
<literal>systemd</literal> informed about the status of the PostgreSQL service.
|
<literal>systemd</literal> is informed about the status of the PostgreSQL service.
|
||||||
|
</simpara>
|
||||||
|
<simpara>
|
||||||
|
If using <command>sudo</command> for the <command>systemctl</command> calls, make sure the
|
||||||
|
<command>sudo</command> specification doesn't require a real tty for the user. If not set
|
||||||
|
this way, <command>repmgr</command> will fail to stop the primary.
|
||||||
</simpara>
|
</simpara>
|
||||||
</note>
|
</note>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
Check that access from applications is minimalized or preferably blocked
|
Check that access from applications is minimalized or preferably blocked
|
||||||
completely, so applications are not unexpectedly interrupted.
|
completely, so applications are not unexpectedly interrupted.
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
If an exclusive backup is running on the current primary, &repmgr; will not perform the
|
||||||
|
switchover.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
Check there is no significant replication lag on standbys attached to the
|
Check there is no significant replication lag on standbys attached to the
|
||||||
current primary.
|
current primary.
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
If WAL file archiving is set up, check that there is no backlog of files waiting
|
If WAL file archiving is set up, check that there is no backlog of files waiting
|
||||||
to be archived, as PostgreSQL will not finally shut down until all these have been
|
to be archived, as PostgreSQL will not finally shut down until all of these have been
|
||||||
archived. If there is a backlog exceeding <varname>archive_ready_warning</varname> WAL files,
|
archived. If there is a backlog exceeding <varname>archive_ready_warning</varname> WAL files,
|
||||||
`repmgr` will emit a warning before attempting to perform a switchover; you can also check
|
&repmgr; will emit a warning before attempting to perform a switchover; you can also check
|
||||||
manually with <command>repmgr node check --archive-ready</command>.
|
manually with <command>repmgr node check --archive-ready</command>.
|
||||||
</para>
|
</para>
|
||||||
<para>
|
|
||||||
Ensure that <command>repmgrd</command> is *not* running anywhere to prevent it unintentionally
|
<note>
|
||||||
promoting a node.
|
<para>
|
||||||
</para>
|
From <link linkend="release-4.2">repmgr 4.2</link>, &repmgr; will instruct any running
|
||||||
|
<application>repmgrd</application> instances to pause operations while the switchover
|
||||||
|
is being carried out, to prevent <application>repmgrd</application> from
|
||||||
|
unintentionally promoting a node. For more details, see <xref linkend="repmgrd-pausing">.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Users of &repmgr; versions prior to 4.2 should ensure that <application>repmgrd</application>
|
||||||
|
is not running on any nodes while a switchover is being executed.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
Finally, consider executing <command>repmgr standby switchover</command> with the
|
Finally, consider executing <command>repmgr standby switchover</command> with the
|
||||||
<literal>--dry-run</literal> option; this will perform any necessary checks and inform you about
|
<literal>--dry-run</literal> option; this will perform any necessary checks and inform you about
|
||||||
@@ -96,7 +176,7 @@
|
|||||||
<programlisting>
|
<programlisting>
|
||||||
$ repmgr standby switchover -f /etc/repmgr.conf --siblings-follow --dry-run
|
$ repmgr standby switchover -f /etc/repmgr.conf --siblings-follow --dry-run
|
||||||
NOTICE: checking switchover on node "node2" (ID: 2) in --dry-run mode
|
NOTICE: checking switchover on node "node2" (ID: 2) in --dry-run mode
|
||||||
INFO: SSH connection to host "localhost" succeeded
|
INFO: SSH connection to host "node1" succeeded
|
||||||
INFO: archive mode is "off"
|
INFO: archive mode is "off"
|
||||||
INFO: replication lag on this standby is 0 seconds
|
INFO: replication lag on this standby is 0 seconds
|
||||||
INFO: all sibling nodes are reachable via SSH
|
INFO: all sibling nodes are reachable via SSH
|
||||||
@@ -105,6 +185,74 @@
|
|||||||
"pg_ctl -l /var/log/postgresql/startup.log -D '/var/lib/postgresql/data' -m fast -W stop"
|
"pg_ctl -l /var/log/postgresql/startup.log -D '/var/lib/postgresql/data' -m fast -W stop"
|
||||||
</programlisting>
|
</programlisting>
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
|
<important>
|
||||||
|
<para>
|
||||||
|
Be aware that <option>--dry-run</option> checks the prerequisites
|
||||||
|
for performing the switchover and some basic sanity checks on the
|
||||||
|
state of the database which might effect the switchover operation
|
||||||
|
(e.g. replication lag); it cannot however guarantee the switchover
|
||||||
|
operation will succeed. In particular, if the current primary
|
||||||
|
does not shut down cleanly, &repmgr; will not be able to reliably
|
||||||
|
execute the switchover (as there would be a danger of divergence
|
||||||
|
between the former and new primary nodes).
|
||||||
|
</para>
|
||||||
|
</important>
|
||||||
|
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<simpara>
|
||||||
|
See <xref linkend="repmgr-standby-switchover"> for a full list of available
|
||||||
|
command line options and <filename>repmgr.conf</filename> settings relevant
|
||||||
|
to performing a switchover.
|
||||||
|
</simpara>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
<sect2 id="switchover-pg-rewind" xreflabel="Switchover and pg_rewind">
|
||||||
|
<indexterm>
|
||||||
|
<primary>pg_rewind</primary>
|
||||||
|
<secondary>using with "repmgr standby switchover"</secondary>
|
||||||
|
</indexterm>
|
||||||
|
<title>Switchover and pg_rewind</title>
|
||||||
|
<para>
|
||||||
|
If the demotion candidate does not shut down smoothly or cleanly, there's a risk it
|
||||||
|
will have a slightly divergent timeline and will not be able to attach to the new
|
||||||
|
primary. To fix this situation without needing to reclone the old primary, it's
|
||||||
|
possible to use the <application>pg_rewind</application> utility, which will usually be
|
||||||
|
able to resync the two servers.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
To have &repmgr; execute <application>pg_rewind</application> if it detects this
|
||||||
|
situation after promoting the new primary, add the <option>--force-rewind</option>
|
||||||
|
option.
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<simpara>
|
||||||
|
If &repmgr; detects a situation where it needs to execute <application>pg_rewind</application>,
|
||||||
|
it will execute a <literal>CHECKPOINT</literal> on the new primary before executing
|
||||||
|
<application>pg_rewind</application>.
|
||||||
|
</simpara>
|
||||||
|
</note>
|
||||||
|
<para>
|
||||||
|
For more details on <application>pg_rewind</application>, see:
|
||||||
|
<ulink url="https://www.postgresql.org/docs/current/static/app-pgrewind.html">https://www.postgresql.org/docs/current/static/app-pgrewind.html</ulink>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
<application>pg_rewind</application> has been part of the core PostgreSQL distribution since
|
||||||
|
version 9.5. Users of versions 9.3 and 9.4 will need to manually install it; the source code is available here:
|
||||||
|
<ulink url="https://github.com/vmware/pg_rewind">https://github.com/vmware/pg_rewind</ulink>.
|
||||||
|
If the <application>pg_rewind</application>
|
||||||
|
binary is not installed in the PostgreSQL <filename>bin</filename> directory, provide
|
||||||
|
its full path on the demotion candidate with <option>--force-rewind</option>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
Note that building the 9.3/9.4 version of <application>pg_rewind</application> requires the PostgreSQL
|
||||||
|
source code. Also, PostgreSQL 9.3 does not provide <varname>wal_log_hints</varname>,
|
||||||
|
meaning data checksums must have been enabled when the database was initialized.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
|
||||||
</sect1>
|
</sect1>
|
||||||
|
|
||||||
<sect1 id="switchover-execution" xreflabel="Executing the switchover command">
|
<sect1 id="switchover-execution" xreflabel="Executing the switchover command">
|
||||||
@@ -128,7 +276,7 @@
|
|||||||
INFO: searching for primary node
|
INFO: searching for primary node
|
||||||
INFO: checking if node 1 is primary
|
INFO: checking if node 1 is primary
|
||||||
INFO: current primary node is 1
|
INFO: current primary node is 1
|
||||||
INFO: SSH connection to host "localhost" succeeded
|
INFO: SSH connection to host "node1" succeeded
|
||||||
INFO: archive mode is "off"
|
INFO: archive mode is "off"
|
||||||
INFO: replication lag on this standby is 0 seconds
|
INFO: replication lag on this standby is 0 seconds
|
||||||
NOTICE: local node "node2" (ID: 2) will be promoted to primary; current primary "node1" (ID: 1) will be demoted to standby
|
NOTICE: local node "node2" (ID: 2) will be promoted to primary; current primary "node1" (ID: 1) will be demoted to standby
|
||||||
@@ -162,7 +310,21 @@
|
|||||||
2 | node2 | primary | * running | | default | host=node2 dbname=repmgr user=repmgr
|
2 | node2 | primary | * running | | default | host=node2 dbname=repmgr user=repmgr
|
||||||
</programlisting>
|
</programlisting>
|
||||||
</para>
|
</para>
|
||||||
|
<para>
|
||||||
|
If <application>repmgrd</application> is in use, it's worth double-checking that
|
||||||
|
all nodes are unpaused by executing <command><link linkend="repmgr-daemon-status">repmgr-daemon-status</link></command>.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
Users of &repmgr; versions prior to 4.2 will need to manually restart <application>repmgrd</application>
|
||||||
|
on all nodes after the switchover is completed.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
</sect1>
|
</sect1>
|
||||||
|
|
||||||
|
|
||||||
<sect1 id="switchover-caveats" xreflabel="Caveats">
|
<sect1 id="switchover-caveats" xreflabel="Caveats">
|
||||||
<indexterm>
|
<indexterm>
|
||||||
<primary>switchover</primary>
|
<primary>switchover</primary>
|
||||||
@@ -188,17 +350,76 @@
|
|||||||
for details.
|
for details.
|
||||||
</simpara>
|
</simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
<listitem>
|
|
||||||
<simpara>
|
|
||||||
<command>repmgrd</command> should not be running with setting <varname>failover=automatic</varname>
|
|
||||||
in <filename>repmgr.conf</filename> when a switchover is carried out, otherwise the
|
|
||||||
<command>repmgrd</command> daemon may try and promote a standby by itself.
|
|
||||||
</simpara>
|
|
||||||
</listitem>
|
|
||||||
</itemizedlist>
|
</itemizedlist>
|
||||||
</para>
|
</para>
|
||||||
<para>
|
|
||||||
We hope to remove some of these restrictions in future versions of `repmgr`.
|
|
||||||
</para>
|
|
||||||
</sect1>
|
</sect1>
|
||||||
|
|
||||||
|
<sect1 id="switchover-troubleshooting" xreflabel="Troubleshooting">
|
||||||
|
<indexterm>
|
||||||
|
<primary>switchover</primary>
|
||||||
|
<secondary>troubleshooting</secondary>
|
||||||
|
</indexterm>
|
||||||
|
<title>Troubleshooting switchover issues</title>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
As <link linkend="performing-switchover">emphasised previously</link>, performing a switchover
|
||||||
|
is a non-trivial operation and there are a number of potential issues which can occur.
|
||||||
|
While &repmgr; attempts to perform sanity checks, there's no guaranteed way of determining the success of
|
||||||
|
a switchover without actually carrying it out.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<sect2 id="switchover-troubleshooting-primary-shutdown">
|
||||||
|
<title>Demotion candidate (old primary) does not shut down</title>
|
||||||
|
<para>
|
||||||
|
&repmgr; may abort a switchover with a message like:
|
||||||
|
<programlisting>
|
||||||
|
ERROR: shutdown of the primary server could not be confirmed
|
||||||
|
HINT: check the primary server status before performing any further actions</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
This means the shutdown of the old primary has taken longer than &repmgr; expected,
|
||||||
|
and it has given up waiting.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
In this case, check the PostgreSQL log on the primary server to see what is going
|
||||||
|
on. It's entirely possible the shutdown process is just taking longer than the
|
||||||
|
timeout set by the configuration parameter <varname>shutdown_check_timeout</varname>
|
||||||
|
(default: 60 seconds), in which case you may need to adjust this parameter.
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
Note that <varname>shutdown_check_timeout</varname>is set on the node where
|
||||||
|
<command>repmgr standby switchover</command> is executed (promotion candidate); setting it on the
|
||||||
|
demotion candidate (former primary) will have no effect.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
<para>
|
||||||
|
If the primary server has shut down cleanly, and no other node has been promoted,
|
||||||
|
it is safe to restart it, in which case the replication cluster will be restored
|
||||||
|
to its original configuration.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="switchover-troubleshooting-exclusive-backup">
|
||||||
|
<title>Switchover aborts with an "exclusive backup" error</title>
|
||||||
|
<para>
|
||||||
|
&repmgr; may abort a switchover with a message like:
|
||||||
|
<programlisting>
|
||||||
|
ERROR: unable to perform a switchover while primary server is in exclusive backup mode
|
||||||
|
HINT: stop backup before attempting the switchover</programlisting>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
This means an exclusive backup is running on the current primary; interrupting this
|
||||||
|
will not only abort the backup, but potentially leave the primary with an ambiguous
|
||||||
|
backup state.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
To proceed, either wait until the backup has finished, or cancel it with the command
|
||||||
|
<command>SELECT pg_stop_backup()</command>. For more details see the PostgreSQL
|
||||||
|
documentation section
|
||||||
|
<ulink url="https://www.postgresql.org/docs/current/static/continuous-archiving.html#BACKUP-LOWLEVEL-BASE-BACKUP-EXCLUSIVE">Making an exclusive low level backup</ulink>.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
</sect1>
|
||||||
|
|
||||||
</chapter>
|
</chapter>
|
||||||
|
|||||||
@@ -1,140 +1,9 @@
|
|||||||
Upgrading from repmgr 3
|
Upgrading from repmgr 3
|
||||||
=======================
|
=======================
|
||||||
|
|
||||||
The upgrade process consists of two steps:
|
This document has been integrated into the main `repmgr` documentation
|
||||||
|
and is now located here:
|
||||||
|
|
||||||
1) converting the repmgr.conf configuration files
|
> [Upgrading from repmgr 3.x](https://repmgr.org/docs/4.0/upgrading-from-repmgr-3.html)
|
||||||
2) upgrading the repmgr schema
|
|
||||||
|
|
||||||
A script is provided to assist with converting `repmgr.conf`.
|
|
||||||
|
|
||||||
The schema upgrade (which converts the `repmgr` metadata into
|
|
||||||
a packaged PostgreSQL extension) is normally carried out
|
|
||||||
automatically when the `repmgr` extension is created.
|
|
||||||
|
|
||||||
|
|
||||||
Converting repmgr.conf configuration files
|
|
||||||
------------------------------------------
|
|
||||||
|
|
||||||
With a completely new repmgr version, we've taken the opportunity
|
|
||||||
to rename some configuration items have had their names changed for
|
|
||||||
clarity and consistency, both between the configuration file and
|
|
||||||
the column names in `repmgr.nodes` (e.g. `node` → `node_id`), and
|
|
||||||
also for consistency with PostgreSQL naming conventions
|
|
||||||
(e.g. `loglevel` → `log_level`).
|
|
||||||
|
|
||||||
Other configuration items have been changed to command line options,
|
|
||||||
and vice-versa, e.g. to avoid hard-coding items such as a a node's
|
|
||||||
upstream ID, which might change over time.
|
|
||||||
|
|
||||||
`repmgr` will issue a warning about deprecated/altered options.
|
|
||||||
|
|
||||||
|
|
||||||
### Changed parameters
|
|
||||||
|
|
||||||
Following parameters have been added:
|
|
||||||
|
|
||||||
- `data_directory`: this is mandatory and must contain the path
|
|
||||||
to the node's data directory
|
|
||||||
- `monitoring_history`: this replaces the `repmgrd` command line
|
|
||||||
option `--monitoring-history`
|
|
||||||
|
|
||||||
Following parameters have been renamed:
|
|
||||||
|
|
||||||
- `node` → `node_id`
|
|
||||||
- `loglevel` → `log_level`
|
|
||||||
- `logfacility` → `log_facility`
|
|
||||||
- `logfile` → `log_file`
|
|
||||||
- `master_reponse_timeout` → `async_query_timeout`
|
|
||||||
|
|
||||||
Following parameters have been removed:
|
|
||||||
|
|
||||||
- `cluster` is no longer required and will be ignored.
|
|
||||||
- `upstream_node_id` is replaced by the command-line parameter
|
|
||||||
`--upstream-node-id`
|
|
||||||
|
|
||||||
### Conversion script
|
|
||||||
|
|
||||||
To assist with conversion of `repmgr.conf` files, a Perl script
|
|
||||||
is provided in `contrib/convert-config.pl`. Use like this:
|
|
||||||
|
|
||||||
$ ./convert-config.pl /etc/repmgr.conf
|
|
||||||
node_id=2
|
|
||||||
node_name=node2
|
|
||||||
conninfo=host=node2 dbname=repmgr user=repmgr connect_timeout=2
|
|
||||||
pg_ctl_options='-l /var/log/postgres/startup.log'
|
|
||||||
rsync_options=--exclude=postgresql.local.conf --archive
|
|
||||||
log_level=INFO
|
|
||||||
pg_basebackup_options=--no-slot
|
|
||||||
data_directory=
|
|
||||||
|
|
||||||
The converted file is printed to `STDOUT` and the original file is not
|
|
||||||
changed.
|
|
||||||
|
|
||||||
Please note that the parameter `data_directory` *must* be provided;
|
|
||||||
if not already present, the conversion script will add an empty
|
|
||||||
placeholder parameter.
|
|
||||||
|
|
||||||
|
|
||||||
Upgrading the repmgr schema
|
|
||||||
---------------------------
|
|
||||||
|
|
||||||
Ensure `repmgrd` is not running, or any cron jobs which execute the
|
|
||||||
`repmgr` binary.
|
|
||||||
|
|
||||||
Install `repmgr4`; any `repmgr3` packages should be uninstalled
|
|
||||||
(if not automatically uninstalled already).
|
|
||||||
|
|
||||||
### Upgrading from repmgr 3.1.1 or earlier
|
|
||||||
|
|
||||||
If your repmgr version is 3.1.1 or earlier, you will need to update
|
|
||||||
the schema to the latest version in the 3.x series (3.3.2) before
|
|
||||||
converting the installation to repmgr 4.
|
|
||||||
|
|
||||||
To do this, apply the following upgrade scripts as appropriate for
|
|
||||||
your current version:
|
|
||||||
|
|
||||||
- repmgr3.0_repmgr3.1.sql
|
|
||||||
- repmgr3.1.1_repmgr3.1.2.sql
|
|
||||||
|
|
||||||
For more details see:
|
|
||||||
|
|
||||||
https://repmgr.org/release-notes-3.3.2.html#upgrading
|
|
||||||
|
|
||||||
### Manually create the repmgr extension
|
|
||||||
|
|
||||||
In the database used by the existing `repmgr` configuration, execute:
|
|
||||||
|
|
||||||
CREATE EXTENSION repmgr FROM unpackaged;
|
|
||||||
|
|
||||||
This will move and convert all objects from the existing schema
|
|
||||||
into the new, standard `repmgr` schema.
|
|
||||||
|
|
||||||
> *NOTE* there must be only one schema matching 'repmgr_%' in the
|
|
||||||
> database, otherwise this step may not work.
|
|
||||||
|
|
||||||
### Re-register each node
|
|
||||||
|
|
||||||
This is necessary to update the `repmgr` metadata with some additional items.
|
|
||||||
|
|
||||||
On the primary node, execute e.g.
|
|
||||||
|
|
||||||
repmgr primary register -f /etc/repmgr.conf --force
|
|
||||||
|
|
||||||
On each standby node, execute e.g.
|
|
||||||
|
|
||||||
repmgr standby register -f /etc/repmgr.conf --force
|
|
||||||
|
|
||||||
Check the data is updated as expected by examining the `repmgr.nodes` table;
|
|
||||||
restart `repmgrd` if required.
|
|
||||||
|
|
||||||
The original `repmgr_$cluster` schema can be dropped at any time.
|
|
||||||
|
|
||||||
* * *
|
|
||||||
|
|
||||||
> *TIP* If you don't care about any data from the existing `repmgr` installation,
|
|
||||||
> (e.g. the contents of the `events` and `monitoring` tables), the manual
|
|
||||||
> "CREATE EXTENSION" step can be skipped; just re-register each node, starting
|
|
||||||
> with the primary node, and the `repmgr` extension will be automatically created.
|
|
||||||
|
|
||||||
* * *
|
|
||||||
|
|||||||
@@ -1,24 +1,275 @@
|
|||||||
<chapter id="upgrading-repmgr" xreflabel="Upgrading repmgr">
|
<chapter id="upgrading-repmgr" xreflabel="Upgrading repmgr">
|
||||||
|
|
||||||
|
<indexterm>
|
||||||
|
<primary>upgrading</primary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
<title>Upgrading repmgr</title>
|
<title>Upgrading repmgr</title>
|
||||||
|
|
||||||
<para>
|
<para>
|
||||||
&repmgr; is updated regularly with point releases (e.g. 4.0.1 to 4.0.2)
|
&repmgr; is updated regularly with minor releases (e.g. 4.0.1 to 4.0.2)
|
||||||
containing bugfixes and other minor improvements. Any substantial new
|
containing bugfixes and other minor improvements. Any substantial new
|
||||||
functionality will be included in a feature release (e.g. 4.0.x to 4.1.x).
|
functionality will be included in a major release (e.g. 4.0 to 4.1).
|
||||||
</para>
|
|
||||||
<para>
|
|
||||||
&repmgr; is implemented as a PostgreSQL extension; to upgrade it, first
|
|
||||||
install the updated package (or compile the updated source), then in the
|
|
||||||
database where the &repmgr; extension is installed, execute
|
|
||||||
<command>ALTER EXTENSION repmgr UPDATE</command>.
|
|
||||||
</para>
|
|
||||||
<para>
|
|
||||||
If <command>repmgrd</command> is running, it may be necessary to restart
|
|
||||||
the PostgreSQL server if the upgrade contains changes to the shared object
|
|
||||||
file used by <command>repmgrd</command>; check the release notes for details.
|
|
||||||
</para>
|
</para>
|
||||||
|
|
||||||
<sect1 id="upgrading-from-repmgr-3">
|
<sect1 id="upgrading-repmgr-extension" xreflabel="Upgrading repmgr 4.x and later">
|
||||||
<title>Upgrading from repmgr 3</title>
|
<indexterm>
|
||||||
|
<primary>upgrading</primary>
|
||||||
|
<secondary>repmgr 4.x and later</secondary>
|
||||||
|
</indexterm>
|
||||||
|
<title>Upgrading repmgr 4.x and later</title>
|
||||||
|
<para>
|
||||||
|
From version 4, &repmgr; consists of three elements:
|
||||||
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
the <application>repmgr</application> and <application>repmgrd</application> executables
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
the objects for the &repmgr; PostgreSQL extension (SQL files for creating/updating
|
||||||
|
repmgr metadata, and the extension control file)
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
the shared library module used by <application>repmgrd</application> which
|
||||||
|
is resident in the PostgreSQL backend
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
</itemizedlist>
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
With <emphasis>minor releases</emphasis>, usually changes are only made to the <application>repmgr</application>
|
||||||
|
and <application>repmgrd</application> executables. In this case, the upgrade is quite straightforward,
|
||||||
|
and is simply a case of installing the new version, and restarting <application>repmgrd</application>
|
||||||
|
(if running).
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
For <emphasis>major releases</emphasis>, the &repmgr; PostgreSQL extension will need to be updated
|
||||||
|
to the latest version. Additionally, if the shared library module has been updated (this is sometimes,
|
||||||
|
but not always the case), PostgreSQL itself will need to be restarted on each node.
|
||||||
|
</para>
|
||||||
|
<important>
|
||||||
|
<para>
|
||||||
|
Always check the <link linkend="appendix-release-notes">release notes</link> for every
|
||||||
|
release as they may contain upgrade instructions particular to individual versions.
|
||||||
|
</para>
|
||||||
|
</important>
|
||||||
|
|
||||||
|
<sect2 id="upgrading-minor-version" xreflabel="Upgrading a minor version release">
|
||||||
|
<indexterm>
|
||||||
|
<primary>upgrading</primary>
|
||||||
|
<secondary>minor release</secondary>
|
||||||
|
</indexterm>
|
||||||
|
<title>Upgrading a minor version release</title>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
The process for installing minor version upgrades is quite straightforward:
|
||||||
|
|
||||||
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
install the new &repmgr; version
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
restart <application>repmgrd</application> on all nodes where it is running
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
</itemizedlist>
|
||||||
|
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
Some packaging systems (e.g. <link linkend="packages-debian-ubuntu">Debian/Ubuntu</link>
|
||||||
|
may restart <application>repmgrd</application> as part of the package upgrade process.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
Minor version upgrades can be performed in any order on the nodes in the replication
|
||||||
|
cluster.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
A PostgreSQL restart is <emphasis>not</emphasis> required for minor version upgrades.
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
The same &repmgr; "major version" (e.g. <literal>4.2</literal>) must be
|
||||||
|
installed on all nodes in the replication cluster. While it's possible to have differing
|
||||||
|
&repmgr; "minor versions" (e.g. <literal>4.2.1</literal>) on different nodes,
|
||||||
|
we strongly recommend updating all nodes to the latest minor version.
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
|
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="upgrading-major-version" xreflabel="Upgrading a major version release">
|
||||||
|
<indexterm>
|
||||||
|
<primary>upgrading</primary>
|
||||||
|
<secondary>major release</secondary>
|
||||||
|
</indexterm>
|
||||||
|
<title>Upgrading a major version release</title>
|
||||||
|
<para>
|
||||||
|
"major version" upgrades need to be planned more carefully, as they may include
|
||||||
|
changes to the &repmgr; metadata (which need to be propagated from the primary to all
|
||||||
|
standbys) and/or changes to the shared object file used by <application>repmgrd</application>
|
||||||
|
(which require a PostgreSQL restart).
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
With this in mind,
|
||||||
|
</para>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
<orderedlist>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
Stop <application>repmgrd</application> (if in use) on all nodes where it is running.
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
Disable the <application>repmgrd</application> service on all nodes where it is in use;
|
||||||
|
this is to prevent packages from prematurely restarting <application>repmgrd</application>.
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
Install the updated package (or compile the updated source) on all nodes.
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
If running a <literal>systemd</literal>-based Linux distribution, execute (as <literal>root</literal>,
|
||||||
|
or with appropriate <literal>sudo</literal> permissions):
|
||||||
|
<programlisting>
|
||||||
|
systemctl daemon-reload</programlisting>
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
If the &repmgr; shared library module has been updated (check the <link linkend="appendix-release-notes">release notes</link>!),
|
||||||
|
restart PostgreSQL, then <application>repmgrd</application> (if in use) on each node,
|
||||||
|
The order in which this is applied to individual nodes is not critical,
|
||||||
|
and it's also fine to restart PostgreSQL on all nodes first before starting <application>repmgrd</application>.
|
||||||
|
</simpara>
|
||||||
|
<simpara>
|
||||||
|
Note that if the upgrade requires a PostgreSQL restart, <application>repmgrd</application>
|
||||||
|
will only function correctly once all nodes have been restarted.
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<para>
|
||||||
|
On the primary node, execute
|
||||||
|
<programlisting>
|
||||||
|
ALTER EXTENSION repmgr UPDATE</programlisting>
|
||||||
|
in the database where &repmgr; is installed.
|
||||||
|
</para>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
<listitem>
|
||||||
|
<simpara>
|
||||||
|
Reenable the <application>repmgrd</application> service on all nodes where it is in use.
|
||||||
|
</simpara>
|
||||||
|
</listitem>
|
||||||
|
|
||||||
|
</orderedlist>
|
||||||
|
</para>
|
||||||
|
<tip>
|
||||||
|
<para>
|
||||||
|
If the &repmgr; upgrade requires a PostgreSQL restart, combine the &repmgr; upgrade
|
||||||
|
with a PostgreSQL minor version upgrade, which will require a restart in any case.
|
||||||
|
New PostgreSQL minor version are usually released every couple of months.
|
||||||
|
</para>
|
||||||
|
</tip>
|
||||||
|
</sect2>
|
||||||
|
|
||||||
|
<sect2 id="upgrading-check-repmgrd" xreflabel="Checking repmgrd status after an upgrade">
|
||||||
|
<indexterm>
|
||||||
|
<primary>upgrading</primary>
|
||||||
|
<secondary>checking repmgrd status</secondary>
|
||||||
|
</indexterm>
|
||||||
|
<title>Checking repmgrd status after an upgrade</title>
|
||||||
|
<para>
|
||||||
|
From &repmgr; 4.2, once the upgrade is complete, execute the <command><link linkend="repmgr-daemon-status">repmgr daemon status</link></command>
|
||||||
|
command (on any node) to show an overview of the status of <application>repmgrd</application> on all nodes.
|
||||||
|
</para>
|
||||||
|
</sect2>
|
||||||
|
</sect1>
|
||||||
|
|
||||||
|
<sect1 id="upgrading-and-pg-upgrade" xreflabel="pg_upgrade and repmgr">
|
||||||
|
<indexterm>
|
||||||
|
<primary>upgrading</primary>
|
||||||
|
<secondary>pg_upgrade</secondary>
|
||||||
|
</indexterm>
|
||||||
|
<indexterm>
|
||||||
|
<primary>pg_upgrade</primary>
|
||||||
|
</indexterm>
|
||||||
|
<title>pg_upgrade and repmgr</title>
|
||||||
|
|
||||||
|
<para>
|
||||||
|
<application>pg_upgrade</application> requires that if any functions are
|
||||||
|
dependent on a shared library, this library must be present in both
|
||||||
|
the old and new installations before <application>pg_upgrade</application>
|
||||||
|
can be executed.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
To minimize the risk of any upgrade issues (particularly if an upgrade to
|
||||||
|
a new major &repmgr; version is involved), we recommend upgrading
|
||||||
|
&repmgr; on the old server <emphasis>before</emphasis> running
|
||||||
|
<application>pg_upgrade</application> to ensure that old and new
|
||||||
|
versions are the same.
|
||||||
|
</para>
|
||||||
|
<note>
|
||||||
|
<simpara>
|
||||||
|
This issue applies to any PostgreSQL extension which has
|
||||||
|
dependencies on a shared library.
|
||||||
|
</simpara>
|
||||||
|
</note>
|
||||||
|
<para>
|
||||||
|
For further details please see the <ulink url="https://www.postgresql.org/docs/current/static/pgupgrade.html">pg_upgrade documentation</ulink>.
|
||||||
|
</para>
|
||||||
|
<para>
|
||||||
|
If replication slots are in use, bear in mind these will <emphasis>not</emphasis>
|
||||||
|
be recreated by <application>pg_upgrade</application>. These will need to
|
||||||
|
be recreated manually.
|
||||||
|
</para>
|
||||||
|
<tip>
|
||||||
|
<para>
|
||||||
|
Use <command><link linkend="repmgr-node-check">repmgr node check</link></command>
|
||||||
|
to determine which replacation slots need to be recreated.
|
||||||
|
</para>
|
||||||
|
</tip>
|
||||||
|
|
||||||
|
</sect1>
|
||||||
|
|
||||||
|
|
||||||
|
<sect1 id="upgrading-from-repmgr-3" xreflabel="Upgrading from repmgr 3.x">
|
||||||
|
<indexterm>
|
||||||
|
<primary>upgrading</primary>
|
||||||
|
<secondary>from repmgr 3.x</secondary>
|
||||||
|
</indexterm>
|
||||||
|
|
||||||
|
<title>Upgrading from repmgr 3.x</title>
|
||||||
<para>
|
<para>
|
||||||
The upgrade process consists of two steps:
|
The upgrade process consists of two steps:
|
||||||
<orderedlist>
|
<orderedlist>
|
||||||
@@ -29,7 +280,7 @@
|
|||||||
</listitem>
|
</listitem>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara>
|
<simpara>
|
||||||
upgrading the repmgr schema
|
upgrading the repmgr schema using <command>CREATE EXTENSION</command>
|
||||||
</simpara>
|
</simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
</orderedlist>
|
</orderedlist>
|
||||||
@@ -42,11 +293,19 @@
|
|||||||
a packaged PostgreSQL extension) is normally carried out
|
a packaged PostgreSQL extension) is normally carried out
|
||||||
automatically when the &repmgr; extension is created.
|
automatically when the &repmgr; extension is created.
|
||||||
</para>
|
</para>
|
||||||
|
<para>
|
||||||
|
The shared library has been renamed from <literal>repmgr_funcs</literal> to
|
||||||
|
<literal>repmgr</literal> - if it's set in <varname>shared_preload_libraries</varname>
|
||||||
|
in <filename>postgresql.conf</filename> it will need to be updated to the new name:
|
||||||
|
<programlisting>
|
||||||
|
shared_preload_libraries = 'repmgr'</programlisting>
|
||||||
|
</para>
|
||||||
|
|
||||||
<sect2 id="converting-repmgr-conf">
|
<sect2 id="converting-repmgr-conf">
|
||||||
<title>Converting repmgr.conf configuration files</title>
|
<title>Converting repmgr.conf configuration files</title>
|
||||||
<para>
|
<para>
|
||||||
With a completely new repmgr version, we've taken the opportunity
|
With a completely new repmgr version, we've taken the opportunity
|
||||||
to rename some configuration items have had their names changed for
|
to rename some configuration items for
|
||||||
clarity and consistency, both between the configuration file and
|
clarity and consistency, both between the configuration file and
|
||||||
the column names in <structname>repmgr.nodes</structname>
|
the column names in <structname>repmgr.nodes</structname>
|
||||||
(e.g. <varname>node</varname> to <varname>node_id</varname>), and
|
(e.g. <varname>node</varname> to <varname>node_id</varname>), and
|
||||||
@@ -72,7 +331,7 @@
|
|||||||
</listitem>
|
</listitem>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara><varname>monitoring_history</varname>: this replaces the
|
<simpara><varname>monitoring_history</varname>: this replaces the
|
||||||
<command>repmgrd</command> command line option
|
<application>repmgrd</application> command line option
|
||||||
<literal>--monitoring-history</literal></simpara>
|
<literal>--monitoring-history</literal></simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
</itemizedlist>
|
</itemizedlist>
|
||||||
@@ -106,6 +365,10 @@
|
|||||||
<entry><varname>logfile</varname></entry>
|
<entry><varname>logfile</varname></entry>
|
||||||
<entry><varname>log_file</varname></entry>
|
<entry><varname>log_file</varname></entry>
|
||||||
</row>
|
</row>
|
||||||
|
<row>
|
||||||
|
<entry><varname>barman_server</varname></entry>
|
||||||
|
<entry><varname>barman_host</varname></entry>
|
||||||
|
</row>
|
||||||
<row>
|
<row>
|
||||||
<entry><varname>master_reponse_timeout</varname></entry>
|
<entry><varname>master_reponse_timeout</varname></entry>
|
||||||
<entry><varname>async_query_timeout</varname></entry>
|
<entry><varname>async_query_timeout</varname></entry>
|
||||||
@@ -113,6 +376,16 @@
|
|||||||
</tbody>
|
</tbody>
|
||||||
</tgroup>
|
</tgroup>
|
||||||
</table>
|
</table>
|
||||||
|
<note>
|
||||||
|
<para>
|
||||||
|
From &repmgr; 4, <literal>barman_server</literal> refers
|
||||||
|
to the server configured in Barman (in &repmgr; 3, the deprecated
|
||||||
|
<literal>cluster</literal> parameter was used for this);
|
||||||
|
the physical Barman hostname is configured with
|
||||||
|
<literal>barman_host</literal> (see <xref linkend="cloning-from-barman-prerequisites">
|
||||||
|
for details).
|
||||||
|
</para>
|
||||||
|
</note>
|
||||||
<para>
|
<para>
|
||||||
Following parameters have been removed:
|
Following parameters have been removed:
|
||||||
<itemizedlist spacing="compact" mark="bullet">
|
<itemizedlist spacing="compact" mark="bullet">
|
||||||
@@ -121,7 +394,7 @@
|
|||||||
be ignored.</simpara>
|
be ignored.</simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
<listitem>
|
<listitem>
|
||||||
<simpara><varname>upstream_node_id</varname>: is replaced by the
|
<simpara><varname>upstream_node</varname>: is replaced by the
|
||||||
command-line parameter <literal>--upstream-node-id</literal></simpara>
|
command-line parameter <literal>--upstream-node-id</literal></simpara>
|
||||||
</listitem>
|
</listitem>
|
||||||
</itemizedlist>
|
</itemizedlist>
|
||||||
@@ -137,7 +410,7 @@
|
|||||||
$ ./convert-config.pl /etc/repmgr.conf
|
$ ./convert-config.pl /etc/repmgr.conf
|
||||||
node_id=2
|
node_id=2
|
||||||
node_name=node2
|
node_name=node2
|
||||||
conninfo=host=localhost dbname=repmgr user=repmgr connect_timeout=2
|
conninfo=host=node2 dbname=repmgr user=repmgr connect_timeout=2
|
||||||
pg_ctl_options='-l /var/log/postgres/startup.log'
|
pg_ctl_options='-l /var/log/postgres/startup.log'
|
||||||
rsync_options=--exclude=postgresql.local.conf --archive
|
rsync_options=--exclude=postgresql.local.conf --archive
|
||||||
log_level=INFO
|
log_level=INFO
|
||||||
@@ -149,21 +422,22 @@
|
|||||||
changed.
|
changed.
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
Please note that the parameter <varname>data_directory</varname> <emphasis>must</emphasis>
|
Please note that the the conversion script will add an empty
|
||||||
be provided; if not already present, the conversion script will add an empty
|
placeholder parameter for <varname>data_directory</varname>, which
|
||||||
placeholder parameter.
|
is a required parameter in repmgr4 and which <emphasis>must</emphasis>
|
||||||
|
be provided.
|
||||||
</para>
|
</para>
|
||||||
</sect3>
|
</sect3>
|
||||||
</sect2>
|
</sect2>
|
||||||
<sect2>
|
<sect2>
|
||||||
<title>Upgrading the repmgr schema</title>
|
<title>Upgrading the repmgr schema</title>
|
||||||
<para>
|
<para>
|
||||||
Ensure <command>repmgrd</command> is not running, or any cron jobs which execute the
|
Ensure <application>repmgrd</application> is not running, or any cron jobs which execute the
|
||||||
<command>repmgr</command> binary.
|
<command>repmgr</command> binary.
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
Install <literal>repmgr4</literal>; any <literal>repmgr3</literal> packages should be uninstalled
|
Install <literal>repmgr 4</literal> packages; any <literal>repmgr 3.x</literal> packages
|
||||||
(if not automatically uninstalled already).
|
should be uninstalled (if not automatically uninstalled already by your packaging system).
|
||||||
</para>
|
</para>
|
||||||
<sect3>
|
<sect3>
|
||||||
<title>Upgrading from repmgr 3.1.1 or earlier</title>
|
<title>Upgrading from repmgr 3.1.1 or earlier</title>
|
||||||
@@ -203,7 +477,8 @@
|
|||||||
</para>
|
</para>
|
||||||
<note>
|
<note>
|
||||||
<simpara>there must be only one schema matching <literal>repmgr_%</literal> in the
|
<simpara>there must be only one schema matching <literal>repmgr_%</literal> in the
|
||||||
database, otherwise this step may not work.</simpara>
|
database, otherwise this step may not work.
|
||||||
|
</simpara>
|
||||||
</note>
|
</note>
|
||||||
</sect3>
|
</sect3>
|
||||||
<sect3>
|
<sect3>
|
||||||
@@ -223,7 +498,7 @@
|
|||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
Check the data is updated as expected by examining the <structname>repmgr.nodes</structname>
|
Check the data is updated as expected by examining the <structname>repmgr.nodes</structname>
|
||||||
table; restart <command>repmgrd</command> if required.
|
table; restart <application>repmgrd</application> if required.
|
||||||
</para>
|
</para>
|
||||||
<para>
|
<para>
|
||||||
The original <literal>repmgr_$cluster</literal> schema can be dropped at any time.
|
The original <literal>repmgr_$cluster</literal> schema can be dropped at any time.
|
||||||
|
|||||||
@@ -1 +1 @@
|
|||||||
<!ENTITY repmgrversion "4.0dev">
|
<!ENTITY repmgrversion "4.2">
|
||||||
|
|||||||
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* errcode.h
|
* errcode.h
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
* Copyright (c) 2ndQuadrant, 2010-2018
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -43,5 +43,10 @@
|
|||||||
#define ERR_BARMAN 19
|
#define ERR_BARMAN 19
|
||||||
#define ERR_REGISTRATION_SYNC 20
|
#define ERR_REGISTRATION_SYNC 20
|
||||||
#define ERR_OUT_OF_MEMORY 21
|
#define ERR_OUT_OF_MEMORY 21
|
||||||
|
#define ERR_SWITCHOVER_INCOMPLETE 22
|
||||||
|
#define ERR_FOLLOW_FAIL 23
|
||||||
|
#define ERR_REJOIN_FAIL 24
|
||||||
|
#define ERR_NODE_STATUS 25
|
||||||
|
#define ERR_REPMGRD_PAUSE 26
|
||||||
|
|
||||||
#endif /* _ERRCODE_H_ */
|
#endif /* _ERRCODE_H_ */
|
||||||
|
|||||||
@@ -38,15 +38,15 @@ SELECT repmgr.am_bdr_failover_handler(-1);
|
|||||||
|
|
||||||
(1 row)
|
(1 row)
|
||||||
|
|
||||||
SELECT repmgr.get_new_primary();
|
SELECT repmgr.am_bdr_failover_handler(NULL);
|
||||||
get_new_primary
|
am_bdr_failover_handler
|
||||||
-----------------
|
-------------------------
|
||||||
|
|
||||||
(1 row)
|
(1 row)
|
||||||
|
|
||||||
SELECT repmgr.get_voting_status();
|
SELECT repmgr.get_new_primary();
|
||||||
get_voting_status
|
get_new_primary
|
||||||
-------------------
|
-----------------
|
||||||
|
|
||||||
(1 row)
|
(1 row)
|
||||||
|
|
||||||
@@ -56,15 +56,9 @@ SELECT repmgr.notify_follow_primary(-1);
|
|||||||
|
|
||||||
(1 row)
|
(1 row)
|
||||||
|
|
||||||
SELECT repmgr.other_node_is_candidate(-1,-1);
|
SELECT repmgr.notify_follow_primary(NULL);
|
||||||
other_node_is_candidate
|
notify_follow_primary
|
||||||
-------------------------
|
-----------------------
|
||||||
|
|
||||||
(1 row)
|
|
||||||
|
|
||||||
SELECT repmgr.request_vote(-1,-1);
|
|
||||||
request_vote
|
|
||||||
--------------
|
|
||||||
|
|
||||||
(1 row)
|
(1 row)
|
||||||
|
|
||||||
@@ -80,9 +74,9 @@ SELECT repmgr.set_local_node_id(-1);
|
|||||||
|
|
||||||
(1 row)
|
(1 row)
|
||||||
|
|
||||||
SELECT repmgr.set_voting_status_initiated();
|
SELECT repmgr.set_local_node_id(NULL);
|
||||||
set_voting_status_initiated
|
set_local_node_id
|
||||||
-----------------------------
|
-------------------
|
||||||
|
|
||||||
(1 row)
|
(1 row)
|
||||||
|
|
||||||
|
|||||||
21
log.c
21
log.c
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* log.c - Logging methods
|
* log.c - Logging methods
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
* Copyright (c) 2ndQuadrant, 2010-2018
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -42,7 +42,7 @@ _stderr_log_with_level(const char *level_name, int level, const char *fmt, va_li
|
|||||||
__attribute__((format(PG_PRINTF_ATTRIBUTE, 3, 0)));
|
__attribute__((format(PG_PRINTF_ATTRIBUTE, 3, 0)));
|
||||||
|
|
||||||
int log_type = REPMGR_STDERR;
|
int log_type = REPMGR_STDERR;
|
||||||
int log_level = LOG_NOTICE;
|
int log_level = LOG_INFO;
|
||||||
int last_log_level = LOG_INFO;
|
int last_log_level = LOG_INFO;
|
||||||
int verbose_logging = false;
|
int verbose_logging = false;
|
||||||
int terse_logging = false;
|
int terse_logging = false;
|
||||||
@@ -70,7 +70,7 @@ _stderr_log_with_level(const char *level_name, int level, const char *fmt, va_li
|
|||||||
|
|
||||||
/*
|
/*
|
||||||
* Store the requested level so that if there's a subsequent log_hint() or
|
* Store the requested level so that if there's a subsequent log_hint() or
|
||||||
* log_detail(), we can suppress that if appropriate.
|
* log_detail(), we can suppress that if --terse was specified,
|
||||||
*/
|
*/
|
||||||
last_log_level = level;
|
last_log_level = level;
|
||||||
|
|
||||||
@@ -329,6 +329,21 @@ logger_set_terse(void)
|
|||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
void
|
||||||
|
logger_set_level(int new_log_level)
|
||||||
|
{
|
||||||
|
log_level = new_log_level;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
void
|
||||||
|
logger_set_min_level(int min_log_level)
|
||||||
|
{
|
||||||
|
if (min_log_level > log_level)
|
||||||
|
log_level = min_log_level;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
int
|
int
|
||||||
detect_log_level(const char *level)
|
detect_log_level(const char *level)
|
||||||
{
|
{
|
||||||
|
|||||||
4
log.h
4
log.h
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* log.h
|
* log.h
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
* Copyright (c) 2ndQuadrant, 2010-2018
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -128,6 +128,8 @@ bool logger_shutdown(void);
|
|||||||
|
|
||||||
void logger_set_verbose(void);
|
void logger_set_verbose(void);
|
||||||
void logger_set_terse(void);
|
void logger_set_terse(void);
|
||||||
|
void logger_set_min_level(int min_log_level);
|
||||||
|
void logger_set_level(int new_log_level);
|
||||||
|
|
||||||
void
|
void
|
||||||
log_detail(const char *fmt,...)
|
log_detail(const char *fmt,...)
|
||||||
|
|||||||
2
repmgr--4.0--4.1.sql
Normal file
2
repmgr--4.0--4.1.sql
Normal file
@@ -0,0 +1,2 @@
|
|||||||
|
-- complain if script is sourced in psql, rather than via CREATE EXTENSION
|
||||||
|
\echo Use "CREATE EXTENSION repmgr" to load this file. \quit
|
||||||
@@ -6,7 +6,7 @@ CREATE TABLE repmgr.nodes (
|
|||||||
upstream_node_id INTEGER NULL REFERENCES nodes (node_id) DEFERRABLE,
|
upstream_node_id INTEGER NULL REFERENCES nodes (node_id) DEFERRABLE,
|
||||||
active BOOLEAN NOT NULL DEFAULT TRUE,
|
active BOOLEAN NOT NULL DEFAULT TRUE,
|
||||||
node_name TEXT NOT NULL,
|
node_name TEXT NOT NULL,
|
||||||
type TEXT NOT NULL CHECK (type IN('primary','standby','bdr')),
|
type TEXT NOT NULL CHECK (type IN('primary','standby','witness','bdr')),
|
||||||
location TEXT NOT NULL DEFAULT 'default',
|
location TEXT NOT NULL DEFAULT 'default',
|
||||||
priority INT NOT NULL DEFAULT 100,
|
priority INT NOT NULL DEFAULT 100,
|
||||||
conninfo TEXT NOT NULL,
|
conninfo TEXT NOT NULL,
|
||||||
@@ -79,6 +79,19 @@ LEFT JOIN repmgr.nodes un
|
|||||||
ON un.node_id = n.upstream_node_id;
|
ON un.node_id = n.upstream_node_id;
|
||||||
|
|
||||||
|
|
||||||
|
/* XXX update upgrade scripts! */
|
||||||
|
CREATE TABLE repmgr.voting_term (
|
||||||
|
term INT NOT NULL
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE UNIQUE INDEX voting_term_restrict
|
||||||
|
ON repmgr.voting_term ((TRUE));
|
||||||
|
|
||||||
|
CREATE RULE voting_term_delete AS
|
||||||
|
ON DELETE TO repmgr.voting_term
|
||||||
|
DO INSTEAD NOTHING;
|
||||||
|
|
||||||
|
|
||||||
/* ================= */
|
/* ================= */
|
||||||
/* repmgrd functions */
|
/* repmgrd functions */
|
||||||
/* ================= */
|
/* ================= */
|
||||||
@@ -90,6 +103,11 @@ CREATE FUNCTION set_local_node_id(INT)
|
|||||||
AS 'MODULE_PATHNAME', 'set_local_node_id'
|
AS 'MODULE_PATHNAME', 'set_local_node_id'
|
||||||
LANGUAGE C STRICT;
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION get_local_node_id()
|
||||||
|
RETURNS INT
|
||||||
|
AS 'MODULE_PATHNAME', 'get_local_node_id'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
CREATE FUNCTION standby_set_last_updated()
|
CREATE FUNCTION standby_set_last_updated()
|
||||||
RETURNS TIMESTAMP WITH TIME ZONE
|
RETURNS TIMESTAMP WITH TIME ZONE
|
||||||
AS 'MODULE_PATHNAME', 'standby_set_last_updated'
|
AS 'MODULE_PATHNAME', 'standby_set_last_updated'
|
||||||
@@ -102,49 +120,6 @@ CREATE FUNCTION standby_get_last_updated()
|
|||||||
|
|
||||||
/* failover functions */
|
/* failover functions */
|
||||||
|
|
||||||
|
|
||||||
DO $repmgr$
|
|
||||||
DECLARE
|
|
||||||
DECLARE server_version_num INT;
|
|
||||||
BEGIN
|
|
||||||
SELECT setting
|
|
||||||
FROM pg_catalog.pg_settings
|
|
||||||
WHERE name = 'server_version_num'
|
|
||||||
INTO server_version_num;
|
|
||||||
|
|
||||||
IF server_version_num >= 90400 THEN
|
|
||||||
EXECUTE $repmgr_func$
|
|
||||||
CREATE FUNCTION request_vote(INT,INT)
|
|
||||||
RETURNS pg_lsn
|
|
||||||
AS 'MODULE_PATHNAME', 'request_vote'
|
|
||||||
LANGUAGE C STRICT;
|
|
||||||
$repmgr_func$;
|
|
||||||
ELSE
|
|
||||||
EXECUTE $repmgr_func$
|
|
||||||
CREATE FUNCTION request_vote(INT,INT)
|
|
||||||
RETURNS TEXT
|
|
||||||
AS 'MODULE_PATHNAME', 'request_vote'
|
|
||||||
LANGUAGE C STRICT;
|
|
||||||
$repmgr_func$;
|
|
||||||
END IF;
|
|
||||||
END$repmgr$;
|
|
||||||
|
|
||||||
|
|
||||||
CREATE FUNCTION get_voting_status()
|
|
||||||
RETURNS INT
|
|
||||||
AS 'MODULE_PATHNAME', 'get_voting_status'
|
|
||||||
LANGUAGE C STRICT;
|
|
||||||
|
|
||||||
CREATE FUNCTION set_voting_status_initiated()
|
|
||||||
RETURNS INT
|
|
||||||
AS 'MODULE_PATHNAME', 'set_voting_status_initiated'
|
|
||||||
LANGUAGE C STRICT;
|
|
||||||
|
|
||||||
CREATE FUNCTION other_node_is_candidate(INT, INT)
|
|
||||||
RETURNS BOOL
|
|
||||||
AS 'MODULE_PATHNAME', 'other_node_is_candidate'
|
|
||||||
LANGUAGE C STRICT;
|
|
||||||
|
|
||||||
CREATE FUNCTION notify_follow_primary(INT)
|
CREATE FUNCTION notify_follow_primary(INT)
|
||||||
RETURNS VOID
|
RETURNS VOID
|
||||||
AS 'MODULE_PATHNAME', 'notify_follow_primary'
|
AS 'MODULE_PATHNAME', 'notify_follow_primary'
|
||||||
@@ -160,13 +135,11 @@ CREATE FUNCTION reset_voting_status()
|
|||||||
AS 'MODULE_PATHNAME', 'reset_voting_status'
|
AS 'MODULE_PATHNAME', 'reset_voting_status'
|
||||||
LANGUAGE C STRICT;
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
|
||||||
CREATE FUNCTION am_bdr_failover_handler(INT)
|
CREATE FUNCTION am_bdr_failover_handler(INT)
|
||||||
RETURNS BOOL
|
RETURNS BOOL
|
||||||
AS 'MODULE_PATHNAME', 'am_bdr_failover_handler'
|
AS 'MODULE_PATHNAME', 'am_bdr_failover_handler'
|
||||||
LANGUAGE C STRICT;
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
|
||||||
CREATE FUNCTION unset_bdr_failover_handler()
|
CREATE FUNCTION unset_bdr_failover_handler()
|
||||||
RETURNS VOID
|
RETURNS VOID
|
||||||
AS 'MODULE_PATHNAME', 'unset_bdr_failover_handler'
|
AS 'MODULE_PATHNAME', 'unset_bdr_failover_handler'
|
||||||
|
|||||||
32
repmgr--4.1--4.2.sql
Normal file
32
repmgr--4.1--4.2.sql
Normal file
@@ -0,0 +1,32 @@
|
|||||||
|
-- complain if script is sourced in psql, rather than via CREATE EXTENSION
|
||||||
|
\echo Use "CREATE EXTENSION repmgr" to load this file. \quit
|
||||||
|
|
||||||
|
CREATE FUNCTION get_repmgrd_pid()
|
||||||
|
RETURNS INT
|
||||||
|
AS 'MODULE_PATHNAME', 'get_repmgrd_pid'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION get_repmgrd_pidfile()
|
||||||
|
RETURNS TEXT
|
||||||
|
AS 'MODULE_PATHNAME', 'get_repmgrd_pidfile'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION set_repmgrd_pid(INT, TEXT)
|
||||||
|
RETURNS VOID
|
||||||
|
AS 'MODULE_PATHNAME', 'set_repmgrd_pid'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION repmgrd_is_running()
|
||||||
|
RETURNS BOOL
|
||||||
|
AS 'MODULE_PATHNAME', 'repmgrd_is_running'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION repmgrd_pause(BOOL)
|
||||||
|
RETURNS VOID
|
||||||
|
AS 'MODULE_PATHNAME', 'repmgrd_pause'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION repmgrd_is_paused()
|
||||||
|
RETURNS BOOL
|
||||||
|
AS 'MODULE_PATHNAME', 'repmgrd_is_paused'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
166
repmgr--4.1.sql
Normal file
166
repmgr--4.1.sql
Normal file
@@ -0,0 +1,166 @@
|
|||||||
|
-- complain if script is sourced in psql, rather than via CREATE EXTENSION
|
||||||
|
\echo Use "CREATE EXTENSION repmgr" to load this file. \quit
|
||||||
|
|
||||||
|
CREATE TABLE repmgr.nodes (
|
||||||
|
node_id INTEGER PRIMARY KEY,
|
||||||
|
upstream_node_id INTEGER NULL REFERENCES nodes (node_id) DEFERRABLE,
|
||||||
|
active BOOLEAN NOT NULL DEFAULT TRUE,
|
||||||
|
node_name TEXT NOT NULL,
|
||||||
|
type TEXT NOT NULL CHECK (type IN('primary','standby','witness','bdr')),
|
||||||
|
location TEXT NOT NULL DEFAULT 'default',
|
||||||
|
priority INT NOT NULL DEFAULT 100,
|
||||||
|
conninfo TEXT NOT NULL,
|
||||||
|
repluser VARCHAR(63) NOT NULL,
|
||||||
|
slot_name TEXT NULL,
|
||||||
|
config_file TEXT NOT NULL
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE repmgr.events (
|
||||||
|
node_id INTEGER NOT NULL,
|
||||||
|
event TEXT NOT NULL,
|
||||||
|
successful BOOLEAN NOT NULL DEFAULT TRUE,
|
||||||
|
event_timestamp TIMESTAMP WITH TIME ZONE NOT NULL DEFAULT CURRENT_TIMESTAMP,
|
||||||
|
details TEXT NULL
|
||||||
|
);
|
||||||
|
|
||||||
|
DO $repmgr$
|
||||||
|
DECLARE
|
||||||
|
DECLARE server_version_num INT;
|
||||||
|
BEGIN
|
||||||
|
SELECT setting
|
||||||
|
FROM pg_catalog.pg_settings
|
||||||
|
WHERE name = 'server_version_num'
|
||||||
|
INTO server_version_num;
|
||||||
|
IF server_version_num >= 90400 THEN
|
||||||
|
EXECUTE $repmgr_func$
|
||||||
|
CREATE TABLE repmgr.monitoring_history (
|
||||||
|
primary_node_id INTEGER NOT NULL,
|
||||||
|
standby_node_id INTEGER NOT NULL,
|
||||||
|
last_monitor_time TIMESTAMP WITH TIME ZONE NOT NULL,
|
||||||
|
last_apply_time TIMESTAMP WITH TIME ZONE,
|
||||||
|
last_wal_primary_location PG_LSN NOT NULL,
|
||||||
|
last_wal_standby_location PG_LSN,
|
||||||
|
replication_lag BIGINT NOT NULL,
|
||||||
|
apply_lag BIGINT NOT NULL
|
||||||
|
)
|
||||||
|
$repmgr_func$;
|
||||||
|
ELSE
|
||||||
|
EXECUTE $repmgr_func$
|
||||||
|
CREATE TABLE repmgr.monitoring_history (
|
||||||
|
primary_node_id INTEGER NOT NULL,
|
||||||
|
standby_node_id INTEGER NOT NULL,
|
||||||
|
last_monitor_time TIMESTAMP WITH TIME ZONE NOT NULL,
|
||||||
|
last_apply_time TIMESTAMP WITH TIME ZONE,
|
||||||
|
last_wal_primary_location TEXT NOT NULL,
|
||||||
|
last_wal_standby_location TEXT,
|
||||||
|
replication_lag BIGINT NOT NULL,
|
||||||
|
apply_lag BIGINT NOT NULL
|
||||||
|
)
|
||||||
|
$repmgr_func$;
|
||||||
|
END IF;
|
||||||
|
END$repmgr$;
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
CREATE INDEX idx_monitoring_history_time
|
||||||
|
ON repmgr.monitoring_history (last_monitor_time, standby_node_id);
|
||||||
|
|
||||||
|
CREATE VIEW repmgr.show_nodes AS
|
||||||
|
SELECT n.node_id,
|
||||||
|
n.node_name,
|
||||||
|
n.active,
|
||||||
|
n.upstream_node_id,
|
||||||
|
un.node_name AS upstream_node_name,
|
||||||
|
n.type,
|
||||||
|
n.priority,
|
||||||
|
n.conninfo
|
||||||
|
FROM repmgr.nodes n
|
||||||
|
LEFT JOIN repmgr.nodes un
|
||||||
|
ON un.node_id = n.upstream_node_id;
|
||||||
|
|
||||||
|
|
||||||
|
/* XXX update upgrade scripts! */
|
||||||
|
CREATE TABLE repmgr.voting_term (
|
||||||
|
term INT NOT NULL
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE UNIQUE INDEX voting_term_restrict
|
||||||
|
ON repmgr.voting_term ((TRUE));
|
||||||
|
|
||||||
|
CREATE RULE voting_term_delete AS
|
||||||
|
ON DELETE TO repmgr.voting_term
|
||||||
|
DO INSTEAD NOTHING;
|
||||||
|
|
||||||
|
|
||||||
|
/* ================= */
|
||||||
|
/* repmgrd functions */
|
||||||
|
/* ================= */
|
||||||
|
|
||||||
|
/* monitoring functions */
|
||||||
|
|
||||||
|
CREATE FUNCTION set_local_node_id(INT)
|
||||||
|
RETURNS VOID
|
||||||
|
AS 'MODULE_PATHNAME', 'set_local_node_id'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION get_local_node_id()
|
||||||
|
RETURNS INT
|
||||||
|
AS 'MODULE_PATHNAME', 'get_local_node_id'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION standby_set_last_updated()
|
||||||
|
RETURNS TIMESTAMP WITH TIME ZONE
|
||||||
|
AS 'MODULE_PATHNAME', 'standby_set_last_updated'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION standby_get_last_updated()
|
||||||
|
RETURNS TIMESTAMP WITH TIME ZONE
|
||||||
|
AS 'MODULE_PATHNAME', 'standby_get_last_updated'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
/* failover functions */
|
||||||
|
|
||||||
|
CREATE FUNCTION notify_follow_primary(INT)
|
||||||
|
RETURNS VOID
|
||||||
|
AS 'MODULE_PATHNAME', 'notify_follow_primary'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION get_new_primary()
|
||||||
|
RETURNS INT
|
||||||
|
AS 'MODULE_PATHNAME', 'get_new_primary'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION reset_voting_status()
|
||||||
|
RETURNS VOID
|
||||||
|
AS 'MODULE_PATHNAME', 'reset_voting_status'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION am_bdr_failover_handler(INT)
|
||||||
|
RETURNS BOOL
|
||||||
|
AS 'MODULE_PATHNAME', 'am_bdr_failover_handler'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION unset_bdr_failover_handler()
|
||||||
|
RETURNS VOID
|
||||||
|
AS 'MODULE_PATHNAME', 'unset_bdr_failover_handler'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE VIEW repmgr.replication_status AS
|
||||||
|
SELECT m.primary_node_id, m.standby_node_id, n.node_name AS standby_name,
|
||||||
|
n.type AS node_type, n.active, last_monitor_time,
|
||||||
|
CASE WHEN n.type='standby' THEN m.last_wal_primary_location ELSE NULL END AS last_wal_primary_location,
|
||||||
|
m.last_wal_standby_location,
|
||||||
|
CASE WHEN n.type='standby' THEN pg_catalog.pg_size_pretty(m.replication_lag) ELSE NULL END AS replication_lag,
|
||||||
|
CASE WHEN n.type='standby' THEN
|
||||||
|
CASE WHEN replication_lag > 0 THEN age(now(), m.last_apply_time) ELSE '0'::INTERVAL END
|
||||||
|
ELSE NULL
|
||||||
|
END AS replication_time_lag,
|
||||||
|
CASE WHEN n.type='standby' THEN pg_catalog.pg_size_pretty(m.apply_lag) ELSE NULL END AS apply_lag,
|
||||||
|
AGE(NOW(), CASE WHEN pg_catalog.pg_is_in_recovery() THEN repmgr.standby_get_last_updated() ELSE m.last_monitor_time END) AS communication_time_lag
|
||||||
|
FROM repmgr.monitoring_history m
|
||||||
|
JOIN repmgr.nodes n ON m.standby_node_id = n.node_id
|
||||||
|
WHERE (m.standby_node_id, m.last_monitor_time) IN (
|
||||||
|
SELECT m1.standby_node_id, MAX(m1.last_monitor_time)
|
||||||
|
FROM repmgr.monitoring_history m1 GROUP BY 1
|
||||||
|
);
|
||||||
|
|
||||||
197
repmgr--4.2.sql
Normal file
197
repmgr--4.2.sql
Normal file
@@ -0,0 +1,197 @@
|
|||||||
|
-- complain if script is sourced in psql, rather than via CREATE EXTENSION
|
||||||
|
\echo Use "CREATE EXTENSION repmgr" to load this file. \quit
|
||||||
|
|
||||||
|
CREATE TABLE repmgr.nodes (
|
||||||
|
node_id INTEGER PRIMARY KEY,
|
||||||
|
upstream_node_id INTEGER NULL REFERENCES nodes (node_id) DEFERRABLE,
|
||||||
|
active BOOLEAN NOT NULL DEFAULT TRUE,
|
||||||
|
node_name TEXT NOT NULL,
|
||||||
|
type TEXT NOT NULL CHECK (type IN('primary','standby','witness','bdr')),
|
||||||
|
location TEXT NOT NULL DEFAULT 'default',
|
||||||
|
priority INT NOT NULL DEFAULT 100,
|
||||||
|
conninfo TEXT NOT NULL,
|
||||||
|
repluser VARCHAR(63) NOT NULL,
|
||||||
|
slot_name TEXT NULL,
|
||||||
|
config_file TEXT NOT NULL
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE TABLE repmgr.events (
|
||||||
|
node_id INTEGER NOT NULL,
|
||||||
|
event TEXT NOT NULL,
|
||||||
|
successful BOOLEAN NOT NULL DEFAULT TRUE,
|
||||||
|
event_timestamp TIMESTAMP WITH TIME ZONE NOT NULL DEFAULT CURRENT_TIMESTAMP,
|
||||||
|
details TEXT NULL
|
||||||
|
);
|
||||||
|
|
||||||
|
DO $repmgr$
|
||||||
|
DECLARE
|
||||||
|
DECLARE server_version_num INT;
|
||||||
|
BEGIN
|
||||||
|
SELECT setting
|
||||||
|
FROM pg_catalog.pg_settings
|
||||||
|
WHERE name = 'server_version_num'
|
||||||
|
INTO server_version_num;
|
||||||
|
IF server_version_num >= 90400 THEN
|
||||||
|
EXECUTE $repmgr_func$
|
||||||
|
CREATE TABLE repmgr.monitoring_history (
|
||||||
|
primary_node_id INTEGER NOT NULL,
|
||||||
|
standby_node_id INTEGER NOT NULL,
|
||||||
|
last_monitor_time TIMESTAMP WITH TIME ZONE NOT NULL,
|
||||||
|
last_apply_time TIMESTAMP WITH TIME ZONE,
|
||||||
|
last_wal_primary_location PG_LSN NOT NULL,
|
||||||
|
last_wal_standby_location PG_LSN,
|
||||||
|
replication_lag BIGINT NOT NULL,
|
||||||
|
apply_lag BIGINT NOT NULL
|
||||||
|
)
|
||||||
|
$repmgr_func$;
|
||||||
|
ELSE
|
||||||
|
EXECUTE $repmgr_func$
|
||||||
|
CREATE TABLE repmgr.monitoring_history (
|
||||||
|
primary_node_id INTEGER NOT NULL,
|
||||||
|
standby_node_id INTEGER NOT NULL,
|
||||||
|
last_monitor_time TIMESTAMP WITH TIME ZONE NOT NULL,
|
||||||
|
last_apply_time TIMESTAMP WITH TIME ZONE,
|
||||||
|
last_wal_primary_location TEXT NOT NULL,
|
||||||
|
last_wal_standby_location TEXT,
|
||||||
|
replication_lag BIGINT NOT NULL,
|
||||||
|
apply_lag BIGINT NOT NULL
|
||||||
|
)
|
||||||
|
$repmgr_func$;
|
||||||
|
END IF;
|
||||||
|
END$repmgr$;
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
CREATE INDEX idx_monitoring_history_time
|
||||||
|
ON repmgr.monitoring_history (last_monitor_time, standby_node_id);
|
||||||
|
|
||||||
|
CREATE VIEW repmgr.show_nodes AS
|
||||||
|
SELECT n.node_id,
|
||||||
|
n.node_name,
|
||||||
|
n.active,
|
||||||
|
n.upstream_node_id,
|
||||||
|
un.node_name AS upstream_node_name,
|
||||||
|
n.type,
|
||||||
|
n.priority,
|
||||||
|
n.conninfo
|
||||||
|
FROM repmgr.nodes n
|
||||||
|
LEFT JOIN repmgr.nodes un
|
||||||
|
ON un.node_id = n.upstream_node_id;
|
||||||
|
|
||||||
|
|
||||||
|
/* XXX update upgrade scripts! */
|
||||||
|
CREATE TABLE repmgr.voting_term (
|
||||||
|
term INT NOT NULL
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE UNIQUE INDEX voting_term_restrict
|
||||||
|
ON repmgr.voting_term ((TRUE));
|
||||||
|
|
||||||
|
CREATE RULE voting_term_delete AS
|
||||||
|
ON DELETE TO repmgr.voting_term
|
||||||
|
DO INSTEAD NOTHING;
|
||||||
|
|
||||||
|
|
||||||
|
/* ================= */
|
||||||
|
/* repmgrd functions */
|
||||||
|
/* ================= */
|
||||||
|
|
||||||
|
/* monitoring functions */
|
||||||
|
|
||||||
|
CREATE FUNCTION set_local_node_id(INT)
|
||||||
|
RETURNS VOID
|
||||||
|
AS 'MODULE_PATHNAME', 'set_local_node_id'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION get_local_node_id()
|
||||||
|
RETURNS INT
|
||||||
|
AS 'MODULE_PATHNAME', 'get_local_node_id'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION standby_set_last_updated()
|
||||||
|
RETURNS TIMESTAMP WITH TIME ZONE
|
||||||
|
AS 'MODULE_PATHNAME', 'standby_set_last_updated'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION standby_get_last_updated()
|
||||||
|
RETURNS TIMESTAMP WITH TIME ZONE
|
||||||
|
AS 'MODULE_PATHNAME', 'standby_get_last_updated'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
/* failover functions */
|
||||||
|
|
||||||
|
CREATE FUNCTION notify_follow_primary(INT)
|
||||||
|
RETURNS VOID
|
||||||
|
AS 'MODULE_PATHNAME', 'notify_follow_primary'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION get_new_primary()
|
||||||
|
RETURNS INT
|
||||||
|
AS 'MODULE_PATHNAME', 'get_new_primary'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION reset_voting_status()
|
||||||
|
RETURNS VOID
|
||||||
|
AS 'MODULE_PATHNAME', 'reset_voting_status'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION am_bdr_failover_handler(INT)
|
||||||
|
RETURNS BOOL
|
||||||
|
AS 'MODULE_PATHNAME', 'am_bdr_failover_handler'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION unset_bdr_failover_handler()
|
||||||
|
RETURNS VOID
|
||||||
|
AS 'MODULE_PATHNAME', 'unset_bdr_failover_handler'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION get_repmgrd_pid()
|
||||||
|
RETURNS INT
|
||||||
|
AS 'MODULE_PATHNAME', 'get_repmgrd_pid'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION get_repmgrd_pidfile()
|
||||||
|
RETURNS TEXT
|
||||||
|
AS 'MODULE_PATHNAME', 'get_repmgrd_pidfile'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION set_repmgrd_pid(INT, TEXT)
|
||||||
|
RETURNS VOID
|
||||||
|
AS 'MODULE_PATHNAME', 'set_repmgrd_pid'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION repmgrd_is_running()
|
||||||
|
RETURNS BOOL
|
||||||
|
AS 'MODULE_PATHNAME', 'repmgrd_is_running'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION repmgrd_pause(BOOL)
|
||||||
|
RETURNS VOID
|
||||||
|
AS 'MODULE_PATHNAME', 'repmgrd_pause'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION repmgrd_is_paused()
|
||||||
|
RETURNS BOOL
|
||||||
|
AS 'MODULE_PATHNAME', 'repmgrd_is_paused'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
|
||||||
|
CREATE VIEW repmgr.replication_status AS
|
||||||
|
SELECT m.primary_node_id, m.standby_node_id, n.node_name AS standby_name,
|
||||||
|
n.type AS node_type, n.active, last_monitor_time,
|
||||||
|
CASE WHEN n.type='standby' THEN m.last_wal_primary_location ELSE NULL END AS last_wal_primary_location,
|
||||||
|
m.last_wal_standby_location,
|
||||||
|
CASE WHEN n.type='standby' THEN pg_catalog.pg_size_pretty(m.replication_lag) ELSE NULL END AS replication_lag,
|
||||||
|
CASE WHEN n.type='standby' THEN
|
||||||
|
CASE WHEN replication_lag > 0 THEN age(now(), m.last_apply_time) ELSE '0'::INTERVAL END
|
||||||
|
ELSE NULL
|
||||||
|
END AS replication_time_lag,
|
||||||
|
CASE WHEN n.type='standby' THEN pg_catalog.pg_size_pretty(m.apply_lag) ELSE NULL END AS apply_lag,
|
||||||
|
AGE(NOW(), CASE WHEN pg_catalog.pg_is_in_recovery() THEN repmgr.standby_get_last_updated() ELSE m.last_monitor_time END) AS communication_time_lag
|
||||||
|
FROM repmgr.monitoring_history m
|
||||||
|
JOIN repmgr.nodes n ON m.standby_node_id = n.node_id
|
||||||
|
WHERE (m.standby_node_id, m.last_monitor_time) IN (
|
||||||
|
SELECT m1.standby_node_id, MAX(m1.last_monitor_time)
|
||||||
|
FROM repmgr.monitoring_history m1 GROUP BY 1
|
||||||
|
);
|
||||||
|
|
||||||
@@ -32,7 +32,7 @@ CREATE TABLE repmgr.nodes (
|
|||||||
upstream_node_id INTEGER NULL REFERENCES repmgr.nodes (node_id) DEFERRABLE,
|
upstream_node_id INTEGER NULL REFERENCES repmgr.nodes (node_id) DEFERRABLE,
|
||||||
active BOOLEAN NOT NULL DEFAULT TRUE,
|
active BOOLEAN NOT NULL DEFAULT TRUE,
|
||||||
node_name TEXT NOT NULL,
|
node_name TEXT NOT NULL,
|
||||||
type TEXT NOT NULL CHECK (type IN('primary','standby','bdr')),
|
type TEXT NOT NULL CHECK (type IN('primary','standby','witness','bdr')),
|
||||||
location TEXT NOT NULL DEFAULT 'default',
|
location TEXT NOT NULL DEFAULT 'default',
|
||||||
priority INT NOT NULL DEFAULT 100,
|
priority INT NOT NULL DEFAULT 100,
|
||||||
conninfo TEXT NOT NULL,
|
conninfo TEXT NOT NULL,
|
||||||
@@ -54,8 +54,34 @@ SELECT id, upstream_node_id, active, name,
|
|||||||
|
|
||||||
ALTER TABLE repmgr.repl_events RENAME TO events;
|
ALTER TABLE repmgr.repl_events RENAME TO events;
|
||||||
|
|
||||||
|
-- create new table "repmgr.voting_term"
|
||||||
|
CREATE TABLE repmgr.voting_term (
|
||||||
|
term INT NOT NULL
|
||||||
|
);
|
||||||
|
|
||||||
|
CREATE UNIQUE INDEX voting_term_restrict
|
||||||
|
ON repmgr.voting_term ((TRUE));
|
||||||
|
|
||||||
|
CREATE RULE voting_term_delete AS
|
||||||
|
ON DELETE TO repmgr.voting_term
|
||||||
|
DO INSTEAD NOTHING;
|
||||||
|
|
||||||
|
INSERT INTO repmgr.voting_term (term) VALUES (1);
|
||||||
|
|
||||||
|
|
||||||
-- convert "repmgr_$cluster.repl_monitor" to "monitoring_history"
|
-- convert "repmgr_$cluster.repl_monitor" to "monitoring_history"
|
||||||
|
|
||||||
|
|
||||||
|
DO $repmgr$
|
||||||
|
DECLARE
|
||||||
|
DECLARE server_version_num INT;
|
||||||
|
BEGIN
|
||||||
|
SELECT setting
|
||||||
|
FROM pg_catalog.pg_settings
|
||||||
|
WHERE name = 'server_version_num'
|
||||||
|
INTO server_version_num;
|
||||||
|
IF server_version_num >= 90400 THEN
|
||||||
|
EXECUTE $repmgr_func$
|
||||||
CREATE TABLE repmgr.monitoring_history (
|
CREATE TABLE repmgr.monitoring_history (
|
||||||
primary_node_id INTEGER NOT NULL,
|
primary_node_id INTEGER NOT NULL,
|
||||||
standby_node_id INTEGER NOT NULL,
|
standby_node_id INTEGER NOT NULL,
|
||||||
@@ -65,12 +91,32 @@ CREATE TABLE repmgr.monitoring_history (
|
|||||||
last_wal_standby_location PG_LSN,
|
last_wal_standby_location PG_LSN,
|
||||||
replication_lag BIGINT NOT NULL,
|
replication_lag BIGINT NOT NULL,
|
||||||
apply_lag BIGINT NOT NULL
|
apply_lag BIGINT NOT NULL
|
||||||
);
|
)
|
||||||
|
$repmgr_func$;
|
||||||
|
INSERT INTO repmgr.monitoring_history
|
||||||
|
(primary_node_id, standby_node_id, last_monitor_time, last_apply_time, last_wal_primary_location, last_wal_standby_location, replication_lag, apply_lag)
|
||||||
|
SELECT primary_node, standby_node, last_monitor_time, last_apply_time, last_wal_primary_location::pg_lsn, last_wal_standby_location::pg_lsn, replication_lag, apply_lag
|
||||||
|
FROM repmgr.repl_monitor;
|
||||||
|
ELSE
|
||||||
|
EXECUTE $repmgr_func$
|
||||||
|
CREATE TABLE repmgr.monitoring_history (
|
||||||
|
primary_node_id INTEGER NOT NULL,
|
||||||
|
standby_node_id INTEGER NOT NULL,
|
||||||
|
last_monitor_time TIMESTAMP WITH TIME ZONE NOT NULL,
|
||||||
|
last_apply_time TIMESTAMP WITH TIME ZONE,
|
||||||
|
last_wal_primary_location TEXT NOT NULL,
|
||||||
|
last_wal_standby_location TEXT,
|
||||||
|
replication_lag BIGINT NOT NULL,
|
||||||
|
apply_lag BIGINT NOT NULL
|
||||||
|
)
|
||||||
|
$repmgr_func$;
|
||||||
|
INSERT INTO repmgr.monitoring_history
|
||||||
|
(primary_node_id, standby_node_id, last_monitor_time, last_apply_time, last_wal_primary_location, last_wal_standby_location, replication_lag, apply_lag)
|
||||||
|
SELECT primary_node, standby_node, last_monitor_time, last_apply_time, last_wal_primary_location, last_wal_standby_location, replication_lag, apply_lag
|
||||||
|
FROM repmgr.repl_monitor;
|
||||||
|
|
||||||
INSERT INTO repmgr.monitoring_history
|
END IF;
|
||||||
(primary_node_id, standby_node_id, last_monitor_time, last_apply_time, last_wal_primary_location, last_wal_standby_location, replication_lag, apply_lag)
|
END$repmgr$;
|
||||||
SELECT primary_node, standby_node, last_monitor_time, last_apply_time, last_wal_primary_location::pg_lsn, last_wal_standby_location::pg_lsn, replication_lag, apply_lag
|
|
||||||
FROM repmgr.repl_monitor;
|
|
||||||
|
|
||||||
CREATE INDEX idx_monitoring_history_time
|
CREATE INDEX idx_monitoring_history_time
|
||||||
ON repmgr.monitoring_history (last_monitor_time, standby_node_id);
|
ON repmgr.monitoring_history (last_monitor_time, standby_node_id);
|
||||||
@@ -95,6 +141,16 @@ LEFT JOIN repmgr.nodes un
|
|||||||
|
|
||||||
/* monitoring functions */
|
/* monitoring functions */
|
||||||
|
|
||||||
|
CREATE FUNCTION set_local_node_id(INT)
|
||||||
|
RETURNS VOID
|
||||||
|
AS 'MODULE_PATHNAME', 'set_local_node_id'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
|
CREATE FUNCTION get_local_node_id()
|
||||||
|
RETURNS INT
|
||||||
|
AS 'MODULE_PATHNAME', 'get_local_node_id'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
|
||||||
CREATE FUNCTION standby_set_last_updated()
|
CREATE FUNCTION standby_set_last_updated()
|
||||||
RETURNS TIMESTAMP WITH TIME ZONE
|
RETURNS TIMESTAMP WITH TIME ZONE
|
||||||
AS '$libdir/repmgr', 'standby_set_last_updated'
|
AS '$libdir/repmgr', 'standby_set_last_updated'
|
||||||
@@ -108,26 +164,6 @@ CREATE FUNCTION standby_get_last_updated()
|
|||||||
|
|
||||||
/* failover functions */
|
/* failover functions */
|
||||||
|
|
||||||
CREATE FUNCTION request_vote(INT,INT)
|
|
||||||
RETURNS pg_lsn
|
|
||||||
AS '$libdir/repmgr', 'request_vote'
|
|
||||||
LANGUAGE C STRICT;
|
|
||||||
|
|
||||||
CREATE FUNCTION get_voting_status()
|
|
||||||
RETURNS INT
|
|
||||||
AS '$libdir/repmgr', 'get_voting_status'
|
|
||||||
LANGUAGE C STRICT;
|
|
||||||
|
|
||||||
CREATE FUNCTION set_voting_status_initiated()
|
|
||||||
RETURNS INT
|
|
||||||
AS '$libdir/repmgr', 'set_voting_status_initiated'
|
|
||||||
LANGUAGE C STRICT;
|
|
||||||
|
|
||||||
CREATE FUNCTION other_node_is_candidate(INT, INT)
|
|
||||||
RETURNS BOOL
|
|
||||||
AS '$libdir/repmgr', 'other_node_is_candidate'
|
|
||||||
LANGUAGE C STRICT;
|
|
||||||
|
|
||||||
CREATE FUNCTION notify_follow_primary(INT)
|
CREATE FUNCTION notify_follow_primary(INT)
|
||||||
RETURNS VOID
|
RETURNS VOID
|
||||||
AS '$libdir/repmgr', 'notify_follow_primary'
|
AS '$libdir/repmgr', 'notify_follow_primary'
|
||||||
|
|||||||
@@ -1,9 +1,9 @@
|
|||||||
/*
|
/*
|
||||||
* repmgr-action-standby.c
|
* repmgr-action-bdr.c
|
||||||
*
|
*
|
||||||
* Implements BDR-related actions for the repmgr command line utility
|
* Implements BDR-related actions for the repmgr command line utility
|
||||||
*
|
*
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
* Copyright (c) 2ndQuadrant, 2010-2018
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -28,7 +28,7 @@
|
|||||||
/*
|
/*
|
||||||
* do_bdr_register()
|
* do_bdr_register()
|
||||||
*
|
*
|
||||||
* As each BDR node is its own master, registering a BDR node
|
* As each BDR node is its own primary, registering a BDR node
|
||||||
* will create the repmgr metadata schema if necessary.
|
* will create the repmgr metadata schema if necessary.
|
||||||
*/
|
*/
|
||||||
void
|
void
|
||||||
@@ -83,16 +83,49 @@ do_bdr_register(void)
|
|||||||
exit(ERR_BAD_CONFIG);
|
exit(ERR_BAD_CONFIG);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (bdr_nodes.node_count > 2)
|
/* BDR 2 implementation is for 2 nodes only */
|
||||||
|
if (get_bdr_version_num() < 3 && bdr_nodes.node_count > 2)
|
||||||
{
|
{
|
||||||
log_error(_("repmgr can only support BDR clusters with 2 nodes"));
|
log_error(_("repmgr can only support BDR 2.x clusters with 2 nodes"));
|
||||||
log_detail(_("this BDR cluster has %i nodes"), bdr_nodes.node_count);
|
log_detail(_("this BDR cluster has %i nodes"), bdr_nodes.node_count);
|
||||||
PQfinish(conn);
|
PQfinish(conn);
|
||||||
pfree(dbname);
|
pfree(dbname);
|
||||||
exit(ERR_BAD_CONFIG);
|
exit(ERR_BAD_CONFIG);
|
||||||
}
|
}
|
||||||
|
|
||||||
/* check whether repmgr extension exists, and that any other nodes are BDR */
|
/* check for a matching BDR node */
|
||||||
|
{
|
||||||
|
PQExpBufferData bdr_local_node_name;
|
||||||
|
bool node_match = false;
|
||||||
|
|
||||||
|
initPQExpBuffer(&bdr_local_node_name);
|
||||||
|
node_match = bdr_node_name_matches(conn, config_file_options.node_name, &bdr_local_node_name);
|
||||||
|
|
||||||
|
if (node_match == false)
|
||||||
|
{
|
||||||
|
if (strlen(bdr_local_node_name.data))
|
||||||
|
{
|
||||||
|
log_error(_("local node BDR node name is \"%s\", expected: \"%s\""),
|
||||||
|
bdr_local_node_name.data,
|
||||||
|
config_file_options.node_name);
|
||||||
|
log_hint(_("\"node_name\" in repmgr.conf must match \"node_name\" in bdr.bdr_nodes"));
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
log_error(_("local node does not report BDR node name"));
|
||||||
|
log_hint(_("ensure this is an active BDR node"));
|
||||||
|
}
|
||||||
|
|
||||||
|
PQfinish(conn);
|
||||||
|
pfree(dbname);
|
||||||
|
termPQExpBuffer(&bdr_local_node_name);
|
||||||
|
exit(ERR_BAD_CONFIG);
|
||||||
|
}
|
||||||
|
|
||||||
|
termPQExpBuffer(&bdr_local_node_name);
|
||||||
|
}
|
||||||
|
|
||||||
|
/* check whether repmgr extension exists, and there are no non-BDR nodes registered */
|
||||||
extension_status = get_repmgr_extension_status(conn);
|
extension_status = get_repmgr_extension_status(conn);
|
||||||
|
|
||||||
if (extension_status == REPMGR_UNKNOWN)
|
if (extension_status == REPMGR_UNKNOWN)
|
||||||
@@ -142,17 +175,10 @@ do_bdr_register(void)
|
|||||||
|
|
||||||
pfree(dbname);
|
pfree(dbname);
|
||||||
|
|
||||||
/* check for a matching BDR node */
|
if (bdr_node_has_repmgr_set(conn, config_file_options.node_name) == false)
|
||||||
{
|
{
|
||||||
bool node_exists = bdr_node_exists(conn, config_file_options.node_name);
|
log_debug("bdr_node_has_repmgr_set() = false");
|
||||||
|
bdr_node_set_repmgr_set(conn, config_file_options.node_name);
|
||||||
if (node_exists == false)
|
|
||||||
{
|
|
||||||
log_error(_("no BDR node with node_name \"%s\" found"), config_file_options.node_name);
|
|
||||||
log_hint(_("\"node_name\" in repmgr.conf must match \"node_name\" in bdr.bdr_nodes"));
|
|
||||||
PQfinish(conn);
|
|
||||||
exit(ERR_BAD_CONFIG);
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
|
|
||||||
/*
|
/*
|
||||||
@@ -165,7 +191,7 @@ do_bdr_register(void)
|
|||||||
{
|
{
|
||||||
NodeInfoList local_node_records = T_NODE_INFO_LIST_INITIALIZER;
|
NodeInfoList local_node_records = T_NODE_INFO_LIST_INITIALIZER;
|
||||||
|
|
||||||
get_all_node_records(conn, &local_node_records);
|
(void) get_all_node_records(conn, &local_node_records);
|
||||||
|
|
||||||
if (local_node_records.node_count == 0)
|
if (local_node_records.node_count == 0)
|
||||||
{
|
{
|
||||||
@@ -177,6 +203,7 @@ do_bdr_register(void)
|
|||||||
if (bdr_nodes.node_count == 0)
|
if (bdr_nodes.node_count == 0)
|
||||||
{
|
{
|
||||||
log_error(_("unable to retrieve any BDR node records"));
|
log_error(_("unable to retrieve any BDR node records"));
|
||||||
|
log_detail("%s", PQerrorMessage(conn));
|
||||||
PQfinish(conn);
|
PQfinish(conn);
|
||||||
exit(ERR_BAD_CONFIG);
|
exit(ERR_BAD_CONFIG);
|
||||||
}
|
}
|
||||||
@@ -212,7 +239,7 @@ do_bdr_register(void)
|
|||||||
continue;
|
continue;
|
||||||
}
|
}
|
||||||
|
|
||||||
get_all_node_records(bdr_node_conn, &existing_nodes);
|
(void) get_all_node_records(bdr_node_conn, &existing_nodes);
|
||||||
|
|
||||||
for (cell = existing_nodes.head; cell; cell = cell->next)
|
for (cell = existing_nodes.head; cell; cell = cell->next)
|
||||||
{
|
{
|
||||||
@@ -228,7 +255,35 @@ do_bdr_register(void)
|
|||||||
}
|
}
|
||||||
|
|
||||||
/* Add the repmgr extension tables to a replication set */
|
/* Add the repmgr extension tables to a replication set */
|
||||||
add_extension_tables_to_bdr_replication_set(conn);
|
|
||||||
|
if (get_bdr_version_num() < 3)
|
||||||
|
{
|
||||||
|
add_extension_tables_to_bdr_replication_set(conn);
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
/* this is the only table we need to replicate */
|
||||||
|
char *replication_set = get_default_bdr_replication_set(conn);
|
||||||
|
|
||||||
|
/*
|
||||||
|
* this probably won't happen, but we need to be sure we're using
|
||||||
|
* the replication set metadata correctly...
|
||||||
|
*/
|
||||||
|
if (conn == NULL)
|
||||||
|
{
|
||||||
|
log_error(_("unable to retrieve default BDR replication set"));
|
||||||
|
log_hint(_("see preceding messages"));
|
||||||
|
log_debug("check query in get_default_bdr_replication_set()");
|
||||||
|
exit(ERR_BAD_CONFIG);
|
||||||
|
}
|
||||||
|
|
||||||
|
if (is_table_in_bdr_replication_set(conn, "nodes", replication_set) == false)
|
||||||
|
{
|
||||||
|
add_table_to_bdr_replication_set(conn, "nodes", replication_set);
|
||||||
|
}
|
||||||
|
|
||||||
|
pfree(replication_set);
|
||||||
|
}
|
||||||
|
|
||||||
initPQExpBuffer(&event_details);
|
initPQExpBuffer(&event_details);
|
||||||
|
|
||||||
|
|||||||
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* repmgr-action-bdr.h
|
* repmgr-action-bdr.h
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
* Copyright (c) 2ndQuadrant, 2010-2018
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
|
|||||||
File diff suppressed because it is too large
Load Diff
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* repmgr-action-cluster.h
|
* repmgr-action-cluster.h
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2017
|
* Copyright (c) 2ndQuadrant, 2010-2018
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
|
|||||||
420
repmgr-action-daemon.c
Normal file
420
repmgr-action-daemon.c
Normal file
@@ -0,0 +1,420 @@
|
|||||||
|
/*
|
||||||
|
* repmgr-action-daemon.c
|
||||||
|
*
|
||||||
|
* Implements repmgrd actions for the repmgr command line utility
|
||||||
|
* Copyright (c) 2ndQuadrant, 2010-2018
|
||||||
|
*
|
||||||
|
* This program is free software: you can redistribute it and/or modify
|
||||||
|
* it under the terms of the GNU General Public License as published by
|
||||||
|
* the Free Software Foundation, either version 3 of the License, or
|
||||||
|
* (at your option) any later version.
|
||||||
|
*
|
||||||
|
* This program is distributed in the hope that it will be useful,
|
||||||
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
* GNU General Public License for more details.
|
||||||
|
*
|
||||||
|
* You should have received a copy of the GNU General Public License
|
||||||
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||||
|
*/
|
||||||
|
|
||||||
|
#include "repmgr.h"
|
||||||
|
|
||||||
|
#include "repmgr-client-global.h"
|
||||||
|
#include "repmgr-action-daemon.h"
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Possibly also show:
|
||||||
|
* - repmgrd start time?
|
||||||
|
* - repmgrd mode
|
||||||
|
* - priority
|
||||||
|
* - whether promotion candidate (due to zero priority/different location)
|
||||||
|
*/
|
||||||
|
|
||||||
|
typedef enum
|
||||||
|
{
|
||||||
|
STATUS_ID = 0,
|
||||||
|
STATUS_NAME,
|
||||||
|
STATUS_ROLE,
|
||||||
|
STATUS_PG,
|
||||||
|
STATUS_RUNNING,
|
||||||
|
STATUS_PID,
|
||||||
|
STATUS_PAUSED
|
||||||
|
} StatusHeader;
|
||||||
|
|
||||||
|
#define STATUS_HEADER_COUNT 7
|
||||||
|
|
||||||
|
struct ColHeader headers_status[STATUS_HEADER_COUNT];
|
||||||
|
|
||||||
|
static void fetch_node_records(PGconn *conn, NodeInfoList *node_list);
|
||||||
|
static void _do_repmgr_pause(bool pause);
|
||||||
|
|
||||||
|
|
||||||
|
void
|
||||||
|
do_daemon_status(void)
|
||||||
|
{
|
||||||
|
PGconn *conn = NULL;
|
||||||
|
NodeInfoList nodes = T_NODE_INFO_LIST_INITIALIZER;
|
||||||
|
NodeInfoListCell *cell = NULL;
|
||||||
|
int i;
|
||||||
|
RepmgrdInfo **repmgrd_info;
|
||||||
|
ItemList warnings = {NULL, NULL};
|
||||||
|
|
||||||
|
/* Connect to local database to obtain cluster connection data */
|
||||||
|
log_verbose(LOG_INFO, _("connecting to database"));
|
||||||
|
|
||||||
|
if (strlen(config_file_options.conninfo))
|
||||||
|
conn = establish_db_connection(config_file_options.conninfo, true);
|
||||||
|
else
|
||||||
|
conn = establish_db_connection_by_params(&source_conninfo, true);
|
||||||
|
|
||||||
|
fetch_node_records(conn, &nodes);
|
||||||
|
|
||||||
|
repmgrd_info = (RepmgrdInfo **) pg_malloc0(sizeof(RepmgrdInfo *) * nodes.node_count);
|
||||||
|
|
||||||
|
if (repmgrd_info == NULL)
|
||||||
|
{
|
||||||
|
log_error(_("unable to allocate memory"));
|
||||||
|
exit(ERR_OUT_OF_MEMORY);
|
||||||
|
}
|
||||||
|
|
||||||
|
strncpy(headers_status[STATUS_ID].title, _("ID"), MAXLEN);
|
||||||
|
strncpy(headers_status[STATUS_NAME].title, _("Name"), MAXLEN);
|
||||||
|
strncpy(headers_status[STATUS_ROLE].title, _("Role"), MAXLEN);
|
||||||
|
strncpy(headers_status[STATUS_PG].title, _("Status"), MAXLEN);
|
||||||
|
strncpy(headers_status[STATUS_RUNNING].title, _("repmgrd"), MAXLEN);
|
||||||
|
strncpy(headers_status[STATUS_PID].title, _("PID"), MAXLEN);
|
||||||
|
strncpy(headers_status[STATUS_PAUSED].title, _("Paused?"), MAXLEN);
|
||||||
|
|
||||||
|
for (i = 0; i < STATUS_HEADER_COUNT; i++)
|
||||||
|
{
|
||||||
|
headers_status[i].max_length = strlen(headers_status[i].title);
|
||||||
|
}
|
||||||
|
|
||||||
|
i = 0;
|
||||||
|
|
||||||
|
for (cell = nodes.head; cell; cell = cell->next)
|
||||||
|
{
|
||||||
|
int j;
|
||||||
|
|
||||||
|
repmgrd_info[i] = pg_malloc0(sizeof(RepmgrdInfo));
|
||||||
|
repmgrd_info[i]->node_id = cell->node_info->node_id;
|
||||||
|
repmgrd_info[i]->pid = UNKNOWN_PID;
|
||||||
|
repmgrd_info[i]->paused = false;
|
||||||
|
repmgrd_info[i]->running = false;
|
||||||
|
repmgrd_info[i]->pg_running = true;
|
||||||
|
|
||||||
|
cell->node_info->conn = establish_db_connection_quiet(cell->node_info->conninfo);
|
||||||
|
|
||||||
|
if (PQstatus(cell->node_info->conn) != CONNECTION_OK)
|
||||||
|
{
|
||||||
|
if (runtime_options.verbose)
|
||||||
|
{
|
||||||
|
char error[MAXLEN];
|
||||||
|
|
||||||
|
strncpy(error, PQerrorMessage(cell->node_info->conn), MAXLEN);
|
||||||
|
|
||||||
|
item_list_append_format(&warnings,
|
||||||
|
"when attempting to connect to node \"%s\" (ID: %i), following error encountered :\n\"%s\"",
|
||||||
|
cell->node_info->node_name, cell->node_info->node_id, trim(error));
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
item_list_append_format(&warnings,
|
||||||
|
"unable to connect to node \"%s\" (ID: %i)",
|
||||||
|
cell->node_info->node_name, cell->node_info->node_id);
|
||||||
|
}
|
||||||
|
|
||||||
|
repmgrd_info[i]->pg_running = false;
|
||||||
|
maxlen_snprintf(repmgrd_info[i]->pg_running_text, "%s", _("not running"));
|
||||||
|
maxlen_snprintf(repmgrd_info[i]->repmgrd_running, "%s", _("n/a"));
|
||||||
|
maxlen_snprintf(repmgrd_info[i]->pid_text, "%s", _("n/a"));
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
maxlen_snprintf(repmgrd_info[i]->pg_running_text, "%s", _("running"));
|
||||||
|
|
||||||
|
repmgrd_info[i]->pid = repmgrd_get_pid(cell->node_info->conn);
|
||||||
|
|
||||||
|
repmgrd_info[i]->running = repmgrd_is_running(cell->node_info->conn);
|
||||||
|
|
||||||
|
if (repmgrd_info[i]->running == true)
|
||||||
|
{
|
||||||
|
maxlen_snprintf(repmgrd_info[i]->repmgrd_running, "%s", _("running"));
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
maxlen_snprintf(repmgrd_info[i]->repmgrd_running, "%s", _("not running"));
|
||||||
|
}
|
||||||
|
|
||||||
|
if (repmgrd_info[i]->pid == UNKNOWN_PID)
|
||||||
|
{
|
||||||
|
maxlen_snprintf(repmgrd_info[i]->pid_text, "%s", _("n/a"));
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
maxlen_snprintf(repmgrd_info[i]->pid_text, "%i", repmgrd_info[i]->pid);
|
||||||
|
}
|
||||||
|
|
||||||
|
repmgrd_info[i]->paused = repmgrd_is_paused(cell->node_info->conn);
|
||||||
|
|
||||||
|
PQfinish(cell->node_info->conn);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
headers_status[STATUS_NAME].cur_length = strlen(cell->node_info->node_name);
|
||||||
|
headers_status[STATUS_ROLE].cur_length = strlen(get_node_type_string(cell->node_info->type));
|
||||||
|
headers_status[STATUS_PID].cur_length = strlen(repmgrd_info[i]->pid_text);
|
||||||
|
headers_status[STATUS_RUNNING].cur_length = strlen(repmgrd_info[i]->repmgrd_running);
|
||||||
|
headers_status[STATUS_PG].cur_length = strlen(repmgrd_info[i]->pg_running_text);
|
||||||
|
|
||||||
|
for (j = 0; j < STATUS_HEADER_COUNT; j++)
|
||||||
|
{
|
||||||
|
if (headers_status[j].cur_length > headers_status[j].max_length)
|
||||||
|
{
|
||||||
|
headers_status[j].max_length = headers_status[j].cur_length;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
i++;
|
||||||
|
}
|
||||||
|
|
||||||
|
/* Print column header row (text mode only) */
|
||||||
|
if (runtime_options.output_mode == OM_TEXT)
|
||||||
|
{
|
||||||
|
print_status_header(STATUS_HEADER_COUNT, headers_status);
|
||||||
|
}
|
||||||
|
|
||||||
|
i = 0;
|
||||||
|
|
||||||
|
for (cell = nodes.head; cell; cell = cell->next)
|
||||||
|
{
|
||||||
|
if (runtime_options.output_mode == OM_CSV)
|
||||||
|
{
|
||||||
|
printf("%i,%s,%s,%i,%i,%i,%i\n",
|
||||||
|
cell->node_info->node_id,
|
||||||
|
cell->node_info->node_name,
|
||||||
|
get_node_type_string(cell->node_info->type),
|
||||||
|
repmgrd_info[i]->pg_running ? 1 : 0,
|
||||||
|
repmgrd_info[i]->running ? 1 : 0,
|
||||||
|
repmgrd_info[i]->pid,
|
||||||
|
repmgrd_info[i]->paused ? 1 : 0);
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
printf(" %-*i ", headers_status[STATUS_ID].max_length, cell->node_info->node_id);
|
||||||
|
printf("| %-*s ", headers_status[STATUS_NAME].max_length, cell->node_info->node_name);
|
||||||
|
printf("| %-*s ", headers_status[STATUS_ROLE].max_length, get_node_type_string(cell->node_info->type));
|
||||||
|
|
||||||
|
printf("| %-*s ", headers_status[STATUS_PG].max_length, repmgrd_info[i]->pg_running_text);
|
||||||
|
printf("| %-*s ", headers_status[STATUS_RUNNING].max_length, repmgrd_info[i]->repmgrd_running);
|
||||||
|
printf("| %-*s ", headers_status[STATUS_PID].max_length, repmgrd_info[i]->pid_text);
|
||||||
|
|
||||||
|
if (repmgrd_info[i]->pid == UNKNOWN_PID)
|
||||||
|
printf("| %-*s ", headers_status[STATUS_PAUSED].max_length, "n/a");
|
||||||
|
else
|
||||||
|
printf("| %-*s ", headers_status[STATUS_PAUSED].max_length, repmgrd_info[i]->paused ? "yes" : "no");
|
||||||
|
|
||||||
|
printf("\n");
|
||||||
|
}
|
||||||
|
|
||||||
|
free(repmgrd_info[i]);
|
||||||
|
i++;
|
||||||
|
}
|
||||||
|
|
||||||
|
free(repmgrd_info);
|
||||||
|
|
||||||
|
/* emit any warnings */
|
||||||
|
|
||||||
|
if (warnings.head != NULL && runtime_options.terse == false && runtime_options.output_mode != OM_CSV)
|
||||||
|
{
|
||||||
|
ItemListCell *cell = NULL;
|
||||||
|
|
||||||
|
printf(_("\nWARNING: following issues were detected\n"));
|
||||||
|
for (cell = warnings.head; cell; cell = cell->next)
|
||||||
|
{
|
||||||
|
printf(_(" - %s\n"), cell->string);
|
||||||
|
}
|
||||||
|
|
||||||
|
if (runtime_options.verbose == false)
|
||||||
|
{
|
||||||
|
log_hint(_("execute with --verbose option to see connection error messages"));
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
void
|
||||||
|
do_daemon_pause(void)
|
||||||
|
{
|
||||||
|
_do_repmgr_pause(true);
|
||||||
|
}
|
||||||
|
|
||||||
|
void
|
||||||
|
do_daemon_unpause(void)
|
||||||
|
{
|
||||||
|
_do_repmgr_pause(false);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
static void
|
||||||
|
_do_repmgr_pause(bool pause)
|
||||||
|
{
|
||||||
|
PGconn *conn = NULL;
|
||||||
|
NodeInfoList nodes = T_NODE_INFO_LIST_INITIALIZER;
|
||||||
|
NodeInfoListCell *cell = NULL;
|
||||||
|
RepmgrdInfo **repmgrd_info;
|
||||||
|
int i;
|
||||||
|
int error_nodes = 0;
|
||||||
|
|
||||||
|
repmgrd_info = (RepmgrdInfo **) pg_malloc0(sizeof(RepmgrdInfo *) * nodes.node_count);
|
||||||
|
|
||||||
|
if (repmgrd_info == NULL)
|
||||||
|
{
|
||||||
|
log_error(_("unable to allocate memory"));
|
||||||
|
exit(ERR_OUT_OF_MEMORY);
|
||||||
|
}
|
||||||
|
|
||||||
|
/* Connect to local database to obtain cluster connection data */
|
||||||
|
log_verbose(LOG_INFO, _("connecting to database"));
|
||||||
|
|
||||||
|
if (strlen(config_file_options.conninfo))
|
||||||
|
conn = establish_db_connection(config_file_options.conninfo, true);
|
||||||
|
else
|
||||||
|
conn = establish_db_connection_by_params(&source_conninfo, true);
|
||||||
|
|
||||||
|
fetch_node_records(conn, &nodes);
|
||||||
|
|
||||||
|
i = 0;
|
||||||
|
|
||||||
|
for (cell = nodes.head; cell; cell = cell->next)
|
||||||
|
{
|
||||||
|
repmgrd_info[i] = pg_malloc0(sizeof(RepmgrdInfo));
|
||||||
|
repmgrd_info[i]->node_id = cell->node_info->node_id;
|
||||||
|
|
||||||
|
log_verbose(LOG_DEBUG, "pausing node %i (%s)",
|
||||||
|
cell->node_info->node_id,
|
||||||
|
cell->node_info->node_name);
|
||||||
|
cell->node_info->conn = establish_db_connection_quiet(cell->node_info->conninfo);
|
||||||
|
|
||||||
|
if (PQstatus(cell->node_info->conn) != CONNECTION_OK)
|
||||||
|
{
|
||||||
|
log_warning(_("unable to connect to node %i"),
|
||||||
|
cell->node_info->node_id);
|
||||||
|
error_nodes++;
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
if (runtime_options.dry_run == true)
|
||||||
|
{
|
||||||
|
if (pause == true)
|
||||||
|
{
|
||||||
|
log_info(_("would pause node %i (%s) "),
|
||||||
|
cell->node_info->node_id,
|
||||||
|
cell->node_info->node_name);
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
log_info(_("would unpause node %i (%s) "),
|
||||||
|
cell->node_info->node_id,
|
||||||
|
cell->node_info->node_name);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
bool success = repmgrd_pause(cell->node_info->conn, pause);
|
||||||
|
|
||||||
|
if (success == false)
|
||||||
|
error_nodes++;
|
||||||
|
|
||||||
|
log_notice(_("node %i (%s) %s"),
|
||||||
|
cell->node_info->node_id,
|
||||||
|
cell->node_info->node_name,
|
||||||
|
success == true
|
||||||
|
? pause == true ? "paused" : "unpaused"
|
||||||
|
: pause == true ? "not paused" : "not unpaused");
|
||||||
|
}
|
||||||
|
PQfinish(cell->node_info->conn);
|
||||||
|
}
|
||||||
|
i++;
|
||||||
|
}
|
||||||
|
|
||||||
|
if (error_nodes > 0)
|
||||||
|
{
|
||||||
|
if (pause == true)
|
||||||
|
{
|
||||||
|
log_error(_("unable to pause %i node(s)"), error_nodes);
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
log_error(_("unable to unpause %i node(s)"), error_nodes);
|
||||||
|
}
|
||||||
|
|
||||||
|
log_hint(_("execute \"repmgr daemon status\" to view current status"));
|
||||||
|
|
||||||
|
exit(ERR_REPMGRD_PAUSE);
|
||||||
|
}
|
||||||
|
|
||||||
|
exit(SUCCESS);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
void
|
||||||
|
fetch_node_records(PGconn *conn, NodeInfoList *node_list)
|
||||||
|
{
|
||||||
|
bool success = get_all_node_records(conn, node_list);
|
||||||
|
|
||||||
|
if (success == false)
|
||||||
|
{
|
||||||
|
/* get_all_node_records() will display any error message */
|
||||||
|
PQfinish(conn);
|
||||||
|
exit(ERR_BAD_CONFIG);
|
||||||
|
}
|
||||||
|
|
||||||
|
if (node_list->node_count == 0)
|
||||||
|
{
|
||||||
|
log_error(_("no node records were found"));
|
||||||
|
log_hint(_("ensure at least one node is registered"));
|
||||||
|
PQfinish(conn);
|
||||||
|
exit(ERR_BAD_CONFIG);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
void do_daemon_help(void)
|
||||||
|
{
|
||||||
|
print_help_header();
|
||||||
|
|
||||||
|
printf(_("Usage:\n"));
|
||||||
|
printf(_(" %s [OPTIONS] daemon status\n"), progname());
|
||||||
|
printf(_(" %s [OPTIONS] daemon pause\n"), progname());
|
||||||
|
printf(_(" %s [OPTIONS] daemon unpause\n"), progname());
|
||||||
|
puts("");
|
||||||
|
|
||||||
|
printf(_("DAEMON STATUS\n"));
|
||||||
|
puts("");
|
||||||
|
printf(_(" \"daemon status\" shows the status of repmgrd on each node in the cluster\n"));
|
||||||
|
puts("");
|
||||||
|
printf(_(" --csv emit output as CSV\n"));
|
||||||
|
printf(_(" --verbose show text of database connection error messages\n"));
|
||||||
|
puts("");
|
||||||
|
|
||||||
|
printf(_("DAEMON PAUSE\n"));
|
||||||
|
puts("");
|
||||||
|
printf(_(" \"daemon pause\" instructs repmgrd on each node to pause failover detection\n"));
|
||||||
|
puts("");
|
||||||
|
printf(_(" --dry-run check if nodes are reachable but don't pause repmgrd\n"));
|
||||||
|
puts("");
|
||||||
|
|
||||||
|
printf(_("DAEMON PAUSE\n"));
|
||||||
|
puts("");
|
||||||
|
printf(_(" \"daemon unpause\" instructs repmgrd on each node to resume failover detection\n"));
|
||||||
|
puts("");
|
||||||
|
printf(_(" --dry-run check if nodes are reachable but don't unpause repmgrd\n"));
|
||||||
|
puts("");
|
||||||
|
|
||||||
|
|
||||||
|
puts("");
|
||||||
|
}
|
||||||
28
repmgr-action-daemon.h
Normal file
28
repmgr-action-daemon.h
Normal file
@@ -0,0 +1,28 @@
|
|||||||
|
/*
|
||||||
|
* repmgr-action-daemon.h
|
||||||
|
* Copyright (c) 2ndQuadrant, 2010-2018
|
||||||
|
*
|
||||||
|
* This program is free software: you can redistribute it and/or modify
|
||||||
|
* it under the terms of the GNU General Public License as published by
|
||||||
|
* the Free Software Foundation, either version 3 of the License, or
|
||||||
|
* (at your option) any later version.
|
||||||
|
*
|
||||||
|
* This program is distributed in the hope that it will be useful,
|
||||||
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
* GNU General Public License for more details.
|
||||||
|
*
|
||||||
|
* You should have received a copy of the GNU General Public License
|
||||||
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||||
|
*/
|
||||||
|
|
||||||
|
#ifndef _REPMGR_ACTION_DAEMON_H_
|
||||||
|
#define _REPMGR_ACTION_DAEMON_H_
|
||||||
|
|
||||||
|
|
||||||
|
extern void do_daemon_status(void);
|
||||||
|
extern void do_daemon_pause(void);
|
||||||
|
extern void do_daemon_unpause(void);
|
||||||
|
|
||||||
|
extern void do_daemon_help(void);
|
||||||
|
#endif
|
||||||
2346
repmgr-action-node.c
2346
repmgr-action-node.c
File diff suppressed because it is too large
Load Diff
Some files were not shown because too many files have changed in this diff Show More
Reference in New Issue
Block a user