mirror of
https://github.com/EnterpriseDB/repmgr.git
synced 2026-03-23 15:16:29 +00:00
Compare commits
551 Commits
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
318f1dac40 | ||
|
|
bda4b0995c | ||
|
|
c14449f0a7 | ||
|
|
557e34b70c | ||
|
|
333083869b | ||
|
|
57fae00844 | ||
|
|
3de336f1c0 | ||
|
|
5493b57443 | ||
|
|
e53f1bf844 | ||
|
|
90638811c8 | ||
|
|
892e3b93d1 | ||
|
|
6f15a7e52e | ||
|
|
98998f73bf | ||
|
|
34ac2d8141 | ||
|
|
c820b61f28 | ||
|
|
9e620656c5 | ||
|
|
2fa277cc53 | ||
|
|
6a4f5944a1 | ||
|
|
c02a12a113 | ||
|
|
01b3933922 | ||
|
|
39b3b32814 | ||
|
|
846e0f73b2 | ||
|
|
7467525c8d | ||
|
|
b27a94ccbe | ||
|
|
2e69d155da | ||
|
|
870a367d3b | ||
|
|
9c28d3626b | ||
|
|
0916d8f2ad | ||
|
|
1964f890be | ||
|
|
976a61005e | ||
|
|
0c82278fd4 | ||
|
|
0abfde3773 | ||
|
|
1746831486 | ||
|
|
8c8e368a69 | ||
|
|
0ef532dcff | ||
|
|
478407fd86 | ||
|
|
05bfdfab2c | ||
|
|
29740dc41b | ||
|
|
ad6ecef2ab | ||
|
|
5318d37462 | ||
|
|
7244dda20f | ||
|
|
e651284927 | ||
|
|
72a2ac284a | ||
|
|
cec01c6620 | ||
|
|
989f683bc6 | ||
|
|
fa30382f2c | ||
|
|
defc2653e0 | ||
|
|
67e8ca73b5 | ||
|
|
a1a1d64e1f | ||
|
|
76509038cc | ||
|
|
7f8e50c882 | ||
|
|
5deb6c8ce4 | ||
|
|
175ee8acfc | ||
|
|
d1491f51a3 | ||
|
|
bc9febdc48 | ||
|
|
b6cf22ac90 | ||
|
|
d89a73cbf4 | ||
|
|
1f09e92e3f | ||
|
|
1bdc72a07b | ||
|
|
a6f1c6e483 | ||
|
|
6e14f0bc5d | ||
|
|
a336d22bd9 | ||
|
|
e88a8a9708 | ||
|
|
8f3f4eb4a3 | ||
|
|
dc18e5b791 | ||
|
|
9da0914976 | ||
|
|
666e71a589 | ||
|
|
062af91d36 | ||
|
|
571ad698db | ||
|
|
742f7e167f | ||
|
|
1fb2801639 | ||
|
|
e3031f0204 | ||
|
|
79748f28f1 | ||
|
|
46740b64a9 | ||
|
|
6557099832 | ||
|
|
083e288ac3 | ||
|
|
f5e3d7c041 | ||
|
|
402e02f4b7 | ||
|
|
a21b16f960 | ||
|
|
be58af701b | ||
|
|
eb2cdf8a98 | ||
|
|
7cc0400c03 | ||
|
|
9788b2bd29 | ||
|
|
227f0190f7 | ||
|
|
d6dbc70916 | ||
|
|
d2f4eda224 | ||
|
|
2588853e83 | ||
|
|
b54f98ed8a | ||
|
|
26f73686e5 | ||
|
|
e274a2cbcb | ||
|
|
d502bbe614 | ||
|
|
2594411820 | ||
|
|
d22535de00 | ||
|
|
fce1f0cd4a | ||
|
|
bb842c3989 | ||
|
|
556ff3c311 | ||
|
|
251486546d | ||
|
|
53d3e71cd3 | ||
|
|
b986ce81b2 | ||
|
|
7ddb060bdc | ||
|
|
6b02faf37c | ||
|
|
0cde0068dd | ||
|
|
20d66df0ef | ||
|
|
3f7c30b84d | ||
|
|
a63baf7fcb | ||
|
|
e19c643389 | ||
|
|
f058833451 | ||
|
|
96c14adfdb | ||
|
|
50119056a5 | ||
|
|
a279c42df9 | ||
|
|
f70b6ea136 | ||
|
|
e4cb6d7130 | ||
|
|
502c056753 | ||
|
|
871ec47ff5 | ||
|
|
f435abb3ec | ||
|
|
a217b4d0a9 | ||
|
|
2dcb75f889 | ||
|
|
b509ce6382 | ||
|
|
1150bf272a | ||
|
|
09ac6cd145 | ||
|
|
2fae788bc4 | ||
|
|
eb90f864c9 | ||
|
|
ba89758366 | ||
|
|
84595fe711 | ||
|
|
9523894808 | ||
|
|
df09af4d57 | ||
|
|
2c1cbc6bf9 | ||
|
|
ed22fe326e | ||
|
|
46500e1408 | ||
|
|
c3971513b6 | ||
|
|
a2910eded9 | ||
|
|
dc70e2d804 | ||
|
|
ea45158f50 | ||
|
|
84d1e16edd | ||
|
|
57815af3ac | ||
|
|
a4a2e48ab4 | ||
|
|
5189488b92 | ||
|
|
263128a740 | ||
|
|
f775750334 | ||
|
|
41ec45a4cc | ||
|
|
9b5b9acb82 | ||
|
|
77de5dbeeb | ||
|
|
465f1a73a5 | ||
|
|
c4f84bd777 | ||
|
|
da4dc26505 | ||
|
|
19670db1d4 | ||
|
|
b9f52e74eb | ||
|
|
fa10fd8493 | ||
|
|
b7f20ee1f7 | ||
|
|
bbb2e2f017 | ||
|
|
52328b8f33 | ||
|
|
65c2be3441 | ||
|
|
b17593ff4d | ||
|
|
7c1776655b | ||
|
|
789470b227 | ||
|
|
5d3c0d6163 | ||
|
|
44d4ca46b0 | ||
|
|
114c1bddcb | ||
|
|
5090b8cab1 | ||
|
|
5e338473f7 | ||
|
|
e043d5c9a9 | ||
|
|
03911488aa | ||
|
|
3e51a85e07 | ||
|
|
036c59526a | ||
|
|
2c55accbdd | ||
|
|
3ce231a571 | ||
|
|
178b380f34 | ||
|
|
4d36712901 | ||
|
|
7c3c30ae4a | ||
|
|
7e6491a6d6 | ||
|
|
ac8910000f | ||
|
|
cc3c2f5073 | ||
|
|
171df20386 | ||
|
|
2105837ef4 | ||
|
|
d12ecba63c | ||
|
|
5276cb279c | ||
|
|
719ad3cf95 | ||
|
|
e87399afc1 | ||
|
|
1d05345aa3 | ||
|
|
a8afa843ee | ||
|
|
5c4b477d84 | ||
|
|
f8fe801225 | ||
|
|
d7456d879d | ||
|
|
751469a08d | ||
|
|
afa5c1469b | ||
|
|
1778eeab9c | ||
|
|
95de5ef976 | ||
|
|
c0eea90402 | ||
|
|
135fa2e1b9 | ||
|
|
2a8861be8b | ||
|
|
a55c224510 | ||
|
|
844b9f54e4 | ||
|
|
8de84707d9 | ||
|
|
3ea61689eb | ||
|
|
efb106f8a0 | ||
|
|
5baec14a1e | ||
|
|
fe469fe188 | ||
|
|
5a7ce552f0 | ||
|
|
ef7bed1b3d | ||
|
|
6bd1c6a36d | ||
|
|
9831cabd4d | ||
|
|
d244fb29d7 | ||
|
|
4a349f7224 | ||
|
|
fb6109b3e6 | ||
|
|
b314f5aaf4 | ||
|
|
7fc340a8e2 | ||
|
|
e4c8bd981b | ||
|
|
a310417a49 | ||
|
|
9a07686ceb | ||
|
|
45aa0724c4 | ||
|
|
a558e9379e | ||
|
|
85f68e9f77 | ||
|
|
00e55c0672 | ||
|
|
84ab37c600 | ||
|
|
6a198401db | ||
|
|
cb78802027 | ||
|
|
48f637486d | ||
|
|
73280a426b | ||
|
|
b8ee321d5f | ||
|
|
ccdc0f9871 | ||
|
|
3bccd79510 | ||
|
|
a4ee10ca22 | ||
|
|
7ca9ff6d54 | ||
|
|
b660eb7988 | ||
|
|
6a4546a7b3 | ||
|
|
2f529e20c1 | ||
|
|
9853581d12 | ||
|
|
ecdae9671f | ||
|
|
1f3e937bbe | ||
|
|
89aeccedc2 | ||
|
|
d9bda915bb | ||
|
|
c565be4ab6 | ||
|
|
c26fd21351 | ||
|
|
6b57d0e680 | ||
|
|
6faf029c93 | ||
|
|
c42437a4f2 | ||
|
|
d0c05e6f46 | ||
|
|
050f007cc2 | ||
|
|
371d80ff35 | ||
|
|
e0a61afb7d | ||
|
|
bbc88ce05c | ||
|
|
61e907cf70 | ||
|
|
02668ee045 | ||
|
|
36eb26f86d | ||
|
|
cbc2c7b3e6 | ||
|
|
8a28dadde4 | ||
|
|
3eda7373ad | ||
|
|
34e574ac66 | ||
|
|
e8fcc3d7a6 | ||
|
|
eba0f1d7ae | ||
|
|
db32565b36 | ||
|
|
94befc3230 | ||
|
|
340899f082 | ||
|
|
76681c0850 | ||
|
|
eebaef59a3 | ||
|
|
ddaaa28449 | ||
|
|
e81bf869ec | ||
|
|
fa62d715c2 | ||
|
|
72af24e1d6 | ||
|
|
61d617ae93 | ||
|
|
319fba8b1f | ||
|
|
c92ea1d057 | ||
|
|
b2ca6fd35e | ||
|
|
c880187e89 | ||
|
|
4724da41ad | ||
|
|
d44885b330 | ||
|
|
72f9b0145a | ||
|
|
5e03ef40cb | ||
|
|
091541619d | ||
|
|
5e9db47d12 | ||
|
|
e8a0cd33b5 | ||
|
|
8cd79fd7dd | ||
|
|
013b4b4b8a | ||
|
|
c5a721a3cf | ||
|
|
a6294b7da0 | ||
|
|
a0f02e454c | ||
|
|
69d9d137e0 | ||
|
|
60bceae905 | ||
|
|
746c9793ed | ||
|
|
c30447ac90 | ||
|
|
097024a32f | ||
|
|
66b7dbbed7 | ||
|
|
74f6f97f26 | ||
|
|
968c2f1954 | ||
|
|
bd76d0eb92 | ||
|
|
f1ee6e19b6 | ||
|
|
fbb65b4a43 | ||
|
|
3fac975de6 | ||
|
|
a2b5ba595a | ||
|
|
c16ab3c889 | ||
|
|
dd5b6f9f12 | ||
|
|
303bb22ee1 | ||
|
|
5d8b1a3a31 | ||
|
|
3d6c349d88 | ||
|
|
1ade1acb22 | ||
|
|
66fd003ab4 | ||
|
|
0d42b771f5 | ||
|
|
005640be51 | ||
|
|
b6ebd34e2f | ||
|
|
951879f80d | ||
|
|
46ff9fb587 | ||
|
|
cc610f995d | ||
|
|
384618cb33 | ||
|
|
0dd617cfca | ||
|
|
f18d629bd2 | ||
|
|
afc904f876 | ||
|
|
3bcea46c3b | ||
|
|
d7e85f7565 | ||
|
|
b14d8ddb74 | ||
|
|
9b2a907b09 | ||
|
|
f63d42fe77 | ||
|
|
560066fa9d | ||
|
|
3937670d14 | ||
|
|
0daa7381b3 | ||
|
|
e53545af4f | ||
|
|
45178c19d8 | ||
|
|
cf46834041 | ||
|
|
c30609426a | ||
|
|
1c49c4159c | ||
|
|
b6b6439819 | ||
|
|
9a05999abb | ||
|
|
4c463a66b7 | ||
|
|
209de699ce | ||
|
|
e814c1120e | ||
|
|
247823db4d | ||
|
|
beda22d5f9 | ||
|
|
2eb00a3e6f | ||
|
|
0a798bf6e4 | ||
|
|
21b2ff1a1f | ||
|
|
57f9432692 | ||
|
|
54d3c7a4ca | ||
|
|
7fd44a3d74 | ||
|
|
b0f6b7bad7 | ||
|
|
4dbbf40196 | ||
|
|
d5e24689a4 | ||
|
|
10e47441a2 | ||
|
|
274a30efa5 | ||
|
|
db63b5bb1c | ||
|
|
e100728b93 | ||
|
|
d104f2a914 | ||
|
|
2946c097f0 | ||
|
|
a538ceb0ea | ||
|
|
5a2a8d1c82 | ||
|
|
b5a7efa58e | ||
|
|
9f6f58e4ed | ||
|
|
c22f4eaf6f | ||
|
|
925d82f7a4 | ||
|
|
1db577e294 | ||
|
|
a886fddccc | ||
|
|
83e5f98171 | ||
|
|
eb31a56186 | ||
|
|
8cd2c6fd05 | ||
|
|
e3e1c5de4e | ||
|
|
f9a150504a | ||
|
|
5bc809466c | ||
|
|
5d32026b79 | ||
|
|
2a8d6f72c6 | ||
|
|
190cc7dcb4 | ||
|
|
819937d4bd | ||
|
|
57299cb978 | ||
|
|
59f503835b | ||
|
|
33e626cd75 | ||
|
|
491ec37adf | ||
|
|
c93790fc96 | ||
|
|
ecabe2c294 | ||
|
|
2ba57e5938 | ||
|
|
2eec17e25f | ||
|
|
c48c248c15 | ||
|
|
958e45f2b8 | ||
|
|
daafd70383 | ||
|
|
c828598bfb | ||
|
|
b55519c4a2 | ||
|
|
4cafd443e1 | ||
|
|
d400d7f9ac | ||
|
|
62bb3db1f8 | ||
|
|
d9961bbb17 | ||
|
|
e1b8982c14 | ||
|
|
2fe3b3c2a3 | ||
|
|
c6e1bc205a | ||
|
|
7241391ddc | ||
|
|
c8f449f178 | ||
|
|
49420c437f | ||
|
|
827ffef5f9 | ||
|
|
16296bb1c3 | ||
|
|
c9c18d6216 | ||
|
|
d21f506614 | ||
|
|
fbad18085e | ||
|
|
ca08b1c3bb | ||
|
|
3d95fab0ac | ||
|
|
12d6ce4629 | ||
|
|
dfb34ae7b6 | ||
|
|
98c4eb002a | ||
|
|
faed8a65f7 | ||
|
|
a81cf04614 | ||
|
|
ca6cbcf965 | ||
|
|
16c1e13019 | ||
|
|
1375adcac8 | ||
|
|
e859a58405 | ||
|
|
1a6d830314 | ||
|
|
a96f478a43 | ||
|
|
8f20ab16dd | ||
|
|
3ec436f30d | ||
|
|
61e00bf1c7 | ||
|
|
5d71869fc1 | ||
|
|
7598e08b6f | ||
|
|
ba71e1eedf | ||
|
|
a4c07b23fb | ||
|
|
0c36f921f7 | ||
|
|
8ac5a5444e | ||
|
|
f60e7346e2 | ||
|
|
855ca8fe1a | ||
|
|
daa79d1a0f | ||
|
|
211768d911 | ||
|
|
f982708b35 | ||
|
|
995083d66c | ||
|
|
be58d6af96 | ||
|
|
a52e97e622 | ||
|
|
cc1ea00333 | ||
|
|
ec3596521f | ||
|
|
66245ccc03 | ||
|
|
c7542063be | ||
|
|
2633d994ef | ||
|
|
5359d45463 | ||
|
|
efa60d142c | ||
|
|
f3d0ab9ab9 | ||
|
|
7e6bac1be6 | ||
|
|
b72058dba8 | ||
|
|
79d1332f9c | ||
|
|
cde721e3fc | ||
|
|
7b2439b824 | ||
|
|
787cd94142 | ||
|
|
056e64f635 | ||
|
|
6b5a609d30 | ||
|
|
7a4d84379c | ||
|
|
490e12b1af | ||
|
|
7b9df3ac8f | ||
|
|
d6bf870316 | ||
|
|
b15e8debe1 | ||
|
|
310faf1bd9 | ||
|
|
35caeaa66a | ||
|
|
ba300c58f7 | ||
|
|
f2370de2fa | ||
|
|
3920deb803 | ||
|
|
e452bf6601 | ||
|
|
167b4efbb3 | ||
|
|
56b9ca7992 | ||
|
|
9c002c7e38 | ||
|
|
cfec04d19f | ||
|
|
4f1c67a1bf | ||
|
|
2f4fd2b7fa | ||
|
|
aca2b9547f | ||
|
|
c9db7f57d2 | ||
|
|
96ac39ba0f | ||
|
|
88a3378203 | ||
|
|
4db0efab47 | ||
|
|
864d57953a | ||
|
|
84d2a292b2 | ||
|
|
62d53b7622 | ||
|
|
77d52adb53 | ||
|
|
7a3e2f2a3a | ||
|
|
120688013e | ||
|
|
f6d1db5edb | ||
|
|
02729d299b | ||
|
|
88a6a1376e | ||
|
|
67df082ee9 | ||
|
|
9ed71d6317 | ||
|
|
933647d6de | ||
|
|
f99018b202 | ||
|
|
ced87373cd | ||
|
|
1db22546a9 | ||
|
|
7ae0df9c85 | ||
|
|
7a80f7a096 | ||
|
|
8710e067d0 | ||
|
|
793950eabd | ||
|
|
d1b4280182 | ||
|
|
64d038c823 | ||
|
|
46dd734b3d | ||
|
|
0a2e4466aa | ||
|
|
17ab86f7ac | ||
|
|
d433982af7 | ||
|
|
869b6a7a06 | ||
|
|
9018dc65de | ||
|
|
9cbd8df089 | ||
|
|
67a81d1d47 | ||
|
|
ab70007b75 | ||
|
|
0145aa0fc3 | ||
|
|
493c307b23 | ||
|
|
fc6225a511 | ||
|
|
e3111d37ba | ||
|
|
2a1a9f2e61 | ||
|
|
71a667ecb8 | ||
|
|
3ab91730c3 | ||
|
|
dd7f9b79ae | ||
|
|
8ab1901a93 | ||
|
|
e0cbdd5b31 | ||
|
|
d62aaeedd0 | ||
|
|
05cc7091b5 | ||
|
|
d192d5665c | ||
|
|
3848b9011b | ||
|
|
487aadc4b9 | ||
|
|
3f5920a395 | ||
|
|
617ea8cb78 | ||
|
|
142517fcca | ||
|
|
d722e2c74b | ||
|
|
abb02cab76 | ||
|
|
8e66e4811c | ||
|
|
ce5a541960 | ||
|
|
e12be52fa8 | ||
|
|
c0911d3286 | ||
|
|
6e94432282 | ||
|
|
29d9232e2f | ||
|
|
8973812144 | ||
|
|
e775a962ad | ||
|
|
12204f7e56 | ||
|
|
684f7590b7 | ||
|
|
9d589a780d | ||
|
|
83e6d15410 | ||
|
|
6a10fe0cd9 | ||
|
|
c664682c05 | ||
|
|
44acc8d719 | ||
|
|
b911483d5e | ||
|
|
ee9270fe8d | ||
|
|
d0a4eebeec | ||
|
|
0f5e71f029 | ||
|
|
dbd90d45f5 | ||
|
|
c8d0fb401f | ||
|
|
afda3419cc | ||
|
|
a86fa4ad4a | ||
|
|
7e3007f6e8 | ||
|
|
8c797a8fea | ||
|
|
56cec22f22 | ||
|
|
b61649a3e3 | ||
|
|
ded716e403 | ||
|
|
d639dc3342 | ||
|
|
17ed81ebb7 | ||
|
|
b00c507ee4 | ||
|
|
55d8b2ad9c | ||
|
|
c918aaad4a | ||
|
|
6e7eee4c01 | ||
|
|
5c59e8fc5b | ||
|
|
eba0b6bb1e | ||
|
|
3bc0b80a71 | ||
|
|
06b9e0a8ec | ||
|
|
120be2db1c | ||
|
|
12bd7da836 | ||
|
|
2fd905cf9e | ||
|
|
dd7ebdc1c7 | ||
|
|
1636805fa1 | ||
|
|
899d789699 | ||
|
|
cd7a3215df | ||
|
|
f8fd344d9f |
@@ -2,7 +2,7 @@ License and Contributions
|
|||||||
=========================
|
=========================
|
||||||
|
|
||||||
`repmgr` is licensed under the GPL v3. All of its code and documentation is
|
`repmgr` is licensed under the GPL v3. All of its code and documentation is
|
||||||
Copyright 2010-2015, 2ndQuadrant Limited. See the files COPYRIGHT and LICENSE for
|
Copyright 2010-2017, 2ndQuadrant Limited. See the files COPYRIGHT and LICENSE for
|
||||||
details.
|
details.
|
||||||
|
|
||||||
The development of repmgr has primarily been sponsored by 2ndQuadrant customers.
|
The development of repmgr has primarily been sponsored by 2ndQuadrant customers.
|
||||||
|
|||||||
@@ -1,4 +1,4 @@
|
|||||||
Copyright (c) 2010-2015, 2ndQuadrant Limited
|
Copyright (c) 2010-2017, 2ndQuadrant Limited
|
||||||
All rights reserved.
|
All rights reserved.
|
||||||
|
|
||||||
This program is free software: you can redistribute it and/or modify
|
This program is free software: you can redistribute it and/or modify
|
||||||
|
|||||||
239
FAILOVER.rst
239
FAILOVER.rst
@@ -1,238 +1 @@
|
|||||||
====================================================
|
The contents of this file have been incorporated into the main README.md document.
|
||||||
PostgreSQL Automatic Failover - User Documentation
|
|
||||||
====================================================
|
|
||||||
|
|
||||||
Automatic Failover
|
|
||||||
==================
|
|
||||||
|
|
||||||
repmgr allows for automatic failover when it detects the failure of the master node.
|
|
||||||
Following is a quick setup for this.
|
|
||||||
|
|
||||||
Installation
|
|
||||||
============
|
|
||||||
|
|
||||||
For convenience, we define:
|
|
||||||
|
|
||||||
**node1**
|
|
||||||
is the fully qualified domain name of the Master server, IP 192.168.1.10
|
|
||||||
**node2**
|
|
||||||
is the fully qualified domain name of the Standby server, IP 192.168.1.11
|
|
||||||
**witness**
|
|
||||||
is the fully qualified domain name of the server used as a witness, IP 192.168.1.12
|
|
||||||
|
|
||||||
**Note:** We don't recommend using names with the status of a server like «masterserver»,
|
|
||||||
because it would be confusing once a failover takes place and the Master is
|
|
||||||
now on the «standbyserver».
|
|
||||||
|
|
||||||
Summary
|
|
||||||
-------
|
|
||||||
|
|
||||||
2 PostgreSQL servers are involved in the replication. Automatic failover needs
|
|
||||||
a vote to decide what server it should promote, so an odd number is required.
|
|
||||||
A witness-repmgrd is installed in a third server where it uses a PostgreSQL
|
|
||||||
cluster to communicate with other repmgrd daemons.
|
|
||||||
|
|
||||||
1. Install PostgreSQL in all the servers involved (including the witness server)
|
|
||||||
|
|
||||||
2. Install repmgr in all the servers involved (including the witness server)
|
|
||||||
|
|
||||||
3. Configure the Master PostgreSQL
|
|
||||||
|
|
||||||
4. Clone the Master to the Standby using "repmgr standby clone" command
|
|
||||||
|
|
||||||
5. Configure repmgr in all the servers involved (including the witness server)
|
|
||||||
|
|
||||||
6. Register Master and Standby nodes
|
|
||||||
|
|
||||||
7. Initiate witness server
|
|
||||||
|
|
||||||
8. Start the repmgrd daemons in all nodes
|
|
||||||
|
|
||||||
**Note** A complete High-Availability design needs at least 3 servers to still have
|
|
||||||
a backup node after a first failure.
|
|
||||||
|
|
||||||
Install PostgreSQL
|
|
||||||
------------------
|
|
||||||
|
|
||||||
You can install PostgreSQL using any of the recommended methods. You should ensure
|
|
||||||
it's 9.0 or later.
|
|
||||||
|
|
||||||
Install repmgr
|
|
||||||
--------------
|
|
||||||
|
|
||||||
Install repmgr following the steps in the README file.
|
|
||||||
|
|
||||||
Configure PostgreSQL
|
|
||||||
--------------------
|
|
||||||
|
|
||||||
Log in to node1.
|
|
||||||
|
|
||||||
Edit the file postgresql.conf and modify the parameters::
|
|
||||||
|
|
||||||
listen_addresses='*'
|
|
||||||
wal_level = 'hot_standby'
|
|
||||||
archive_mode = on
|
|
||||||
archive_command = 'cd .' # we can also use exit 0, anything that
|
|
||||||
# just does nothing
|
|
||||||
max_wal_senders = 10
|
|
||||||
wal_keep_segments = 5000 # 80 GB required on pg_xlog
|
|
||||||
hot_standby = on
|
|
||||||
shared_preload_libraries = 'repmgr_funcs'
|
|
||||||
|
|
||||||
Edit the file pg_hba.conf and add lines for the replication::
|
|
||||||
|
|
||||||
host repmgr repmgr 127.0.0.1/32 trust
|
|
||||||
host repmgr repmgr 192.168.1.10/30 trust
|
|
||||||
host replication all 192.168.1.10/30 trust
|
|
||||||
|
|
||||||
**Note:** It is also possible to use a password authentication (md5), .pgpass file
|
|
||||||
should be edited to allow connection between each node.
|
|
||||||
|
|
||||||
Create the user and database to manage replication::
|
|
||||||
|
|
||||||
su - postgres
|
|
||||||
createuser -s repmgr
|
|
||||||
createdb -O repmgr repmgr
|
|
||||||
|
|
||||||
Restart the PostgreSQL server::
|
|
||||||
|
|
||||||
pg_ctl -D $PGDATA restart
|
|
||||||
|
|
||||||
And check everything is fine in the server log.
|
|
||||||
|
|
||||||
Create the ssh-key for the postgres user and copy it to other servers::
|
|
||||||
|
|
||||||
su - postgres
|
|
||||||
ssh-keygen # /!\ do not use a passphrase /!\
|
|
||||||
cat ~/.ssh/id_rsa.pub > ~/.ssh/authorized_keys
|
|
||||||
chmod 600 ~/.ssh/authorized_keys
|
|
||||||
exit
|
|
||||||
rsync -avz ~postgres/.ssh/authorized_keys node2:~postgres/.ssh/
|
|
||||||
rsync -avz ~postgres/.ssh/authorized_keys witness:~postgres/.ssh/
|
|
||||||
rsync -avz ~postgres/.ssh/id_rsa* node2:~postgres/.ssh/
|
|
||||||
rsync -avz ~postgres/.ssh/id_rsa* witness:~postgres/.ssh/
|
|
||||||
|
|
||||||
Clone Master
|
|
||||||
------------
|
|
||||||
|
|
||||||
Log in to node2.
|
|
||||||
|
|
||||||
Clone node1 (the current Master)::
|
|
||||||
|
|
||||||
su - postgres
|
|
||||||
repmgr -d repmgr -U repmgr -h node1 standby clone
|
|
||||||
|
|
||||||
Start the PostgreSQL server::
|
|
||||||
|
|
||||||
pg_ctl -D $PGDATA start
|
|
||||||
|
|
||||||
And check everything is fine in the server log.
|
|
||||||
|
|
||||||
Configure repmgr
|
|
||||||
----------------
|
|
||||||
|
|
||||||
Log in to each server and configure repmgr by editing the file
|
|
||||||
/etc/repmgr/repmgr.conf::
|
|
||||||
|
|
||||||
cluster=my_cluster
|
|
||||||
node=1
|
|
||||||
node_name=earth
|
|
||||||
conninfo='host=192.168.1.10 dbname=repmgr user=repmgr'
|
|
||||||
master_response_timeout=60
|
|
||||||
reconnect_attempts=6
|
|
||||||
reconnect_interval=10
|
|
||||||
failover=automatic
|
|
||||||
promote_command='promote_command.sh'
|
|
||||||
follow_command='repmgr standby follow -f /etc/repmgr/repmgr.conf'
|
|
||||||
|
|
||||||
**cluster**
|
|
||||||
is the name of the current replication.
|
|
||||||
**node**
|
|
||||||
is the number of the current node (1, 2 or 3 in the current example).
|
|
||||||
**node_name**
|
|
||||||
is an identifier for every node.
|
|
||||||
**conninfo**
|
|
||||||
is used to connect to the local PostgreSQL server (where the configuration file is) from any node. In the witness server configuration you need to add a 'port=5499' to the conninfo.
|
|
||||||
**master_response_timeout**
|
|
||||||
is the maximum amount of time we are going to wait before deciding the master has died and starting the failover procedure.
|
|
||||||
**reconnect_attempts**
|
|
||||||
is the number of times we will try to reconnect to master after a failure has been detected and before starting the failover procedure.
|
|
||||||
**reconnect_interval**
|
|
||||||
is the amount of time between retries to reconnect to master after a failure has been detected and before starting the failover procedure.
|
|
||||||
**failover**
|
|
||||||
configure behavior: *manual* or *automatic*.
|
|
||||||
**promote_command**
|
|
||||||
the command executed to do the failover (including the PostgreSQL failover itself). The command must return 0 on success.
|
|
||||||
**follow_command**
|
|
||||||
the command executed to address the current standby to another Master. The command must return 0 on success.
|
|
||||||
|
|
||||||
Register Master and Standby
|
|
||||||
---------------------------
|
|
||||||
|
|
||||||
Log in to node1.
|
|
||||||
|
|
||||||
Register the node as master::
|
|
||||||
|
|
||||||
su - postgres
|
|
||||||
repmgr -f /etc/repmgr/repmgr.conf master register
|
|
||||||
|
|
||||||
This will also create the repmgr schema and functions.
|
|
||||||
|
|
||||||
Log in to node2. Register it as a standby::
|
|
||||||
|
|
||||||
su - postgres
|
|
||||||
repmgr -f /etc/repmgr/repmgr.conf standby register
|
|
||||||
|
|
||||||
Initialize witness server
|
|
||||||
-------------------------
|
|
||||||
|
|
||||||
Log in to witness.
|
|
||||||
|
|
||||||
Initialize the witness server::
|
|
||||||
|
|
||||||
su - postgres
|
|
||||||
repmgr -d repmgr -U repmgr -h 192.168.1.10 -D $WITNESS_PGDATA -f /etc/repmgr/repmgr.conf witness create
|
|
||||||
|
|
||||||
The witness server needs the following information from the command
|
|
||||||
line:
|
|
||||||
|
|
||||||
* Connection details for the current master, to copy the cluster
|
|
||||||
configuration.
|
|
||||||
* A location for initializing its own $PGDATA.
|
|
||||||
|
|
||||||
repmgr will also ask for the superuser password on the witness database so
|
|
||||||
it can reconnect when needed (the command line option --initdb-no-pwprompt
|
|
||||||
will set up a password-less superuser).
|
|
||||||
|
|
||||||
By default the witness server will listen on port 5499; this value can be
|
|
||||||
overridden by explicitly providing the port number in the conninfo string
|
|
||||||
in repmgr.conf. (Note that it is also possible to specify the port number
|
|
||||||
with the -l/--local-port option, however this option is now deprecated and
|
|
||||||
will be overridden by a port setting in the conninfo string).
|
|
||||||
|
|
||||||
Start the repmgrd daemons
|
|
||||||
-------------------------
|
|
||||||
|
|
||||||
Log in to node2 and witness::
|
|
||||||
|
|
||||||
su - postgres
|
|
||||||
repmgrd -f /etc/repmgr/repmgr.conf --daemonize -> /var/log/postgresql/repmgr.log 2>&1
|
|
||||||
|
|
||||||
**Note:** The Master does not need a repmgrd daemon.
|
|
||||||
|
|
||||||
Suspend Automatic behavior
|
|
||||||
==========================
|
|
||||||
|
|
||||||
Edit the repmgr.conf of the node to remove from automatic processing and change::
|
|
||||||
|
|
||||||
failover=manual
|
|
||||||
|
|
||||||
Then, signal repmgrd daemon::
|
|
||||||
|
|
||||||
su - postgres
|
|
||||||
kill -HUP $(pidof repmgrd)
|
|
||||||
|
|
||||||
Usage
|
|
||||||
=====
|
|
||||||
|
|
||||||
The repmgr documentation is in the README file (how to build, options, etc.)
|
|
||||||
|
|||||||
30
FAQ.md
30
FAQ.md
@@ -38,7 +38,7 @@ General
|
|||||||
|
|
||||||
No. Hash indexes and replication do not mix well and their use is
|
No. Hash indexes and replication do not mix well and their use is
|
||||||
explicitly discouraged; see:
|
explicitly discouraged; see:
|
||||||
http://www.postgresql.org/docs/current/interactive/sql-createindex.html#AEN74175
|
https://www.postgresql.org/docs/current/interactive/sql-createindex.html#AEN74175
|
||||||
|
|
||||||
`repmgr`
|
`repmgr`
|
||||||
--------
|
--------
|
||||||
@@ -120,6 +120,23 @@ General
|
|||||||
permission is for PostgreSQL's streaming replication and doesn't
|
permission is for PostgreSQL's streaming replication and doesn't
|
||||||
necessarily need to be the `repmgr` user.
|
necessarily need to be the `repmgr` user.
|
||||||
|
|
||||||
|
- When cloning a standby, why do I need to provide the connection parameters
|
||||||
|
for the primary server on the command line, not in the configuration file?
|
||||||
|
|
||||||
|
Cloning a standby is a one-time action; the role of the server being cloned
|
||||||
|
from could change, so fixing it in the configuration file would create
|
||||||
|
confusion. If `repmgr` needs to establish a connection to the primary
|
||||||
|
server, it can retrieve this from the `repl_nodes` table or if necessary
|
||||||
|
scan the replication cluster until it locates the active primary.
|
||||||
|
|
||||||
|
- Why is there no foreign key on the `node_id` column in the `repl_events`
|
||||||
|
table?
|
||||||
|
|
||||||
|
Under some circumstances event notifications can be generated for servers
|
||||||
|
which have not yet been registered; it's also useful to retain a record
|
||||||
|
of events which includes servers removed from the replication cluster
|
||||||
|
which no longer have an entry in the `repl_nodes` table.
|
||||||
|
|
||||||
|
|
||||||
`repmgrd`
|
`repmgrd`
|
||||||
---------
|
---------
|
||||||
@@ -135,6 +152,9 @@ General
|
|||||||
|
|
||||||
In `repmgr.conf`, set its priority to a value of 0 or less.
|
In `repmgr.conf`, set its priority to a value of 0 or less.
|
||||||
|
|
||||||
|
Additionally, if `failover` is set to `manual`, the node will never
|
||||||
|
be considered as a promotion candidate.
|
||||||
|
|
||||||
- Does `repmgrd` support delayed standbys?
|
- Does `repmgrd` support delayed standbys?
|
||||||
|
|
||||||
`repmgrd` can monitor delayed standbys - those set up with
|
`repmgrd` can monitor delayed standbys - those set up with
|
||||||
@@ -153,3 +173,11 @@ General
|
|||||||
|
|
||||||
Configure your system's `logrotate` service to do this; see example
|
Configure your system's `logrotate` service to do this; see example
|
||||||
in README.md
|
in README.md
|
||||||
|
|
||||||
|
- I've recloned a failed master as a standby, but `repmgrd` refuses to start?
|
||||||
|
|
||||||
|
Check you registered the standby after recloning. If unregistered the standby
|
||||||
|
cannot be considered as a promotion candidate even if `failover` is set to
|
||||||
|
`automatic`, which is probably not what you want. `repmgrd` will start if
|
||||||
|
`failover` is set to `manual` so the node's replication status can still
|
||||||
|
be monitored, if desired.
|
||||||
|
|||||||
127
HISTORY
127
HISTORY
@@ -1,3 +1,130 @@
|
|||||||
|
3.3.2 2017-06-01
|
||||||
|
Add support for PostgreSQL 10 (Ian)
|
||||||
|
repmgr: ensure --replication-user option is honoured when passing database
|
||||||
|
connection parameters as a conninfo string (Ian)
|
||||||
|
repmgr: improve detection of pg_rewind on remote server (Ian)
|
||||||
|
repmgr: add DETAIL log output for additional clarification of error messages (Ian)
|
||||||
|
repmgr: suppress various spurious error messages in `standby follow` and
|
||||||
|
`standby switchover` (Ian)
|
||||||
|
repmgr: add missing `-P` option (Ian)
|
||||||
|
repmgrd: monitoring statistic reporting fixes (Ian)
|
||||||
|
|
||||||
|
3.3.1 2017-03-13
|
||||||
|
repmgrd: prevent invalid apply lag value being written to the
|
||||||
|
monitoring table (Ian)
|
||||||
|
repmgrd: fix error in XLogRecPtr conversion when calculating
|
||||||
|
monitoring statistics (Ian)
|
||||||
|
repmgr: if replication slots in use, where possible delete slot on old
|
||||||
|
upstream node after following new upstream (Ian)
|
||||||
|
repmgr: improve logging of rsync actions (Ian)
|
||||||
|
repmgr: improve `standby clone` when synchronous replication in use (Ian)
|
||||||
|
repmgr: stricter checking of allowed node id values
|
||||||
|
repmgr: enable `master register --force` when there is a foreign key
|
||||||
|
dependency from a standby node (Ian)
|
||||||
|
|
||||||
|
3.3 2016-12-27
|
||||||
|
repmgr: always log to STDERR even if log facility defined (Ian)
|
||||||
|
repmgr: add --log-to-file to log repmgr output to the defined
|
||||||
|
log facility (Ian)
|
||||||
|
repmgr: improve handling of command line parameter errors (Ian)
|
||||||
|
repmgr: add option --upstream-conninfo to explicitly set
|
||||||
|
'primary_conninfo' in recovery.conf (Ian)
|
||||||
|
repmgr: enable a standby to be registered which isn't running (Ian)
|
||||||
|
repmgr: enable `standby register --force` to update a node record
|
||||||
|
with cascaded downstream node records (Ian)
|
||||||
|
repmgr: add option `--no-conninfo-password` (Abhijit, Ian)
|
||||||
|
repmgr: add initial support for PostgreSQL 10.0 (Ian)
|
||||||
|
repmgr: escape values in primary_conninfo if needed (Ian)
|
||||||
|
|
||||||
|
3.2.1 2016-10-24
|
||||||
|
repmgr: require a valid repmgr cluster name unless -F/--force
|
||||||
|
supplied (Ian)
|
||||||
|
repmgr: check master server is registered with repmgr before
|
||||||
|
cloning (Ian)
|
||||||
|
repmgr: ensure data directory defaults to that of the source node (Ian)
|
||||||
|
repmgr: various fixes to Barman cloning mode (Gianni, Ian)
|
||||||
|
repmgr: fix `repmgr cluster crosscheck` output (Ian)
|
||||||
|
|
||||||
|
3.2 2016-10-05
|
||||||
|
repmgr: add support for cloning from a Barman backup (Gianni)
|
||||||
|
repmgr: add commands `standby matrix` and `standby crosscheck` (Gianni)
|
||||||
|
repmgr: suppress connection error display in `repmgr cluster show`
|
||||||
|
unless `--verbose` supplied (Ian)
|
||||||
|
repmgr: add commands `witness register` and `witness unregister` (Ian)
|
||||||
|
repmgr: enable `standby unregister` / `witness unregister` to be
|
||||||
|
executed for a node which is not running (Ian)
|
||||||
|
repmgr: remove deprecated command line options --initdb-no-pwprompt and
|
||||||
|
-l/--local-port (Ian)
|
||||||
|
repmgr: before cloning with pg_basebackup, check that sufficient free
|
||||||
|
walsenders are available (Ian)
|
||||||
|
repmgr: add option `--wait-sync` for `standby register` which causes
|
||||||
|
repmgr to wait for the registered node record to synchronise to
|
||||||
|
the standby (Ian)
|
||||||
|
repmgr: add option `--copy-external-config-files` for files outside
|
||||||
|
of the data directory (Ian)
|
||||||
|
repmgr: only require `wal_keep_segments` to be set in certain corner
|
||||||
|
cases (Ian)
|
||||||
|
repmgr: better support cloning from a node other than the one to
|
||||||
|
stream from (Ian)
|
||||||
|
repmgrd: add configuration options to override the default pg_ctl
|
||||||
|
commands (Jarkko Oranen, Ian)
|
||||||
|
repmgrd: don't start if node is inactive and failover=automatic (Ian)
|
||||||
|
packaging: improve "repmgr-auto" Debian package (Gianni)
|
||||||
|
|
||||||
|
|
||||||
|
3.1.5 2016-08-15
|
||||||
|
repmgrd: in a failover situation, prevent endless looping when
|
||||||
|
attempting to establish the status of a node with
|
||||||
|
`failover=manual` (Ian)
|
||||||
|
repmgrd: improve handling of failover events on standbys with
|
||||||
|
`failover=manual`, and create a new event notification
|
||||||
|
for this, `standby_disconnect_manual` (Ian)
|
||||||
|
repmgr: add further event notifications (Gianni)
|
||||||
|
repmgr: when executing `standby switchover`, don't collect remote
|
||||||
|
command output unless required (Gianni, Ian)
|
||||||
|
repmgrd: improve standby monitoring query (Ian, based on suggestion
|
||||||
|
from Álvaro)
|
||||||
|
repmgr: various command line handling improvements (Ian)
|
||||||
|
|
||||||
|
3.1.4 2016-07-12
|
||||||
|
repmgr: new configuration option for setting "restore_command"
|
||||||
|
in the recovery.conf file generated by repmgr (Martín)
|
||||||
|
repmgr: add --csv option to "repmgr cluster show" (Gianni)
|
||||||
|
repmgr: enable provision of a conninfo string as the -d/--dbname
|
||||||
|
parameter, similar to other PostgreSQL utilities (Ian)
|
||||||
|
repmgr: during switchover operations improve detection of
|
||||||
|
demotion candidate shutdown (Ian)
|
||||||
|
various bugfixes and documentation updates (Ian, Martín)
|
||||||
|
|
||||||
|
3.1.3 2016-05-17
|
||||||
|
repmgrd: enable monitoring when a standby is catching up by
|
||||||
|
replaying archived WAL (Ian)
|
||||||
|
repmgrd: when upstream_node_id is NULL, assume upstream node
|
||||||
|
to be current master (Ian)
|
||||||
|
repmgrd: check for reappearance of the master node if standby
|
||||||
|
promotion fails (Ian)
|
||||||
|
improve handling of rsync failure conditions (Martín)
|
||||||
|
|
||||||
|
3.1.2 2016-04-12
|
||||||
|
Fix pg_ctl path generation in do_standby_switchover() (Ian)
|
||||||
|
Regularly sync witness server repl_nodes table (Ian)
|
||||||
|
Documentation improvements (Gianni, dhyannataraj)
|
||||||
|
(Experimental) ensure repmgr handles failover slots when copying
|
||||||
|
in rsync mode (Craig, Ian)
|
||||||
|
rsync mode handling fixes (Martín)
|
||||||
|
Enable repmgr to compile against 9.6devel (Ian)
|
||||||
|
|
||||||
|
3.1.1 2016-02-24
|
||||||
|
Add '-P/--pwprompt' option for "repmgr create witness" (Ian)
|
||||||
|
Prevent repmgr/repmgrd running as root (Ian)
|
||||||
|
|
||||||
|
3.1.0 2016-02-01
|
||||||
|
Add "repmgr standby switchover" command (Ian)
|
||||||
|
Revised README file (Ian)
|
||||||
|
Remove requirement for 'archive_mode' to be enabled (Ian)
|
||||||
|
Improve -?/--help output, showing default values if relevant (Ian)
|
||||||
|
Various bugfixes to command line/configuration parameter handling (Ian)
|
||||||
|
|
||||||
3.0.3 2016-01-04
|
3.0.3 2016-01-04
|
||||||
Create replication slot if required before base backup is run (Abhijit)
|
Create replication slot if required before base backup is run (Abhijit)
|
||||||
standby clone: when using rsync, clean up "pg_replslot" directory (Ian)
|
standby clone: when using rsync, clean up "pg_replslot" directory (Ian)
|
||||||
|
|||||||
59
Makefile
59
Makefile
@@ -1,24 +1,34 @@
|
|||||||
#
|
#
|
||||||
# Makefile
|
# Makefile
|
||||||
# Copyright (c) 2ndQuadrant, 2010-2015
|
# Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
|
|
||||||
|
HEADERS = $(wildcard *.h)
|
||||||
|
|
||||||
repmgrd_OBJS = dbutils.o config.o repmgrd.o log.o strutil.o
|
repmgrd_OBJS = dbutils.o config.o repmgrd.o log.o strutil.o
|
||||||
repmgr_OBJS = dbutils.o check_dir.o config.o repmgr.o log.o strutil.o
|
repmgr_OBJS = dbutils.o check_dir.o config.o repmgr.o log.o strutil.o dirmod.o compat.o
|
||||||
|
|
||||||
DATA = repmgr.sql uninstall_repmgr.sql
|
DATA = repmgr.sql uninstall_repmgr.sql
|
||||||
|
REGRESS = repmgr_funcs repmgr_test
|
||||||
|
|
||||||
PG_CPPFLAGS = -I$(libpq_srcdir)
|
PG_CPPFLAGS = -I$(includedir_internal) -I$(libpq_srcdir)
|
||||||
PG_LIBS = $(libpq_pgport)
|
PG_LIBS = $(libpq_pgport)
|
||||||
|
|
||||||
all: repmgrd repmgr
|
|
||||||
|
all: repmgrd repmgr
|
||||||
$(MAKE) -C sql
|
$(MAKE) -C sql
|
||||||
|
|
||||||
repmgrd: $(repmgrd_OBJS)
|
repmgrd: $(repmgrd_OBJS)
|
||||||
$(CC) $(CFLAGS) $(repmgrd_OBJS) $(PG_LIBS) $(LDFLAGS) $(LDFLAGS_EX) $(LIBS) -o repmgrd
|
$(CC) -o repmgrd $(CFLAGS) $(repmgrd_OBJS) $(PG_LIBS) $(LDFLAGS) $(LDFLAGS_EX)
|
||||||
$(MAKE) -C sql
|
$(MAKE) -C sql
|
||||||
|
|
||||||
repmgr: $(repmgr_OBJS)
|
repmgr: $(repmgr_OBJS)
|
||||||
$(CC) $(CFLAGS) $(repmgr_OBJS) $(PG_LIBS) $(LDFLAGS) $(LDFLAGS_EX) $(LIBS) -o repmgr
|
$(CC) -o repmgr $(CFLAGS) $(repmgr_OBJS) $(PG_LIBS) $(LDFLAGS) $(LDFLAGS_EX)
|
||||||
|
|
||||||
|
# Make all objects depend on all include files. This is a bit of a
|
||||||
|
# shotgun approach, but the codebase is small enough that a complete rebuild
|
||||||
|
# is very fast anyway.
|
||||||
|
$(repmgr_OBJS): $(HEADERS)
|
||||||
|
$(repmgrd_OBJS): $(HEADERS)
|
||||||
|
|
||||||
ifdef USE_PGXS
|
ifdef USE_PGXS
|
||||||
PG_CONFIG = pg_config
|
PG_CONFIG = pg_config
|
||||||
@@ -31,8 +41,8 @@ include $(top_builddir)/src/Makefile.global
|
|||||||
include $(top_srcdir)/contrib/contrib-global.mk
|
include $(top_srcdir)/contrib/contrib-global.mk
|
||||||
endif
|
endif
|
||||||
|
|
||||||
# XXX: Try to use PROGRAM construct (see pgxs.mk) someday. Right now
|
# XXX: This overrides the pgxs install target - we're building two binaries,
|
||||||
# is overriding pgxs install.
|
# which is not supported by pgxs.mk's PROGRAM construct.
|
||||||
install: install_prog install_ext
|
install: install_prog install_ext
|
||||||
|
|
||||||
install_prog:
|
install_prog:
|
||||||
@@ -43,6 +53,12 @@ install_prog:
|
|||||||
install_ext:
|
install_ext:
|
||||||
$(MAKE) -C sql install
|
$(MAKE) -C sql install
|
||||||
|
|
||||||
|
# Distribution-specific package building targets
|
||||||
|
# ----------------------------------------------
|
||||||
|
#
|
||||||
|
# XXX we recommend using the PGDG-supplied packages where possible;
|
||||||
|
# see README.md for details.
|
||||||
|
|
||||||
install_rhel:
|
install_rhel:
|
||||||
mkdir -p '$(DESTDIR)/etc/init.d/'
|
mkdir -p '$(DESTDIR)/etc/init.d/'
|
||||||
$(INSTALL_PROGRAM) RHEL/repmgrd.init '$(DESTDIR)/etc/init.d/repmgrd'
|
$(INSTALL_PROGRAM) RHEL/repmgrd.init '$(DESTDIR)/etc/init.d/repmgrd'
|
||||||
@@ -67,16 +83,23 @@ clean:
|
|||||||
rm -f repmgr
|
rm -f repmgr
|
||||||
$(MAKE) -C sql clean
|
$(MAKE) -C sql clean
|
||||||
|
|
||||||
|
# Get correct version numbers and install paths, depending on your postgres version
|
||||||
|
PG_VERSION = $(shell pg_config --version | cut -d ' ' -f 2 | cut -d '.' -f 1,2)
|
||||||
|
REPMGR_VERSION = $(shell grep REPMGR_VERSION version.h | cut -d ' ' -f 3 | cut -d '"' -f 2)
|
||||||
|
PKGLIBDIR = $(shell pg_config --pkglibdir)
|
||||||
|
SHAREDIR = $(shell pg_config --sharedir)
|
||||||
|
PGBINDIR = /usr/lib/postgresql/$(PG_VERSION)/bin
|
||||||
|
|
||||||
deb: repmgrd repmgr
|
deb: repmgrd repmgr
|
||||||
mkdir -p ./debian/usr/bin
|
mkdir -p ./debian/usr/bin ./debian$(PGBINDIR)
|
||||||
cp repmgrd repmgr ./debian/usr/bin/
|
cp repmgrd repmgr ./debian$(PGBINDIR)
|
||||||
mkdir -p ./debian/usr/share/postgresql/9.0/contrib/
|
ln -s ../..$(PGBINDIR)/repmgr ./debian/usr/bin/repmgr
|
||||||
cp sql/repmgr_funcs.sql ./debian/usr/share/postgresql/9.0/contrib/
|
mkdir -p ./debian$(SHAREDIR)/contrib/
|
||||||
cp sql/uninstall_repmgr_funcs.sql ./debian/usr/share/postgresql/9.0/contrib/
|
cp sql/repmgr_funcs.sql ./debian$(SHAREDIR)/contrib/
|
||||||
mkdir -p ./debian/usr/lib/postgresql/9.0/lib/
|
cp sql/uninstall_repmgr_funcs.sql ./debian$(SHAREDIR)/contrib/
|
||||||
cp sql/repmgr_funcs.so ./debian/usr/lib/postgresql/9.0/lib/
|
mkdir -p ./debian$(PKGLIBDIR)/
|
||||||
|
cp sql/repmgr_funcs.so ./debian$(PKGLIBDIR)/
|
||||||
dpkg-deb --build debian
|
dpkg-deb --build debian
|
||||||
mv debian.deb ../postgresql-repmgr-9.0_1.0.0.deb
|
mv debian.deb ../postgresql-repmgr-$(PG_VERSION)_$(REPMGR_VERSION).deb
|
||||||
rm -rf ./debian/usr
|
rm -rf ./debian/usr
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
119
QUICKSTART.md
119
QUICKSTART.md
@@ -1,118 +1 @@
|
|||||||
repmgr quickstart guide
|
The contents of this file have been incorporated into the main README.md document.
|
||||||
=======================
|
|
||||||
|
|
||||||
This quickstart guide provides some annotated examples on basic
|
|
||||||
`repmgr` setup. It assumes you are familiar with PostgreSQL replication
|
|
||||||
concepts setup and Linux/UNIX system administration.
|
|
||||||
|
|
||||||
For the purposes of this guide, we'll assume the database user will be
|
|
||||||
`repmgr_usr` and the database will be `repmgr_db`.
|
|
||||||
|
|
||||||
|
|
||||||
Master setup
|
|
||||||
------------
|
|
||||||
|
|
||||||
1. Configure PostgreSQL
|
|
||||||
|
|
||||||
- create user and database:
|
|
||||||
|
|
||||||
```
|
|
||||||
CREATE ROLE repmgr_usr LOGIN SUPERUSER;
|
|
||||||
CREATE DATABASE repmgr_db OWNER repmgr_usr;
|
|
||||||
```
|
|
||||||
|
|
||||||
- configure `postgresql.conf` for replication (see README.md for sample
|
|
||||||
settings)
|
|
||||||
|
|
||||||
- update `pg_hba.conf`, e.g.:
|
|
||||||
|
|
||||||
```
|
|
||||||
host repmgr_db repmgr_usr 192.168.1.0/24 trust
|
|
||||||
host replication repmgr_usr 192.168.1.0/24 trust
|
|
||||||
```
|
|
||||||
|
|
||||||
Restart the PostgreSQL server after making these changes.
|
|
||||||
|
|
||||||
2. Create the `repmgr` configuration file:
|
|
||||||
|
|
||||||
$ cat /path/to/repmgr/node1/repmgr.conf
|
|
||||||
cluster=test
|
|
||||||
node=1
|
|
||||||
node_name=node1
|
|
||||||
conninfo='host=repmgr_node1 user=repmgr_usr dbname=repmgr_db'
|
|
||||||
pg_bindir=/path/to/postgres/bin
|
|
||||||
|
|
||||||
(For an annotated `repmgr.conf` file, see `repmgr.conf.sample` in the
|
|
||||||
repository's root directory).
|
|
||||||
|
|
||||||
3. Register the master node with `repmgr`:
|
|
||||||
|
|
||||||
$ repmgr -f /path/to/repmgr/node1/repmgr.conf --verbose master register
|
|
||||||
[2015-03-03 17:45:53] [INFO] repmgr connecting to master database
|
|
||||||
[2015-03-03 17:45:53] [INFO] repmgr connected to master, checking its state
|
|
||||||
[2015-03-03 17:45:53] [INFO] master register: creating database objects inside the repmgr_test schema
|
|
||||||
[2015-03-03 17:45:53] [NOTICE] Master node correctly registered for cluster test with id 1 (conninfo: host=localhost user=repmgr_usr dbname=repmgr_db)
|
|
||||||
|
|
||||||
Standby setup
|
|
||||||
-------------
|
|
||||||
|
|
||||||
1. Use `repmgr standby clone` to clone a standby from the master:
|
|
||||||
|
|
||||||
repmgr -D /path/to/standby/data -d repmgr_db -U repmgr_usr --verbose standby clone 192.168.1.2
|
|
||||||
[2015-03-03 18:18:21] [NOTICE] No configuration file provided and default file './repmgr.conf' not found - continuing with default values
|
|
||||||
[2015-03-03 18:18:21] [NOTICE] repmgr Destination directory ' /path/to/standby/data' provided
|
|
||||||
[2015-03-03 18:18:21] [INFO] repmgr connecting to upstream node
|
|
||||||
[2015-03-03 18:18:21] [INFO] repmgr connected to upstream node, checking its state
|
|
||||||
[2015-03-03 18:18:21] [INFO] Successfully connected to upstream node. Current installation size is 27 MB
|
|
||||||
[2015-03-03 18:18:21] [NOTICE] Starting backup...
|
|
||||||
[2015-03-03 18:18:21] [INFO] creating directory " /path/to/standby/data"...
|
|
||||||
[2015-03-03 18:18:21] [INFO] Executing: 'pg_basebackup -l "repmgr base backup" -h localhost -p 9595 -U repmgr_usr -D /path/to/standby/data '
|
|
||||||
NOTICE: pg_stop_backup complete, all required WAL segments have been archived
|
|
||||||
[2015-03-03 18:18:23] [NOTICE] repmgr standby clone (using pg_basebackup) complete
|
|
||||||
[2015-03-03 18:18:23] [NOTICE] HINT: You can now start your postgresql server
|
|
||||||
[2015-03-03 18:18:23] [NOTICE] for example : pg_ctl -D /path/to/standby/data start
|
|
||||||
|
|
||||||
Note that the `repmgr.conf` file is not required when cloning a standby.
|
|
||||||
However we recommend providing a valid `repmgr.conf` if you wish to use
|
|
||||||
replication slots, or want `repmgr` to log the clone event to the
|
|
||||||
`repl_events` table.
|
|
||||||
|
|
||||||
This will clone the PostgreSQL database files from the master, including its
|
|
||||||
`postgresql.conf` and `pg_hba.conf` files, and additionally automatically create
|
|
||||||
the `recovery.conf` file containing the correct parameters to start streaming
|
|
||||||
from the primary node.
|
|
||||||
|
|
||||||
2. Start the PostgreSQL server
|
|
||||||
|
|
||||||
3. Create the `repmgr` configuration file:
|
|
||||||
|
|
||||||
$ cat /path/node2/repmgr/repmgr.conf
|
|
||||||
cluster=test
|
|
||||||
node=2
|
|
||||||
node_name=node2
|
|
||||||
conninfo='host=repmgr_node2 user=repmgr_usr dbname=repmgr_db'
|
|
||||||
pg_bindir=/path/to/postgres/bin
|
|
||||||
|
|
||||||
4. Register the standby node with `repmgr`:
|
|
||||||
|
|
||||||
$ repmgr -f /path/to/repmgr/node2/repmgr.conf --verbose standby register
|
|
||||||
[2015-03-03 18:24:34] [NOTICE] Opening configuration file: /path/to/repmgr/node2/repmgr.conf
|
|
||||||
[2015-03-03 18:24:34] [INFO] repmgr connecting to standby database
|
|
||||||
[2015-03-03 18:24:34] [INFO] repmgr connecting to master database
|
|
||||||
[2015-03-03 18:24:34] [INFO] finding node list for cluster 'test'
|
|
||||||
[2015-03-03 18:24:34] [INFO] checking role of cluster node '1'
|
|
||||||
[2015-03-03 18:24:34] [INFO] repmgr connected to master, checking its state
|
|
||||||
[2015-03-03 18:24:34] [INFO] repmgr registering the standby
|
|
||||||
[2015-03-03 18:24:34] [INFO] repmgr registering the standby complete
|
|
||||||
[2015-03-03 18:24:34] [NOTICE] Standby node correctly registered for cluster test with id 2 (conninfo: host=localhost user=repmgr_usr dbname=repmgr_db)
|
|
||||||
|
|
||||||
|
|
||||||
This concludes the basic `repmgr` setup of master and standby. The records
|
|
||||||
created in the `repl_nodes` table should look something like this:
|
|
||||||
|
|
||||||
repmgr_db=# SELECT * from repmgr_test.repl_nodes;
|
|
||||||
id | type | upstream_node_id | cluster | name | conninfo | slot_name | priority | active
|
|
||||||
----+---------+------------------+---------+-------+----------------------------------------------------+-----------+----------+--------
|
|
||||||
1 | primary | | test | node1 | host=repmgr_node1 user=repmgr_usr dbname=repmgr_db | | 0 | t
|
|
||||||
2 | standby | 1 | test | node2 | host=repmgr_node2 user=repmgr_usr dbname=repmgr_db | | 0 | t
|
|
||||||
(2 rows)
|
|
||||||
|
|||||||
@@ -1,61 +0,0 @@
|
|||||||
Summary: repmgr
|
|
||||||
Name: repmgr
|
|
||||||
Version: 3.0
|
|
||||||
Release: 1
|
|
||||||
License: GPLv3
|
|
||||||
Group: System Environment/Daemons
|
|
||||||
URL: http://repmgr.org
|
|
||||||
Packager: Ian Barwick <ian@2ndquadrant.com>
|
|
||||||
Vendor: 2ndQuadrant Limited
|
|
||||||
Distribution: centos
|
|
||||||
Source0: %{name}-%{version}.tar.gz
|
|
||||||
BuildRoot: %{_tmppath}/%{name}-%{version}-%{release}-root
|
|
||||||
|
|
||||||
%description
|
|
||||||
repmgr is a utility suite which greatly simplifies
|
|
||||||
the process of setting up and managing replication
|
|
||||||
using streaming replication within a cluster of
|
|
||||||
PostgreSQL servers.
|
|
||||||
|
|
||||||
%prep
|
|
||||||
%setup
|
|
||||||
|
|
||||||
%build
|
|
||||||
export PATH=$PATH:/usr/pgsql-9.3/bin/
|
|
||||||
%{__make} USE_PGXS=1
|
|
||||||
|
|
||||||
%install
|
|
||||||
[ "%{buildroot}" != "/" ] && %{__rm} -rf %{buildroot}
|
|
||||||
|
|
||||||
export PATH=$PATH:/usr/pgsql-9.3/bin/
|
|
||||||
%{__make} USE_PGXS=1 install DESTDIR=%{buildroot} INSTALL="install -p"
|
|
||||||
%{__make} USE_PGXS=1 install_prog DESTDIR=%{buildroot} INSTALL="install -p"
|
|
||||||
%{__make} USE_PGXS=1 install_rhel DESTDIR=%{buildroot} INSTALL="install -p"
|
|
||||||
|
|
||||||
|
|
||||||
%clean
|
|
||||||
[ "%{buildroot}" != "/" ] && %{__rm} -rf %{buildroot}
|
|
||||||
|
|
||||||
|
|
||||||
%files
|
|
||||||
%defattr(-,root,root)
|
|
||||||
/usr/bin/repmgr
|
|
||||||
/usr/bin/repmgrd
|
|
||||||
/usr/pgsql-9.3/bin/repmgr
|
|
||||||
/usr/pgsql-9.3/bin/repmgrd
|
|
||||||
/usr/pgsql-9.3/lib/repmgr_funcs.so
|
|
||||||
/usr/pgsql-9.3/share/contrib/repmgr.sql
|
|
||||||
/usr/pgsql-9.3/share/contrib/repmgr_funcs.sql
|
|
||||||
/usr/pgsql-9.3/share/contrib/uninstall_repmgr.sql
|
|
||||||
/usr/pgsql-9.3/share/contrib/uninstall_repmgr_funcs.sql
|
|
||||||
%attr(0755,root,root)/etc/init.d/repmgrd
|
|
||||||
%attr(0644,root,root)/etc/sysconfig/repmgrd
|
|
||||||
%attr(0644,root,root)/etc/repmgr/repmgr.conf.sample
|
|
||||||
|
|
||||||
%changelog
|
|
||||||
* Tue Mar 10 2015 Ian Barwick <ian@2ndquadrant.com>
|
|
||||||
- build for repmgr 3.0
|
|
||||||
* Thu Jun 05 2014 Nathan Van Overloop <nathan.van.overloop@nexperteam.be> 2.0.2
|
|
||||||
- fix witness creation to create db and user if needed
|
|
||||||
* Fri Apr 04 2014 Nathan Van Overloop <nathan.van.overloop@nexperteam.be> 2.0.1
|
|
||||||
- initial build for RHEL6
|
|
||||||
@@ -1,133 +0,0 @@
|
|||||||
#!/bin/sh
|
|
||||||
#
|
|
||||||
# chkconfig: - 75 16
|
|
||||||
# description: Enable repmgrd replication management and monitoring daemon for PostgreSQL
|
|
||||||
# processname: repmgrd
|
|
||||||
# pidfile="/var/run/${NAME}.pid"
|
|
||||||
|
|
||||||
# Source function library.
|
|
||||||
INITD=/etc/rc.d/init.d
|
|
||||||
. $INITD/functions
|
|
||||||
|
|
||||||
# Get function listing for cross-distribution logic.
|
|
||||||
TYPESET=`typeset -f|grep "declare"`
|
|
||||||
|
|
||||||
# Get network config.
|
|
||||||
. /etc/sysconfig/network
|
|
||||||
|
|
||||||
DESC="PostgreSQL replication management and monitoring daemon"
|
|
||||||
NAME=repmgrd
|
|
||||||
|
|
||||||
REPMGRD_ENABLED=no
|
|
||||||
REPMGRD_OPTS=
|
|
||||||
REPMGRD_USER=postgres
|
|
||||||
REPMGRD_BIN=/usr/pgsql-9.3/bin/repmgrd
|
|
||||||
REPMGRD_PIDFILE=/var/run/repmgrd.pid
|
|
||||||
REPMGRD_LOCK=/var/lock/subsys/${NAME}
|
|
||||||
REPMGRD_LOG=/var/lib/pgsql/9.3/data/pg_log/repmgrd.log
|
|
||||||
|
|
||||||
# Read configuration variable file if it is present
|
|
||||||
[ -r /etc/sysconfig/$NAME ] && . /etc/sysconfig/$NAME
|
|
||||||
|
|
||||||
# For SELinux we need to use 'runuser' not 'su'
|
|
||||||
if [ -x /sbin/runuser ]
|
|
||||||
then
|
|
||||||
SU=runuser
|
|
||||||
else
|
|
||||||
SU=su
|
|
||||||
fi
|
|
||||||
|
|
||||||
test -x $REPMGRD_BIN || exit 0
|
|
||||||
|
|
||||||
case "$REPMGRD_ENABLED" in
|
|
||||||
[Yy]*)
|
|
||||||
break
|
|
||||||
;;
|
|
||||||
*)
|
|
||||||
exit 0
|
|
||||||
;;
|
|
||||||
esac
|
|
||||||
|
|
||||||
|
|
||||||
if [ -z "${REPMGRD_OPTS}" ]
|
|
||||||
then
|
|
||||||
echo "Not starting ${NAME}, REPMGRD_OPTS not set in /etc/sysconfig/${NAME}"
|
|
||||||
exit 0
|
|
||||||
fi
|
|
||||||
|
|
||||||
start()
|
|
||||||
{
|
|
||||||
REPMGRD_START=$"Starting ${NAME} service: "
|
|
||||||
|
|
||||||
# Make sure startup-time log file is valid
|
|
||||||
if [ ! -e "${REPMGRD_LOG}" -a ! -h "${REPMGRD_LOG}" ]
|
|
||||||
then
|
|
||||||
touch "${REPMGRD_LOG}" || exit 1
|
|
||||||
chown ${REPMGRD_USER}:postgres "${REPMGRD_LOG}"
|
|
||||||
chmod go-rwx "${REPMGRD_LOG}"
|
|
||||||
[ -x /sbin/restorecon ] && /sbin/restorecon "${REPMGRD_LOG}"
|
|
||||||
fi
|
|
||||||
|
|
||||||
echo -n "${REPMGRD_START}"
|
|
||||||
$SU -l $REPMGRD_USER -c "${REPMGRD_BIN} ${REPMGRD_OPTS} -p ${REPMGRD_PIDFILE} &" >> "${REPMGRD_LOG}" 2>&1 < /dev/null
|
|
||||||
sleep 2
|
|
||||||
pid=`head -n 1 "${REPMGRD_PIDFILE}" 2>/dev/null`
|
|
||||||
if [ "x${pid}" != "x" ]
|
|
||||||
then
|
|
||||||
success "${REPMGRD_START}"
|
|
||||||
touch "${REPMGRD_LOCK}"
|
|
||||||
echo $pid > "${REPMGRD_PIDFILE}"
|
|
||||||
echo
|
|
||||||
else
|
|
||||||
failure "${REPMGRD_START}"
|
|
||||||
echo
|
|
||||||
script_result=1
|
|
||||||
fi
|
|
||||||
}
|
|
||||||
|
|
||||||
stop()
|
|
||||||
{
|
|
||||||
echo -n $"Stopping ${NAME} service: "
|
|
||||||
if [ -e "${REPMGRD_LOCK}" ]
|
|
||||||
then
|
|
||||||
killproc ${NAME}
|
|
||||||
ret=$?
|
|
||||||
if [ $ret -eq 0 ]
|
|
||||||
then
|
|
||||||
echo_success
|
|
||||||
rm -f "${REPMGRD_PIDFILE}"
|
|
||||||
rm -f "${REPMGRD_LOCK}"
|
|
||||||
else
|
|
||||||
echo_failure
|
|
||||||
script_result=1
|
|
||||||
fi
|
|
||||||
else
|
|
||||||
# not running; per LSB standards this is "ok"
|
|
||||||
echo_success
|
|
||||||
fi
|
|
||||||
echo
|
|
||||||
}
|
|
||||||
|
|
||||||
|
|
||||||
# See how we were called.
|
|
||||||
case "$1" in
|
|
||||||
start)
|
|
||||||
start
|
|
||||||
;;
|
|
||||||
stop)
|
|
||||||
stop
|
|
||||||
;;
|
|
||||||
status)
|
|
||||||
status -p $REPMGRD_PIDFILE $NAME
|
|
||||||
script_result=$?
|
|
||||||
;;
|
|
||||||
restart)
|
|
||||||
stop
|
|
||||||
start
|
|
||||||
;;
|
|
||||||
*)
|
|
||||||
echo $"Usage: $0 {start|stop|status|restart}"
|
|
||||||
exit 2
|
|
||||||
esac
|
|
||||||
|
|
||||||
exit $script_result
|
|
||||||
@@ -1,21 +0,0 @@
|
|||||||
# default settings for repmgrd. This file is sourced by /bin/sh from
|
|
||||||
# /etc/init.d/repmgrd
|
|
||||||
|
|
||||||
# disable repmgrd by default so it won't get started upon installation
|
|
||||||
# valid values: yes/no
|
|
||||||
REPMGRD_ENABLED=no
|
|
||||||
|
|
||||||
# Options for repmgrd (required)
|
|
||||||
#REPMGRD_OPTS="--verbose -d -f /var/lib/pgsql/repmgr/repmgr.conf"
|
|
||||||
|
|
||||||
# User to run repmgrd as
|
|
||||||
#REPMGRD_USER=postgres
|
|
||||||
|
|
||||||
# repmgrd binary
|
|
||||||
#REPMGRD_BIN=/usr/bin/repmgrd
|
|
||||||
|
|
||||||
# pid file
|
|
||||||
#REPMGRD_PIDFILE=/var/lib/pgsql/repmgr/repmgrd.pid
|
|
||||||
|
|
||||||
# log file
|
|
||||||
#REPMGRD_LOG=/var/lib/pgsql/repmgr/repmgrd.log
|
|
||||||
11
TODO
11
TODO
@@ -40,13 +40,6 @@ Planned feature improvements
|
|||||||
* make old master node ID available for event notification commands
|
* make old master node ID available for event notification commands
|
||||||
(See github issue #80).
|
(See github issue #80).
|
||||||
|
|
||||||
* Have pg_basebackup use replication slots, if and when support for
|
|
||||||
this is added; see:
|
|
||||||
http://www.postgresql.org/message-id/555DD2B2.7020000@gmx.net
|
|
||||||
|
|
||||||
* use "primary/standby" terminology in place of "master/slave" for consistency
|
|
||||||
with main PostgreSQL usage
|
|
||||||
|
|
||||||
* repmgr standby clone: possibility to use barman instead of performing a new base backup
|
* repmgr standby clone: possibility to use barman instead of performing a new base backup
|
||||||
|
|
||||||
* possibility to transform a failed master into a new standby with pg_rewind
|
* possibility to transform a failed master into a new standby with pg_rewind
|
||||||
@@ -60,6 +53,10 @@ Planned feature improvements
|
|||||||
requested, activate the replication slot using pg_receivexlog to negate the
|
requested, activate the replication slot using pg_receivexlog to negate the
|
||||||
need to set `wal_keep_segments` just for the initial clone (9.4 and 9.5).
|
need to set `wal_keep_segments` just for the initial clone (9.4 and 9.5).
|
||||||
|
|
||||||
|
* repmgr: enable "standby follow" to point a standby at another standby, not
|
||||||
|
just the replication cluster master (see GitHub #130)
|
||||||
|
|
||||||
|
|
||||||
Usability improvements
|
Usability improvements
|
||||||
======================
|
======================
|
||||||
|
|
||||||
|
|||||||
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* check_dir.c - Directories management functions
|
* check_dir.c - Directories management functions
|
||||||
* Copyright (C) 2ndQuadrant, 2010-2015
|
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
|
|||||||
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* check_dir.h
|
* check_dir.h
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2015
|
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
|
|||||||
107
compat.c
Normal file
107
compat.c
Normal file
@@ -0,0 +1,107 @@
|
|||||||
|
/*
|
||||||
|
*
|
||||||
|
* compat.c
|
||||||
|
* Provides a couple of useful string utility functions adapted
|
||||||
|
* from the backend code, which are not publicly exposed. They're
|
||||||
|
* unlikely to change but it would be worth keeping an eye on them
|
||||||
|
* for any fixes/improvements
|
||||||
|
*
|
||||||
|
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
|
*
|
||||||
|
* Portions Copyright (c) 1996-2013, PostgreSQL Global Development Group
|
||||||
|
* Portions Copyright (c) 1994, Regents of the University of California
|
||||||
|
*
|
||||||
|
* This program is free software: you can redistribute it and/or modify
|
||||||
|
* it under the terms of the GNU General Public License as published by
|
||||||
|
* the Free Software Foundation, either version 3 of the License, or
|
||||||
|
* (at your option) any later version.
|
||||||
|
*
|
||||||
|
* This program is distributed in the hope that it will be useful,
|
||||||
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
* GNU General Public License for more details.
|
||||||
|
*
|
||||||
|
* You should have received a copy of the GNU General Public License
|
||||||
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||||
|
*
|
||||||
|
*/
|
||||||
|
|
||||||
|
#include "repmgr.h"
|
||||||
|
#include "compat.h"
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Append the given string to the buffer, with suitable quoting for passing
|
||||||
|
* the string as a value, in a keyword/pair value in a libpq connection
|
||||||
|
* string
|
||||||
|
*
|
||||||
|
* This function is adapted from src/fe_utils/string_utils.c (before 9.6
|
||||||
|
* located in: src/bin/pg_dump/dumputils.c)
|
||||||
|
*/
|
||||||
|
void
|
||||||
|
appendConnStrVal(PQExpBuffer buf, const char *str)
|
||||||
|
{
|
||||||
|
const char *s;
|
||||||
|
bool needquotes;
|
||||||
|
|
||||||
|
/*
|
||||||
|
* If the string is one or more plain ASCII characters, no need to quote
|
||||||
|
* it. This is quite conservative, but better safe than sorry.
|
||||||
|
*/
|
||||||
|
needquotes = true;
|
||||||
|
for (s = str; *s; s++)
|
||||||
|
{
|
||||||
|
if (!((*s >= 'a' && *s <= 'z') || (*s >= 'A' && *s <= 'Z') ||
|
||||||
|
(*s >= '0' && *s <= '9') || *s == '_' || *s == '.'))
|
||||||
|
{
|
||||||
|
needquotes = true;
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
needquotes = false;
|
||||||
|
}
|
||||||
|
|
||||||
|
if (needquotes)
|
||||||
|
{
|
||||||
|
appendPQExpBufferChar(buf, '\'');
|
||||||
|
while (*str)
|
||||||
|
{
|
||||||
|
/* ' and \ must be escaped to \' and \\ */
|
||||||
|
if (*str == '\'' || *str == '\\')
|
||||||
|
appendPQExpBufferChar(buf, '\\');
|
||||||
|
|
||||||
|
appendPQExpBufferChar(buf, *str);
|
||||||
|
str++;
|
||||||
|
}
|
||||||
|
appendPQExpBufferChar(buf, '\'');
|
||||||
|
}
|
||||||
|
else
|
||||||
|
appendPQExpBufferStr(buf, str);
|
||||||
|
}
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Adapted from: src/fe_utils/string_utils.c
|
||||||
|
*/
|
||||||
|
void
|
||||||
|
appendShellString(PQExpBuffer buf, const char *str)
|
||||||
|
{
|
||||||
|
const char *p;
|
||||||
|
|
||||||
|
appendPQExpBufferChar(buf, '\'');
|
||||||
|
for (p = str; *p; p++)
|
||||||
|
{
|
||||||
|
if (*p == '\n' || *p == '\r')
|
||||||
|
{
|
||||||
|
fprintf(stderr,
|
||||||
|
_("shell command argument contains a newline or carriage return: \"%s\"\n"),
|
||||||
|
str);
|
||||||
|
exit(ERR_BAD_CONFIG);
|
||||||
|
}
|
||||||
|
|
||||||
|
if (*p == '\'')
|
||||||
|
appendPQExpBufferStr(buf, "'\"'\"'");
|
||||||
|
else
|
||||||
|
appendPQExpBufferChar(buf, *p);
|
||||||
|
}
|
||||||
|
|
||||||
|
appendPQExpBufferChar(buf, '\'');
|
||||||
|
}
|
||||||
|
|
||||||
29
compat.h
Normal file
29
compat.h
Normal file
@@ -0,0 +1,29 @@
|
|||||||
|
/*
|
||||||
|
* compat.h
|
||||||
|
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
|
*
|
||||||
|
* This program is free software: you can redistribute it and/or modify
|
||||||
|
* it under the terms of the GNU General Public License as published by
|
||||||
|
* the Free Software Foundation, either version 3 of the License, or
|
||||||
|
* (at your option) any later version.
|
||||||
|
*
|
||||||
|
* This program is distributed in the hope that it will be useful,
|
||||||
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
* GNU General Public License for more details.
|
||||||
|
*
|
||||||
|
* You should have received a copy of the GNU General Public License
|
||||||
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||||
|
*
|
||||||
|
*/
|
||||||
|
|
||||||
|
#ifndef _COMPAT_H_
|
||||||
|
#define _COMPAT_H_
|
||||||
|
|
||||||
|
extern void
|
||||||
|
appendConnStrVal(PQExpBuffer buf, const char *str);
|
||||||
|
|
||||||
|
extern void
|
||||||
|
appendShellString(PQExpBuffer buf, const char *str);
|
||||||
|
|
||||||
|
#endif
|
||||||
424
config.c
424
config.c
@@ -1,6 +1,7 @@
|
|||||||
/*
|
/*
|
||||||
* config.c - Functions to parse the config file
|
* config.c - Functions to parse the config file
|
||||||
* Copyright (C) 2ndQuadrant, 2010-2015
|
*
|
||||||
|
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -9,11 +10,11 @@
|
|||||||
*
|
*
|
||||||
* This program is distributed in the hope that it will be useful,
|
* This program is distributed in the hope that it will be useful,
|
||||||
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
* GNU General Public License for more details.
|
* GNU General Public License for more details.
|
||||||
*
|
*
|
||||||
* You should have received a copy of the GNU General Public License
|
* You should have received a copy of the GNU General Public License
|
||||||
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||||
*
|
*
|
||||||
*/
|
*/
|
||||||
|
|
||||||
@@ -26,12 +27,12 @@
|
|||||||
|
|
||||||
static void parse_event_notifications_list(t_configuration_options *options, const char *arg);
|
static void parse_event_notifications_list(t_configuration_options *options, const char *arg);
|
||||||
static void tablespace_list_append(t_configuration_options *options, const char *arg);
|
static void tablespace_list_append(t_configuration_options *options, const char *arg);
|
||||||
static void exit_with_errors(ErrorList *config_errors);
|
static void exit_with_errors(ItemList *config_errors);
|
||||||
|
|
||||||
const static char *_progname = '\0';
|
const static char *_progname = NULL;
|
||||||
static char config_file_path[MAXPGPATH];
|
static char config_file_path[MAXPGPATH];
|
||||||
static bool config_file_provided = false;
|
static bool config_file_provided = false;
|
||||||
static bool config_file_found = false;
|
bool config_file_found = false;
|
||||||
|
|
||||||
|
|
||||||
void
|
void
|
||||||
@@ -54,8 +55,8 @@ progname(void)
|
|||||||
*
|
*
|
||||||
* Returns true if a configuration file could be parsed, otherwise false.
|
* Returns true if a configuration file could be parsed, otherwise false.
|
||||||
*
|
*
|
||||||
* Any configuration options changed in this function must also be changed in
|
* Any *repmgrd-specific* configuration options added/changed in this function must also be
|
||||||
* reload_config()
|
* added/changed in reload_config()
|
||||||
*
|
*
|
||||||
* NOTE: this function is called before the logger is set up, so we need
|
* NOTE: this function is called before the logger is set up, so we need
|
||||||
* to handle the verbose option ourselves; also the default log level is NOTICE,
|
* to handle the verbose option ourselves; also the default log level is NOTICE,
|
||||||
@@ -98,9 +99,9 @@ load_config(const char *config_file, bool verbose, t_configuration_options *opti
|
|||||||
/*
|
/*
|
||||||
* If no configuration file was provided, attempt to find a default file
|
* If no configuration file was provided, attempt to find a default file
|
||||||
* in this order:
|
* in this order:
|
||||||
* - current directory
|
* - current directory
|
||||||
* - /etc/repmgr.conf
|
* - /etc/repmgr.conf
|
||||||
* - default sysconfdir
|
* - default sysconfdir
|
||||||
*
|
*
|
||||||
* here we just check for the existence of the file; parse_config()
|
* here we just check for the existence of the file; parse_config()
|
||||||
* will handle read errors etc.
|
* will handle read errors etc.
|
||||||
@@ -149,7 +150,7 @@ load_config(const char *config_file, bool verbose, t_configuration_options *opti
|
|||||||
|
|
||||||
if (verbose == true)
|
if (verbose == true)
|
||||||
{
|
{
|
||||||
log_notice(_("looking for configuration file in %s"), sysconf_etc_path);
|
log_notice(_("looking for configuration file in %s\n"), sysconf_etc_path);
|
||||||
}
|
}
|
||||||
|
|
||||||
snprintf(config_file_path, MAXPGPATH, "%s/%s", sysconf_etc_path, CONFIG_FILE_NAME);
|
snprintf(config_file_path, MAXPGPATH, "%s/%s", sysconf_etc_path, CONFIG_FILE_NAME);
|
||||||
@@ -180,6 +181,23 @@ load_config(const char *config_file, bool verbose, t_configuration_options *opti
|
|||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
bool
|
||||||
|
parse_config(t_configuration_options *options)
|
||||||
|
{
|
||||||
|
/* Collate configuration file errors here for friendlier reporting */
|
||||||
|
static ItemList config_errors = { NULL, NULL };
|
||||||
|
|
||||||
|
_parse_config(options, &config_errors);
|
||||||
|
|
||||||
|
if (config_errors.head != NULL)
|
||||||
|
{
|
||||||
|
exit_with_errors(&config_errors);
|
||||||
|
}
|
||||||
|
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* Parse configuration file; if any errors are encountered,
|
* Parse configuration file; if any errors are encountered,
|
||||||
* list them and exit.
|
* list them and exit.
|
||||||
@@ -187,8 +205,8 @@ load_config(const char *config_file, bool verbose, t_configuration_options *opti
|
|||||||
* Ensure any default values set here are synced with repmgr.conf.sample
|
* Ensure any default values set here are synced with repmgr.conf.sample
|
||||||
* and any other documentation.
|
* and any other documentation.
|
||||||
*/
|
*/
|
||||||
bool
|
void
|
||||||
parse_config(t_configuration_options *options)
|
_parse_config(t_configuration_options *options, ItemList *error_list)
|
||||||
{
|
{
|
||||||
FILE *fp;
|
FILE *fp;
|
||||||
char *s,
|
char *s,
|
||||||
@@ -198,30 +216,37 @@ parse_config(t_configuration_options *options)
|
|||||||
|
|
||||||
/* For sanity-checking provided conninfo string */
|
/* For sanity-checking provided conninfo string */
|
||||||
PQconninfoOption *conninfo_options;
|
PQconninfoOption *conninfo_options;
|
||||||
char *conninfo_errmsg = NULL;
|
char *conninfo_errmsg = NULL;
|
||||||
|
|
||||||
/* Collate configuration file errors here for friendlier reporting */
|
bool node_found = false;
|
||||||
static ErrorList config_errors = { NULL, NULL };
|
|
||||||
|
|
||||||
/* Initialize configuration options with sensible defaults
|
/* Initialize configuration options with sensible defaults
|
||||||
* note: the default log level is set in log.c and does not need
|
* note: the default log level is set in log.c and does not need
|
||||||
* to be initialised here
|
* to be initialised here
|
||||||
*/
|
*/
|
||||||
memset(options->cluster_name, 0, sizeof(options->cluster_name));
|
memset(options->cluster_name, 0, sizeof(options->cluster_name));
|
||||||
options->node = -1;
|
options->node = UNKNOWN_NODE_ID;
|
||||||
options->upstream_node = NO_UPSTREAM_NODE;
|
options->upstream_node = NO_UPSTREAM_NODE;
|
||||||
options->use_replication_slots = 0;
|
options->use_replication_slots = 0;
|
||||||
memset(options->conninfo, 0, sizeof(options->conninfo));
|
memset(options->conninfo, 0, sizeof(options->conninfo));
|
||||||
|
memset(options->barman_server, 0, sizeof(options->barman_server));
|
||||||
|
memset(options->barman_config, 0, sizeof(options->barman_config));
|
||||||
options->failover = MANUAL_FAILOVER;
|
options->failover = MANUAL_FAILOVER;
|
||||||
options->priority = DEFAULT_PRIORITY;
|
options->priority = DEFAULT_PRIORITY;
|
||||||
memset(options->node_name, 0, sizeof(options->node_name));
|
memset(options->node_name, 0, sizeof(options->node_name));
|
||||||
memset(options->promote_command, 0, sizeof(options->promote_command));
|
memset(options->promote_command, 0, sizeof(options->promote_command));
|
||||||
memset(options->follow_command, 0, sizeof(options->follow_command));
|
memset(options->follow_command, 0, sizeof(options->follow_command));
|
||||||
|
memset(options->service_stop_command, 0, sizeof(options->service_stop_command));
|
||||||
|
memset(options->service_start_command, 0, sizeof(options->service_start_command));
|
||||||
|
memset(options->service_restart_command, 0, sizeof(options->service_restart_command));
|
||||||
|
memset(options->service_reload_command, 0, sizeof(options->service_reload_command));
|
||||||
|
memset(options->service_promote_command, 0, sizeof(options->service_promote_command));
|
||||||
memset(options->rsync_options, 0, sizeof(options->rsync_options));
|
memset(options->rsync_options, 0, sizeof(options->rsync_options));
|
||||||
memset(options->ssh_options, 0, sizeof(options->ssh_options));
|
memset(options->ssh_options, 0, sizeof(options->ssh_options));
|
||||||
memset(options->pg_bindir, 0, sizeof(options->pg_bindir));
|
memset(options->pg_bindir, 0, sizeof(options->pg_bindir));
|
||||||
memset(options->pg_ctl_options, 0, sizeof(options->pg_ctl_options));
|
memset(options->pg_ctl_options, 0, sizeof(options->pg_ctl_options));
|
||||||
memset(options->pg_basebackup_options, 0, sizeof(options->pg_basebackup_options));
|
memset(options->pg_basebackup_options, 0, sizeof(options->pg_basebackup_options));
|
||||||
|
memset(options->restore_command, 0, sizeof(options->restore_command));
|
||||||
|
|
||||||
/* default master_response_timeout is 60 seconds */
|
/* default master_response_timeout is 60 seconds */
|
||||||
options->master_response_timeout = 60;
|
options->master_response_timeout = 60;
|
||||||
@@ -233,7 +258,12 @@ parse_config(t_configuration_options *options)
|
|||||||
options->monitor_interval_secs = 2;
|
options->monitor_interval_secs = 2;
|
||||||
options->retry_promote_interval_secs = 300;
|
options->retry_promote_interval_secs = 300;
|
||||||
|
|
||||||
|
/* default to resyncing repl_nodes table every 30 seconds on the witness server */
|
||||||
|
options->witness_repl_nodes_sync_interval_secs = 30;
|
||||||
|
|
||||||
memset(options->event_notification_command, 0, sizeof(options->event_notification_command));
|
memset(options->event_notification_command, 0, sizeof(options->event_notification_command));
|
||||||
|
options->event_notifications.head = NULL;
|
||||||
|
options->event_notifications.tail = NULL;
|
||||||
|
|
||||||
options->tablespace_mapping.head = NULL;
|
options->tablespace_mapping.head = NULL;
|
||||||
options->tablespace_mapping.tail = NULL;
|
options->tablespace_mapping.tail = NULL;
|
||||||
@@ -244,9 +274,9 @@ parse_config(t_configuration_options *options)
|
|||||||
*/
|
*/
|
||||||
if (config_file_found == false)
|
if (config_file_found == false)
|
||||||
{
|
{
|
||||||
log_notice(_("no configuration file provided and no default file found - "
|
log_verbose(LOG_NOTICE, _("no configuration file provided and no default file found - "
|
||||||
"continuing with default values\n"));
|
"continuing with default values\n"));
|
||||||
return true;
|
return;
|
||||||
}
|
}
|
||||||
|
|
||||||
fp = fopen(config_file_path, "r");
|
fp = fopen(config_file_path, "r");
|
||||||
@@ -290,11 +320,18 @@ parse_config(t_configuration_options *options)
|
|||||||
if (strcmp(name, "cluster") == 0)
|
if (strcmp(name, "cluster") == 0)
|
||||||
strncpy(options->cluster_name, value, MAXLEN);
|
strncpy(options->cluster_name, value, MAXLEN);
|
||||||
else if (strcmp(name, "node") == 0)
|
else if (strcmp(name, "node") == 0)
|
||||||
options->node = repmgr_atoi(value, "node", &config_errors);
|
{
|
||||||
|
options->node = repmgr_atoi(value, "node", error_list, false);
|
||||||
|
node_found = true;
|
||||||
|
}
|
||||||
else if (strcmp(name, "upstream_node") == 0)
|
else if (strcmp(name, "upstream_node") == 0)
|
||||||
options->upstream_node = repmgr_atoi(value, "upstream_node", &config_errors);
|
options->upstream_node = repmgr_atoi(value, "upstream_node", error_list, false);
|
||||||
else if (strcmp(name, "conninfo") == 0)
|
else if (strcmp(name, "conninfo") == 0)
|
||||||
strncpy(options->conninfo, value, MAXLEN);
|
strncpy(options->conninfo, value, MAXLEN);
|
||||||
|
else if (strcmp(name, "barman_server") == 0)
|
||||||
|
strncpy(options->barman_server, value, MAXLEN);
|
||||||
|
else if (strcmp(name, "barman_config") == 0)
|
||||||
|
strncpy(options->barman_config, value, MAXLEN);
|
||||||
else if (strcmp(name, "rsync_options") == 0)
|
else if (strcmp(name, "rsync_options") == 0)
|
||||||
strncpy(options->rsync_options, value, QUERY_STR_LEN);
|
strncpy(options->rsync_options, value, QUERY_STR_LEN);
|
||||||
else if (strcmp(name, "ssh_options") == 0)
|
else if (strcmp(name, "ssh_options") == 0)
|
||||||
@@ -319,28 +356,39 @@ parse_config(t_configuration_options *options)
|
|||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
error_list_append(&config_errors,_("value for 'failover' must be 'automatic' or 'manual'\n"));
|
item_list_append(error_list, _("value for 'failover' must be 'automatic' or 'manual'\n"));
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
else if (strcmp(name, "priority") == 0)
|
else if (strcmp(name, "priority") == 0)
|
||||||
options->priority = repmgr_atoi(value, "priority", &config_errors);
|
options->priority = repmgr_atoi(value, "priority", error_list, true);
|
||||||
else if (strcmp(name, "node_name") == 0)
|
else if (strcmp(name, "node_name") == 0)
|
||||||
strncpy(options->node_name, value, MAXLEN);
|
strncpy(options->node_name, value, MAXLEN);
|
||||||
else if (strcmp(name, "promote_command") == 0)
|
else if (strcmp(name, "promote_command") == 0)
|
||||||
strncpy(options->promote_command, value, MAXLEN);
|
strncpy(options->promote_command, value, MAXLEN);
|
||||||
else if (strcmp(name, "follow_command") == 0)
|
else if (strcmp(name, "follow_command") == 0)
|
||||||
strncpy(options->follow_command, value, MAXLEN);
|
strncpy(options->follow_command, value, MAXLEN);
|
||||||
|
else if (strcmp(name, "service_stop_command") == 0)
|
||||||
|
strncpy(options->service_stop_command, value, MAXLEN);
|
||||||
|
else if (strcmp(name, "service_start_command") == 0)
|
||||||
|
strncpy(options->service_start_command, value, MAXLEN);
|
||||||
|
else if (strcmp(name, "service_restart_command") == 0)
|
||||||
|
strncpy(options->service_restart_command, value, MAXLEN);
|
||||||
|
else if (strcmp(name, "service_reload_command") == 0)
|
||||||
|
strncpy(options->service_reload_command, value, MAXLEN);
|
||||||
|
else if (strcmp(name, "service_promote_command") == 0)
|
||||||
|
strncpy(options->service_promote_command, value, MAXLEN);
|
||||||
else if (strcmp(name, "master_response_timeout") == 0)
|
else if (strcmp(name, "master_response_timeout") == 0)
|
||||||
options->master_response_timeout = repmgr_atoi(value, "master_response_timeout", &config_errors);
|
options->master_response_timeout = repmgr_atoi(value, "master_response_timeout", error_list, false);
|
||||||
/* 'primary_response_timeout' as synonym for 'master_response_timeout' -
|
/*
|
||||||
|
* 'primary_response_timeout' as synonym for 'master_response_timeout' -
|
||||||
* we'll switch terminology in a future release (3.1?)
|
* we'll switch terminology in a future release (3.1?)
|
||||||
*/
|
*/
|
||||||
else if (strcmp(name, "primary_response_timeout") == 0)
|
else if (strcmp(name, "primary_response_timeout") == 0)
|
||||||
options->master_response_timeout = repmgr_atoi(value, "primary_response_timeout", &config_errors);
|
options->master_response_timeout = repmgr_atoi(value, "primary_response_timeout", error_list, false);
|
||||||
else if (strcmp(name, "reconnect_attempts") == 0)
|
else if (strcmp(name, "reconnect_attempts") == 0)
|
||||||
options->reconnect_attempts = repmgr_atoi(value, "reconnect_attempts", &config_errors);
|
options->reconnect_attempts = repmgr_atoi(value, "reconnect_attempts", error_list, false);
|
||||||
else if (strcmp(name, "reconnect_interval") == 0)
|
else if (strcmp(name, "reconnect_interval") == 0)
|
||||||
options->reconnect_interval = repmgr_atoi(value, "reconnect_interval", &config_errors);
|
options->reconnect_interval = repmgr_atoi(value, "reconnect_interval", error_list, false);
|
||||||
else if (strcmp(name, "pg_bindir") == 0)
|
else if (strcmp(name, "pg_bindir") == 0)
|
||||||
strncpy(options->pg_bindir, value, MAXLEN);
|
strncpy(options->pg_bindir, value, MAXLEN);
|
||||||
else if (strcmp(name, "pg_ctl_options") == 0)
|
else if (strcmp(name, "pg_ctl_options") == 0)
|
||||||
@@ -350,18 +398,22 @@ parse_config(t_configuration_options *options)
|
|||||||
else if (strcmp(name, "logfile") == 0)
|
else if (strcmp(name, "logfile") == 0)
|
||||||
strncpy(options->logfile, value, MAXLEN);
|
strncpy(options->logfile, value, MAXLEN);
|
||||||
else if (strcmp(name, "monitor_interval_secs") == 0)
|
else if (strcmp(name, "monitor_interval_secs") == 0)
|
||||||
options->monitor_interval_secs = repmgr_atoi(value, "monitor_interval_secs", &config_errors);
|
options->monitor_interval_secs = repmgr_atoi(value, "monitor_interval_secs", error_list, false);
|
||||||
else if (strcmp(name, "retry_promote_interval_secs") == 0)
|
else if (strcmp(name, "retry_promote_interval_secs") == 0)
|
||||||
options->retry_promote_interval_secs = repmgr_atoi(value, "retry_promote_interval_secs", &config_errors);
|
options->retry_promote_interval_secs = repmgr_atoi(value, "retry_promote_interval_secs", error_list, false);
|
||||||
|
else if (strcmp(name, "witness_repl_nodes_sync_interval_secs") == 0)
|
||||||
|
options->witness_repl_nodes_sync_interval_secs = repmgr_atoi(value, "witness_repl_nodes_sync_interval_secs", error_list, false);
|
||||||
else if (strcmp(name, "use_replication_slots") == 0)
|
else if (strcmp(name, "use_replication_slots") == 0)
|
||||||
/* XXX we should have a dedicated boolean argument format */
|
/* XXX we should have a dedicated boolean argument format */
|
||||||
options->use_replication_slots = repmgr_atoi(value, "use_replication_slots", &config_errors);
|
options->use_replication_slots = repmgr_atoi(value, "use_replication_slots", error_list, false);
|
||||||
else if (strcmp(name, "event_notification_command") == 0)
|
else if (strcmp(name, "event_notification_command") == 0)
|
||||||
strncpy(options->event_notification_command, value, MAXLEN);
|
strncpy(options->event_notification_command, value, MAXLEN);
|
||||||
else if (strcmp(name, "event_notifications") == 0)
|
else if (strcmp(name, "event_notifications") == 0)
|
||||||
parse_event_notifications_list(options, value);
|
parse_event_notifications_list(options, value);
|
||||||
else if (strcmp(name, "tablespace_mapping") == 0)
|
else if (strcmp(name, "tablespace_mapping") == 0)
|
||||||
tablespace_list_append(options, value);
|
tablespace_list_append(options, value);
|
||||||
|
else if (strcmp(name, "restore_command") == 0)
|
||||||
|
strncpy(options->restore_command, value, MAXLEN);
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
known_parameter = false;
|
known_parameter = false;
|
||||||
@@ -381,35 +433,27 @@ parse_config(t_configuration_options *options)
|
|||||||
_("no value provided for parameter \"%s\""),
|
_("no value provided for parameter \"%s\""),
|
||||||
name);
|
name);
|
||||||
|
|
||||||
error_list_append(&config_errors, error_message_buf);
|
item_list_append(error_list, error_message_buf);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
fclose(fp);
|
fclose(fp);
|
||||||
|
|
||||||
/* Check config settings */
|
|
||||||
|
|
||||||
/* The following checks are for the presence of the parameter */
|
if (node_found == false)
|
||||||
if (*options->cluster_name == '\0')
|
|
||||||
{
|
{
|
||||||
error_list_append(&config_errors, _("\"cluster\": parameter was not found\n"));
|
item_list_append(error_list, _("\"node\": parameter was not found"));
|
||||||
|
}
|
||||||
|
else if (options->node == 0)
|
||||||
|
{
|
||||||
|
item_list_append(error_list, _("\"node\": must be greater than zero"));
|
||||||
|
}
|
||||||
|
else if (options->node < 0)
|
||||||
|
{
|
||||||
|
item_list_append(error_list, _("\"node\": must be a positive signed 32 bit integer, i.e. 2147483647 or less"));
|
||||||
}
|
}
|
||||||
|
|
||||||
if (options->node == -1)
|
if (strlen(options->conninfo))
|
||||||
{
|
|
||||||
error_list_append(&config_errors, _("\"node\": parameter was not found\n"));
|
|
||||||
}
|
|
||||||
|
|
||||||
if (*options->node_name == '\0')
|
|
||||||
{
|
|
||||||
error_list_append(&config_errors, _("\"node_name\": parameter was not found\n"));
|
|
||||||
}
|
|
||||||
|
|
||||||
if (*options->conninfo == '\0')
|
|
||||||
{
|
|
||||||
error_list_append(&config_errors, _("\"conninfo\": parameter was not found\n"));
|
|
||||||
}
|
|
||||||
else
|
|
||||||
{
|
{
|
||||||
|
|
||||||
/* Sanity check the provided conninfo string
|
/* Sanity check the provided conninfo string
|
||||||
@@ -426,18 +470,11 @@ parse_config(t_configuration_options *options)
|
|||||||
_("\"conninfo\": %s"),
|
_("\"conninfo\": %s"),
|
||||||
conninfo_errmsg);
|
conninfo_errmsg);
|
||||||
|
|
||||||
error_list_append(&config_errors, error_message_buf);
|
item_list_append(error_list, error_message_buf);
|
||||||
}
|
}
|
||||||
|
|
||||||
PQconninfoFree(conninfo_options);
|
PQconninfoFree(conninfo_options);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (config_errors.head != NULL)
|
|
||||||
{
|
|
||||||
exit_with_errors(&config_errors);
|
|
||||||
}
|
|
||||||
|
|
||||||
return true;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
@@ -527,70 +564,85 @@ parse_line(char *buf, char *name, char *value)
|
|||||||
trim(value);
|
trim(value);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
/*
|
||||||
|
* reload_config()
|
||||||
|
*
|
||||||
|
* This is only called by repmgrd after receiving a SIGHUP or when a monitoring
|
||||||
|
* loop is started up; it therefore only needs to reload options required
|
||||||
|
* by repmgrd, which are as follows:
|
||||||
|
*
|
||||||
|
* changeable options:
|
||||||
|
* - failover
|
||||||
|
* - follow_command
|
||||||
|
* - logfacility
|
||||||
|
* - logfile
|
||||||
|
* - loglevel
|
||||||
|
* - master_response_timeout
|
||||||
|
* - monitor_interval_secs
|
||||||
|
* - priority
|
||||||
|
* - promote_command
|
||||||
|
* - reconnect_attempts
|
||||||
|
* - reconnect_interval
|
||||||
|
* - retry_promote_interval_secs
|
||||||
|
* - witness_repl_nodes_sync_interval_secs
|
||||||
|
*
|
||||||
|
* non-changeable options:
|
||||||
|
* - cluster_name
|
||||||
|
* - conninfo
|
||||||
|
* - node
|
||||||
|
* - node_name
|
||||||
|
*
|
||||||
|
* extract with something like:
|
||||||
|
* grep local_options\\. repmgrd.c | perl -n -e '/local_options\.([\w_]+)/ && print qq|$1\n|;' | sort | uniq
|
||||||
|
|
||||||
|
*/
|
||||||
bool
|
bool
|
||||||
reload_config(t_configuration_options *orig_options)
|
reload_config(t_configuration_options *orig_options)
|
||||||
{
|
{
|
||||||
PGconn *conn;
|
PGconn *conn;
|
||||||
t_configuration_options new_options;
|
t_configuration_options new_options = T_CONFIGURATION_OPTIONS_INITIALIZER;
|
||||||
bool config_changed = false;
|
bool config_changed = false;
|
||||||
|
bool log_config_changed = false;
|
||||||
|
|
||||||
|
static ItemList config_errors = { NULL, NULL };
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* Re-read the configuration file: repmgr.conf
|
* Re-read the configuration file: repmgr.conf
|
||||||
*/
|
*/
|
||||||
log_info(_("reloading configuration file and updating repmgr tables\n"));
|
log_info(_("reloading configuration file\n"));
|
||||||
|
|
||||||
parse_config(&new_options);
|
_parse_config(&new_options, &config_errors);
|
||||||
if (new_options.node == -1)
|
|
||||||
|
if (config_errors.head != NULL)
|
||||||
{
|
{
|
||||||
|
/* XXX dump errors to log */
|
||||||
log_warning(_("unable to parse new configuration, retaining current configuration\n"));
|
log_warning(_("unable to parse new configuration, retaining current configuration\n"));
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/* The following options cannot be changed */
|
||||||
if (strcmp(new_options.cluster_name, orig_options->cluster_name) != 0)
|
if (strcmp(new_options.cluster_name, orig_options->cluster_name) != 0)
|
||||||
{
|
{
|
||||||
log_warning(_("unable to change cluster name, retaining current configuration\n"));
|
log_warning(_("cluster_name cannot be changed, retaining current configuration\n"));
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
|
||||||
if (new_options.node != orig_options->node)
|
if (new_options.node != orig_options->node)
|
||||||
{
|
{
|
||||||
log_warning(_("unable to change node ID, retaining current configuration\n"));
|
log_warning(_("node ID cannot be changed, retaining current configuration\n"));
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
|
||||||
if (strcmp(new_options.node_name, orig_options->node_name) != 0)
|
if (strcmp(new_options.node_name, orig_options->node_name) != 0)
|
||||||
{
|
{
|
||||||
log_warning(_("unable to change standby name, keeping current configuration\n"));
|
log_warning(_("node_name cannot be changed, keeping current configuration\n"));
|
||||||
return false;
|
|
||||||
}
|
|
||||||
|
|
||||||
if (new_options.failover != MANUAL_FAILOVER && new_options.failover != AUTOMATIC_FAILOVER)
|
|
||||||
{
|
|
||||||
log_warning(_("new value for 'failover' must be 'automatic' or 'manual'\n"));
|
|
||||||
return false;
|
|
||||||
}
|
|
||||||
|
|
||||||
if (new_options.master_response_timeout <= 0)
|
|
||||||
{
|
|
||||||
log_warning(_("new value for 'master_response_timeout' must be greater than zero\n"));
|
|
||||||
return false;
|
|
||||||
}
|
|
||||||
|
|
||||||
if (new_options.reconnect_attempts < 0)
|
|
||||||
{
|
|
||||||
log_warning(_("new value for 'reconnect_attempts' must be zero or greater\n"));
|
|
||||||
return false;
|
|
||||||
}
|
|
||||||
|
|
||||||
if (new_options.reconnect_interval < 0)
|
|
||||||
{
|
|
||||||
log_warning(_("new value for 'reconnect_interval' must be zero or greater\n"));
|
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
|
||||||
if (strcmp(orig_options->conninfo, new_options.conninfo) != 0)
|
if (strcmp(orig_options->conninfo, new_options.conninfo) != 0)
|
||||||
{
|
{
|
||||||
/* Test conninfo string */
|
/* Test conninfo string works*/
|
||||||
conn = establish_db_connection(new_options.conninfo, false);
|
conn = establish_db_connection(new_options.conninfo, false);
|
||||||
if (!conn || (PQstatus(conn) != CONNECTION_OK))
|
if (!conn || (PQstatus(conn) != CONNECTION_OK))
|
||||||
{
|
{
|
||||||
@@ -607,27 +659,6 @@ reload_config(t_configuration_options *orig_options)
|
|||||||
* to manage them
|
* to manage them
|
||||||
*/
|
*/
|
||||||
|
|
||||||
/* cluster_name */
|
|
||||||
if (strcmp(orig_options->cluster_name, new_options.cluster_name) != 0)
|
|
||||||
{
|
|
||||||
strcpy(orig_options->cluster_name, new_options.cluster_name);
|
|
||||||
config_changed = true;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* conninfo */
|
|
||||||
if (strcmp(orig_options->conninfo, new_options.conninfo) != 0)
|
|
||||||
{
|
|
||||||
strcpy(orig_options->conninfo, new_options.conninfo);
|
|
||||||
config_changed = true;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* node */
|
|
||||||
if (orig_options->node != new_options.node)
|
|
||||||
{
|
|
||||||
orig_options->node = new_options.node;
|
|
||||||
config_changed = true;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* failover */
|
/* failover */
|
||||||
if (orig_options->failover != new_options.failover)
|
if (orig_options->failover != new_options.failover)
|
||||||
{
|
{
|
||||||
@@ -635,27 +666,6 @@ reload_config(t_configuration_options *orig_options)
|
|||||||
config_changed = true;
|
config_changed = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
/* priority */
|
|
||||||
if (orig_options->priority != new_options.priority)
|
|
||||||
{
|
|
||||||
orig_options->priority = new_options.priority;
|
|
||||||
config_changed = true;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* node_name */
|
|
||||||
if (strcmp(orig_options->node_name, new_options.node_name) != 0)
|
|
||||||
{
|
|
||||||
strcpy(orig_options->node_name, new_options.node_name);
|
|
||||||
config_changed = true;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* promote_command */
|
|
||||||
if (strcmp(orig_options->promote_command, new_options.promote_command) != 0)
|
|
||||||
{
|
|
||||||
strcpy(orig_options->promote_command, new_options.promote_command);
|
|
||||||
config_changed = true;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* follow_command */
|
/* follow_command */
|
||||||
if (strcmp(orig_options->follow_command, new_options.follow_command) != 0)
|
if (strcmp(orig_options->follow_command, new_options.follow_command) != 0)
|
||||||
{
|
{
|
||||||
@@ -663,30 +673,6 @@ reload_config(t_configuration_options *orig_options)
|
|||||||
config_changed = true;
|
config_changed = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
/*
|
|
||||||
* XXX These ones can change with a simple SIGHUP?
|
|
||||||
*
|
|
||||||
* strcpy (orig_options->loglevel, new_options.loglevel); strcpy
|
|
||||||
* (orig_options->logfacility, new_options.logfacility);
|
|
||||||
*
|
|
||||||
* logger_shutdown(); XXX do we have progname here ? logger_init(progname,
|
|
||||||
* orig_options.loglevel, orig_options.logfacility);
|
|
||||||
*/
|
|
||||||
|
|
||||||
/* rsync_options */
|
|
||||||
if (strcmp(orig_options->rsync_options, new_options.rsync_options) != 0)
|
|
||||||
{
|
|
||||||
strcpy(orig_options->rsync_options, new_options.rsync_options);
|
|
||||||
config_changed = true;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* ssh_options */
|
|
||||||
if (strcmp(orig_options->ssh_options, new_options.ssh_options) != 0)
|
|
||||||
{
|
|
||||||
strcpy(orig_options->ssh_options, new_options.ssh_options);
|
|
||||||
config_changed = true;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* master_response_timeout */
|
/* master_response_timeout */
|
||||||
if (orig_options->master_response_timeout != new_options.master_response_timeout)
|
if (orig_options->master_response_timeout != new_options.master_response_timeout)
|
||||||
{
|
{
|
||||||
@@ -694,6 +680,27 @@ reload_config(t_configuration_options *orig_options)
|
|||||||
config_changed = true;
|
config_changed = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/* monitor_interval_secs */
|
||||||
|
if (orig_options->monitor_interval_secs != new_options.monitor_interval_secs)
|
||||||
|
{
|
||||||
|
orig_options->monitor_interval_secs = new_options.monitor_interval_secs;
|
||||||
|
config_changed = true;
|
||||||
|
}
|
||||||
|
|
||||||
|
/* priority */
|
||||||
|
if (orig_options->priority != new_options.priority)
|
||||||
|
{
|
||||||
|
orig_options->priority = new_options.priority;
|
||||||
|
config_changed = true;
|
||||||
|
}
|
||||||
|
|
||||||
|
/* promote_command */
|
||||||
|
if (strcmp(orig_options->promote_command, new_options.promote_command) != 0)
|
||||||
|
{
|
||||||
|
strcpy(orig_options->promote_command, new_options.promote_command);
|
||||||
|
config_changed = true;
|
||||||
|
}
|
||||||
|
|
||||||
/* reconnect_attempts */
|
/* reconnect_attempts */
|
||||||
if (orig_options->reconnect_attempts != new_options.reconnect_attempts)
|
if (orig_options->reconnect_attempts != new_options.reconnect_attempts)
|
||||||
{
|
{
|
||||||
@@ -708,27 +715,6 @@ reload_config(t_configuration_options *orig_options)
|
|||||||
config_changed = true;
|
config_changed = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
/* pg_ctl_options */
|
|
||||||
if (strcmp(orig_options->pg_ctl_options, new_options.pg_ctl_options) != 0)
|
|
||||||
{
|
|
||||||
strcpy(orig_options->pg_ctl_options, new_options.pg_ctl_options);
|
|
||||||
config_changed = true;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* pg_basebackup_options */
|
|
||||||
if (strcmp(orig_options->pg_basebackup_options, new_options.pg_basebackup_options) != 0)
|
|
||||||
{
|
|
||||||
strcpy(orig_options->pg_basebackup_options, new_options.pg_basebackup_options);
|
|
||||||
config_changed = true;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* monitor_interval_secs */
|
|
||||||
if (orig_options->monitor_interval_secs != new_options.monitor_interval_secs)
|
|
||||||
{
|
|
||||||
orig_options->monitor_interval_secs = new_options.monitor_interval_secs;
|
|
||||||
config_changed = true;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* retry_promote_interval_secs */
|
/* retry_promote_interval_secs */
|
||||||
if (orig_options->retry_promote_interval_secs != new_options.retry_promote_interval_secs)
|
if (orig_options->retry_promote_interval_secs != new_options.retry_promote_interval_secs)
|
||||||
{
|
{
|
||||||
@@ -736,20 +722,54 @@ reload_config(t_configuration_options *orig_options)
|
|||||||
config_changed = true;
|
config_changed = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
/* use_replication_slots */
|
|
||||||
if (orig_options->use_replication_slots != new_options.use_replication_slots)
|
/* witness_repl_nodes_sync_interval_secs */
|
||||||
|
if (orig_options->witness_repl_nodes_sync_interval_secs != new_options.witness_repl_nodes_sync_interval_secs)
|
||||||
{
|
{
|
||||||
orig_options->use_replication_slots = new_options.use_replication_slots;
|
orig_options->witness_repl_nodes_sync_interval_secs = new_options.witness_repl_nodes_sync_interval_secs;
|
||||||
config_changed = true;
|
config_changed = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Handle changes to logging configuration
|
||||||
|
*/
|
||||||
|
if (strcmp(orig_options->logfacility, new_options.logfacility) != 0)
|
||||||
|
{
|
||||||
|
strcpy(orig_options->logfacility, new_options.logfacility);
|
||||||
|
log_config_changed = true;
|
||||||
|
}
|
||||||
|
|
||||||
|
if (strcmp(orig_options->logfile, new_options.logfile) != 0)
|
||||||
|
{
|
||||||
|
strcpy(orig_options->logfile, new_options.logfile);
|
||||||
|
log_config_changed = true;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
if (strcmp(orig_options->loglevel, new_options.loglevel) != 0)
|
||||||
|
{
|
||||||
|
strcpy(orig_options->loglevel, new_options.loglevel);
|
||||||
|
log_config_changed = true;
|
||||||
|
}
|
||||||
|
|
||||||
|
if (log_config_changed == true)
|
||||||
|
{
|
||||||
|
log_notice(_("restarting logging with changed parameters\n"));
|
||||||
|
logger_shutdown();
|
||||||
|
logger_init(orig_options, progname());
|
||||||
|
}
|
||||||
|
|
||||||
if (config_changed == true)
|
if (config_changed == true)
|
||||||
{
|
{
|
||||||
log_debug(_("reload_config(): configuration has changed\n"));
|
log_notice(_("configuration file reloaded with changed parameters\n"));
|
||||||
}
|
}
|
||||||
else
|
/*
|
||||||
|
* if logging configuration changed, don't say the configuration didn't
|
||||||
|
* change, as it clearly has.
|
||||||
|
*/
|
||||||
|
else if (log_config_changed == false)
|
||||||
{
|
{
|
||||||
log_debug(_("reload_config(): configuration has not changed\n"));
|
log_info(_("configuration has not changed\n"));
|
||||||
}
|
}
|
||||||
|
|
||||||
return config_changed;
|
return config_changed;
|
||||||
@@ -757,11 +777,11 @@ reload_config(t_configuration_options *orig_options)
|
|||||||
|
|
||||||
|
|
||||||
void
|
void
|
||||||
error_list_append(ErrorList *error_list, char *error_message)
|
item_list_append(ItemList *item_list, char *error_message)
|
||||||
{
|
{
|
||||||
ErrorListCell *cell;
|
ItemListCell *cell;
|
||||||
|
|
||||||
cell = (ErrorListCell *) pg_malloc0(sizeof(ErrorListCell));
|
cell = (ItemListCell *) pg_malloc0(sizeof(ItemListCell));
|
||||||
|
|
||||||
if (cell == NULL)
|
if (cell == NULL)
|
||||||
{
|
{
|
||||||
@@ -769,19 +789,19 @@ error_list_append(ErrorList *error_list, char *error_message)
|
|||||||
exit(ERR_BAD_CONFIG);
|
exit(ERR_BAD_CONFIG);
|
||||||
}
|
}
|
||||||
|
|
||||||
cell->error_message = pg_malloc0(MAXLEN);
|
cell->string = pg_malloc0(MAXLEN);
|
||||||
strncpy(cell->error_message, error_message, MAXLEN);
|
strncpy(cell->string, error_message, MAXLEN);
|
||||||
|
|
||||||
if (error_list->tail)
|
if (item_list->tail)
|
||||||
{
|
{
|
||||||
error_list->tail->next = cell;
|
item_list->tail->next = cell;
|
||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
error_list->head = cell;
|
item_list->head = cell;
|
||||||
}
|
}
|
||||||
|
|
||||||
error_list->tail = cell;
|
item_list->tail = cell;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
@@ -791,7 +811,7 @@ error_list_append(ErrorList *error_list, char *error_message)
|
|||||||
* otherwise exit
|
* otherwise exit
|
||||||
*/
|
*/
|
||||||
int
|
int
|
||||||
repmgr_atoi(const char *value, const char *config_item, ErrorList *error_list)
|
repmgr_atoi(const char *value, const char *config_item, ItemList *error_list, bool allow_negative)
|
||||||
{
|
{
|
||||||
char *endptr;
|
char *endptr;
|
||||||
long longval = 0;
|
long longval = 0;
|
||||||
@@ -822,8 +842,8 @@ repmgr_atoi(const char *value, const char *config_item, ErrorList *error_list)
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
/* Currently there are no values which could be negative */
|
/* Disallow negative values for most parameters */
|
||||||
if (longval < 0)
|
if (allow_negative == false && longval < 0)
|
||||||
{
|
{
|
||||||
snprintf(error_message_buf,
|
snprintf(error_message_buf,
|
||||||
MAXLEN,
|
MAXLEN,
|
||||||
@@ -840,7 +860,7 @@ repmgr_atoi(const char *value, const char *config_item, ErrorList *error_list)
|
|||||||
exit(ERR_BAD_CONFIG);
|
exit(ERR_BAD_CONFIG);
|
||||||
}
|
}
|
||||||
|
|
||||||
error_list_append(error_list, error_message_buf);
|
item_list_append(error_list, error_message_buf);
|
||||||
}
|
}
|
||||||
|
|
||||||
return (int32) longval;
|
return (int32) longval;
|
||||||
@@ -923,7 +943,7 @@ static void
|
|||||||
parse_event_notifications_list(t_configuration_options *options, const char *arg)
|
parse_event_notifications_list(t_configuration_options *options, const char *arg)
|
||||||
{
|
{
|
||||||
const char *arg_ptr;
|
const char *arg_ptr;
|
||||||
char event_type_buf[MAXLEN] = "";
|
char event_type_buf[MAXLEN] = "";
|
||||||
char *dst_ptr = event_type_buf;
|
char *dst_ptr = event_type_buf;
|
||||||
|
|
||||||
|
|
||||||
@@ -982,15 +1002,15 @@ parse_event_notifications_list(t_configuration_options *options, const char *arg
|
|||||||
|
|
||||||
|
|
||||||
static void
|
static void
|
||||||
exit_with_errors(ErrorList *config_errors)
|
exit_with_errors(ItemList *config_errors)
|
||||||
{
|
{
|
||||||
ErrorListCell *cell;
|
ItemListCell *cell;
|
||||||
|
|
||||||
log_err(_("%s: following errors were found in the configuration file.\n"), progname());
|
log_err(_("%s: following errors were found in the configuration file.\n"), progname());
|
||||||
|
|
||||||
for (cell = config_errors->head; cell; cell = cell->next)
|
for (cell = config_errors->head; cell; cell = cell->next)
|
||||||
{
|
{
|
||||||
log_err("%s\n", cell->error_message);
|
log_err("%s\n", cell->string);
|
||||||
}
|
}
|
||||||
|
|
||||||
exit(ERR_BAD_CONFIG);
|
exit(ERR_BAD_CONFIG);
|
||||||
|
|||||||
64
config.h
64
config.h
@@ -1,6 +1,7 @@
|
|||||||
/*
|
/*
|
||||||
* config.h
|
* config.h
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2015
|
*
|
||||||
|
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -57,11 +58,20 @@ typedef struct
|
|||||||
int node;
|
int node;
|
||||||
int upstream_node;
|
int upstream_node;
|
||||||
char conninfo[MAXLEN];
|
char conninfo[MAXLEN];
|
||||||
|
char barman_server[MAXLEN];
|
||||||
|
char barman_config[MAXLEN];
|
||||||
int failover;
|
int failover;
|
||||||
int priority;
|
int priority;
|
||||||
char node_name[MAXLEN];
|
char node_name[MAXLEN];
|
||||||
|
/* commands executed by repmgrd */
|
||||||
char promote_command[MAXLEN];
|
char promote_command[MAXLEN];
|
||||||
char follow_command[MAXLEN];
|
char follow_command[MAXLEN];
|
||||||
|
/* Overrides for pg_ctl commands */
|
||||||
|
char service_stop_command[MAXLEN];
|
||||||
|
char service_start_command[MAXLEN];
|
||||||
|
char service_restart_command[MAXLEN];
|
||||||
|
char service_reload_command[MAXLEN];
|
||||||
|
char service_promote_command[MAXLEN];
|
||||||
char loglevel[MAXLEN];
|
char loglevel[MAXLEN];
|
||||||
char logfacility[MAXLEN];
|
char logfacility[MAXLEN];
|
||||||
char rsync_options[QUERY_STR_LEN];
|
char rsync_options[QUERY_STR_LEN];
|
||||||
@@ -72,40 +82,66 @@ typedef struct
|
|||||||
char pg_bindir[MAXLEN];
|
char pg_bindir[MAXLEN];
|
||||||
char pg_ctl_options[MAXLEN];
|
char pg_ctl_options[MAXLEN];
|
||||||
char pg_basebackup_options[MAXLEN];
|
char pg_basebackup_options[MAXLEN];
|
||||||
|
char restore_command[MAXLEN];
|
||||||
char logfile[MAXLEN];
|
char logfile[MAXLEN];
|
||||||
int monitor_interval_secs;
|
int monitor_interval_secs;
|
||||||
int retry_promote_interval_secs;
|
int retry_promote_interval_secs;
|
||||||
|
int witness_repl_nodes_sync_interval_secs;
|
||||||
int use_replication_slots;
|
int use_replication_slots;
|
||||||
char event_notification_command[MAXLEN];
|
char event_notification_command[MAXLEN];
|
||||||
EventNotificationList event_notifications;
|
EventNotificationList event_notifications;
|
||||||
TablespaceList tablespace_mapping;
|
TablespaceList tablespace_mapping;
|
||||||
} t_configuration_options;
|
} t_configuration_options;
|
||||||
|
|
||||||
#define T_CONFIGURATION_OPTIONS_INITIALIZER { "", -1, NO_UPSTREAM_NODE, "", MANUAL_FAILOVER, -1, "", "", "", "", "", "", "", -1, -1, -1, "", "", "", "", 0, 0, 0, "", { NULL, NULL }, {NULL, NULL} }
|
/*
|
||||||
|
* The following will initialize the structure with a minimal set of options;
|
||||||
|
* actual defaults are set in parse_config() before parsing the configuration file
|
||||||
|
*/
|
||||||
|
#define T_CONFIGURATION_OPTIONS_INITIALIZER { "", UNKNOWN_NODE_ID, NO_UPSTREAM_NODE, "", "", "", MANUAL_FAILOVER, -1, "", "", "", "", "", "", "", "", "", "", "", "", -1, -1, -1, "", "", "", "", "", 0, 0, 0, 0, "", { NULL, NULL }, { NULL, NULL } }
|
||||||
|
|
||||||
typedef struct ErrorListCell
|
typedef struct ItemListCell
|
||||||
{
|
{
|
||||||
struct ErrorListCell *next;
|
struct ItemListCell *next;
|
||||||
char *error_message;
|
char *string;
|
||||||
} ErrorListCell;
|
} ItemListCell;
|
||||||
|
|
||||||
typedef struct ErrorList
|
typedef struct ItemList
|
||||||
{
|
{
|
||||||
ErrorListCell *head;
|
ItemListCell *head;
|
||||||
ErrorListCell *tail;
|
ItemListCell *tail;
|
||||||
} ErrorList;
|
} ItemList;
|
||||||
|
|
||||||
|
typedef struct TablespaceDataListCell
|
||||||
|
{
|
||||||
|
struct TablespaceDataListCell *next;
|
||||||
|
char *name;
|
||||||
|
char *oid;
|
||||||
|
char *location;
|
||||||
|
/* optional payload */
|
||||||
|
FILE *f;
|
||||||
|
} TablespaceDataListCell;
|
||||||
|
|
||||||
|
typedef struct TablespaceDataList
|
||||||
|
{
|
||||||
|
TablespaceDataListCell *head;
|
||||||
|
TablespaceDataListCell *tail;
|
||||||
|
} TablespaceDataList;
|
||||||
|
|
||||||
void set_progname(const char *argv0);
|
void set_progname(const char *argv0);
|
||||||
const char * progname(void);
|
const char * progname(void);
|
||||||
|
|
||||||
bool load_config(const char *config_file, bool verbose, t_configuration_options *options, char *argv0);
|
bool load_config(const char *config_file, bool verbose, t_configuration_options *options, char *argv0);
|
||||||
bool reload_config(t_configuration_options *orig_options);
|
|
||||||
|
void _parse_config(t_configuration_options *options, ItemList *error_list);
|
||||||
bool parse_config(t_configuration_options *options);
|
bool parse_config(t_configuration_options *options);
|
||||||
|
bool reload_config(t_configuration_options *orig_options);
|
||||||
|
|
||||||
void parse_line(char *buff, char *name, char *value);
|
void parse_line(char *buff, char *name, char *value);
|
||||||
char *trim(char *s);
|
char *trim(char *s);
|
||||||
void error_list_append(ErrorList *error_list, char *error_message);
|
void item_list_append(ItemList *item_list, char *error_message);
|
||||||
int repmgr_atoi(const char *s,
|
int repmgr_atoi(const char *s,
|
||||||
const char *config_item,
|
const char *config_item,
|
||||||
ErrorList *error_list);
|
ItemList *error_list,
|
||||||
|
bool allow_negative);
|
||||||
|
extern bool config_file_found;
|
||||||
#endif
|
#endif
|
||||||
|
|||||||
50
dbutils.h
50
dbutils.h
@@ -1,6 +1,7 @@
|
|||||||
/*
|
/*
|
||||||
* dbutils.h
|
* dbutils.h
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2015
|
*
|
||||||
|
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -21,6 +22,7 @@
|
|||||||
#define _REPMGR_DBUTILS_H_
|
#define _REPMGR_DBUTILS_H_
|
||||||
|
|
||||||
#include "access/xlogdefs.h"
|
#include "access/xlogdefs.h"
|
||||||
|
#include "pqexpbuffer.h"
|
||||||
|
|
||||||
#include "config.h"
|
#include "config.h"
|
||||||
#include "strutil.h"
|
#include "strutil.h"
|
||||||
@@ -66,8 +68,27 @@ typedef struct s_node_info
|
|||||||
InvalidXLogRecPtr \
|
InvalidXLogRecPtr \
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Struct to store replication slot information
|
||||||
|
*/
|
||||||
|
|
||||||
|
typedef struct s_replication_slot
|
||||||
|
{
|
||||||
|
char slot_name[MAXLEN];
|
||||||
|
char slot_type[MAXLEN];
|
||||||
|
bool active;
|
||||||
|
} t_replication_slot;
|
||||||
|
|
||||||
|
extern char repmgr_schema[MAXLEN];
|
||||||
|
|
||||||
|
PGconn *_establish_db_connection(const char *conninfo,
|
||||||
|
const bool exit_on_error,
|
||||||
|
const bool log_notice,
|
||||||
|
const bool verbose_only);
|
||||||
PGconn *establish_db_connection(const char *conninfo,
|
PGconn *establish_db_connection(const char *conninfo,
|
||||||
const bool exit_on_error);
|
const bool exit_on_error);
|
||||||
|
PGconn *establish_db_connection_quiet(const char *conninfo);
|
||||||
|
PGconn *test_db_connection(const char *conninfo);
|
||||||
PGconn *establish_db_connection_by_params(const char *keywords[],
|
PGconn *establish_db_connection_by_params(const char *keywords[],
|
||||||
const char *values[],
|
const char *values[],
|
||||||
const bool exit_on_error);
|
const bool exit_on_error);
|
||||||
@@ -86,7 +107,7 @@ int guc_set(PGconn *conn, const char *parameter, const char *op,
|
|||||||
const char *value);
|
const char *value);
|
||||||
int guc_set_typed(PGconn *conn, const char *parameter, const char *op,
|
int guc_set_typed(PGconn *conn, const char *parameter, const char *op,
|
||||||
const char *value, const char *datatype);
|
const char *value, const char *datatype);
|
||||||
|
bool get_conninfo_value(const char *conninfo, const char *keyword, char *output);
|
||||||
PGconn *get_upstream_connection(PGconn *standby_conn, char *cluster,
|
PGconn *get_upstream_connection(PGconn *standby_conn, char *cluster,
|
||||||
int node_id,
|
int node_id,
|
||||||
int *upstream_node_id_ptr,
|
int *upstream_node_id_ptr,
|
||||||
@@ -98,18 +119,25 @@ int wait_connection_availability(PGconn *conn, long long timeout);
|
|||||||
bool cancel_query(PGconn *conn, int timeout);
|
bool cancel_query(PGconn *conn, int timeout);
|
||||||
char *get_repmgr_schema(void);
|
char *get_repmgr_schema(void);
|
||||||
char *get_repmgr_schema_quoted(PGconn *conn);
|
char *get_repmgr_schema_quoted(PGconn *conn);
|
||||||
bool create_replication_slot(PGconn *conn, char *slot_name);
|
bool create_replication_slot(PGconn *conn, char *slot_name, int server_version_num, PQExpBufferData *error_msg);
|
||||||
|
int get_slot_record(PGconn *conn, char *slot_name, t_replication_slot *record);
|
||||||
bool drop_replication_slot(PGconn *conn, char *slot_name);
|
bool drop_replication_slot(PGconn *conn, char *slot_name);
|
||||||
|
bool start_backup(PGconn *conn, char *first_wal_segment, bool fast_checkpoint, int server_version_num);
|
||||||
bool start_backup(PGconn *conn, char *first_wal_segment, bool fast_checkpoint);
|
bool stop_backup(PGconn *conn, char *last_wal_segment, int server_version_num);
|
||||||
bool stop_backup(PGconn *conn, char *last_wal_segment);
|
bool set_config(PGconn *conn, const char *config_param, const char *config_value);
|
||||||
bool set_config_bool(PGconn *conn, const char *config_param, bool state);
|
bool set_config_bool(PGconn *conn, const char *config_param, bool state);
|
||||||
bool copy_configuration(PGconn *masterconn, PGconn *witnessconn, char *cluster_name);
|
bool witness_copy_node_records(PGconn *masterconn, PGconn *witnessconn, char *cluster_name);
|
||||||
bool create_node_record(PGconn *conn, char *action, int node, char *type, int upstream_node, char *cluster_name, char *node_name, char *conninfo, int priority, char *slot_name);
|
bool create_node_record(PGconn *conn, char *action, int node, char *type, int upstream_node, char *cluster_name, char *node_name, char *conninfo, int priority, char *slot_name, bool active);
|
||||||
bool delete_node_record(PGconn *conn, int node, char *action);
|
bool delete_node_record(PGconn *conn, int node, char *action);
|
||||||
bool create_event_record(PGconn *conn, t_configuration_options *options, int node_id, char *event, bool successful, char *details);
|
int get_node_record(PGconn *conn, char *cluster, int node_id, t_node_info *node_info);
|
||||||
|
int get_node_record_by_name(PGconn *conn, char *cluster, const char *node_name, t_node_info *node_info);
|
||||||
|
bool update_node_record(PGconn *conn, char *action, int node, char *type, int upstream_node, char *cluster_name, char *node_name, char *conninfo, int priority, char *slot_name, bool active);
|
||||||
bool update_node_record_status(PGconn *conn, char *cluster_name, int this_node_id, char *type, int upstream_node_id, bool active);
|
bool update_node_record_status(PGconn *conn, char *cluster_name, int this_node_id, char *type, int upstream_node_id, bool active);
|
||||||
bool update_node_record_set_upstream(PGconn *conn, char *cluster_name, int this_node_id, int new_upstream_node_id);
|
bool update_node_record_set_upstream(PGconn *conn, char *cluster_name, int this_node_id, int new_upstream_node_id);
|
||||||
PGresult * get_node_record(PGconn *conn, char *cluster, int node_id);
|
bool create_event_record(PGconn *conn, t_configuration_options *options, int node_id, char *event, bool successful, char *details);
|
||||||
|
|
||||||
|
int get_node_replication_state(PGconn *conn, char *node_name, char *output);
|
||||||
|
t_server_type parse_node_type(const char *type);
|
||||||
|
int get_data_checksum_version(const char *data_directory);
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
|||||||
6
debian/DEBIAN/control
vendored
6
debian/DEBIAN/control
vendored
@@ -1,9 +1,9 @@
|
|||||||
Package: repmgr-auto
|
Package: repmgr-auto
|
||||||
Version: 2.0beta2
|
Version: 3.2dev
|
||||||
Section: database
|
Section: database
|
||||||
Priority: optional
|
Priority: optional
|
||||||
Architecture: all
|
Architecture: all
|
||||||
Depends: rsync, postgresql-9.0 | postgresql-9.1 | postgresql-9.2 | postgresql-9.3 | postgresql-9.4
|
Depends: rsync, postgresql-9.3 | postgresql-9.4 | postgresql-9.5
|
||||||
Maintainer: Jaime Casanova <jaime@2ndQuadrant.com>
|
Maintainer: Self built package <user@localhost>
|
||||||
Description: PostgreSQL replication setup, management and monitoring
|
Description: PostgreSQL replication setup, management and monitoring
|
||||||
has two main executables
|
has two main executables
|
||||||
|
|||||||
194
dirmod.c
Normal file
194
dirmod.c
Normal file
@@ -0,0 +1,194 @@
|
|||||||
|
/*
|
||||||
|
*
|
||||||
|
* dirmod.c
|
||||||
|
* directory handling functions
|
||||||
|
*
|
||||||
|
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
|
*
|
||||||
|
* Portions Copyright (c) 1996-2013, PostgreSQL Global Development Group
|
||||||
|
* Portions Copyright (c) 1994, Regents of the University of California
|
||||||
|
*
|
||||||
|
* This program is free software: you can redistribute it and/or modify
|
||||||
|
* it under the terms of the GNU General Public License as published by
|
||||||
|
* the Free Software Foundation, either version 3 of the License, or
|
||||||
|
* (at your option) any later version.
|
||||||
|
*
|
||||||
|
* This program is distributed in the hope that it will be useful,
|
||||||
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
* GNU General Public License for more details.
|
||||||
|
*
|
||||||
|
* You should have received a copy of the GNU General Public License
|
||||||
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||||
|
*
|
||||||
|
*/
|
||||||
|
|
||||||
|
#include "postgres_fe.h"
|
||||||
|
|
||||||
|
/* Don't modify declarations in system headers */
|
||||||
|
|
||||||
|
#include <unistd.h>
|
||||||
|
#include <dirent.h>
|
||||||
|
#include <sys/stat.h>
|
||||||
|
|
||||||
|
/*
|
||||||
|
* pgfnames
|
||||||
|
*
|
||||||
|
* return a list of the names of objects in the argument directory. Caller
|
||||||
|
* must call pgfnames_cleanup later to free the memory allocated by this
|
||||||
|
* function.
|
||||||
|
*/
|
||||||
|
char **
|
||||||
|
pgfnames(const char *path)
|
||||||
|
{
|
||||||
|
DIR *dir;
|
||||||
|
struct dirent *file;
|
||||||
|
char **filenames;
|
||||||
|
int numnames = 0;
|
||||||
|
int fnsize = 200; /* enough for many small dbs */
|
||||||
|
|
||||||
|
dir = opendir(path);
|
||||||
|
if (dir == NULL)
|
||||||
|
{
|
||||||
|
return NULL;
|
||||||
|
}
|
||||||
|
|
||||||
|
filenames = (char **) palloc(fnsize * sizeof(char *));
|
||||||
|
|
||||||
|
while (errno = 0, (file = readdir(dir)) != NULL)
|
||||||
|
{
|
||||||
|
if (strcmp(file->d_name, ".") != 0 && strcmp(file->d_name, "..") != 0)
|
||||||
|
{
|
||||||
|
if (numnames + 1 >= fnsize)
|
||||||
|
{
|
||||||
|
fnsize *= 2;
|
||||||
|
filenames = (char **) repalloc(filenames,
|
||||||
|
fnsize * sizeof(char *));
|
||||||
|
}
|
||||||
|
filenames[numnames++] = pstrdup(file->d_name);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
if (errno)
|
||||||
|
{
|
||||||
|
fprintf(stderr, _("could not read directory \"%s\": %s\n"),
|
||||||
|
path, strerror(errno));
|
||||||
|
}
|
||||||
|
|
||||||
|
filenames[numnames] = NULL;
|
||||||
|
|
||||||
|
if (closedir(dir))
|
||||||
|
{
|
||||||
|
fprintf(stderr, _("could not close directory \"%s\": %s\n"),
|
||||||
|
path, strerror(errno));
|
||||||
|
}
|
||||||
|
|
||||||
|
return filenames;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
/*
|
||||||
|
* pgfnames_cleanup
|
||||||
|
*
|
||||||
|
* deallocate memory used for filenames
|
||||||
|
*/
|
||||||
|
void
|
||||||
|
pgfnames_cleanup(char **filenames)
|
||||||
|
{
|
||||||
|
char **fn;
|
||||||
|
|
||||||
|
for (fn = filenames; *fn; fn++)
|
||||||
|
pfree(*fn);
|
||||||
|
|
||||||
|
pfree(filenames);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
/*
|
||||||
|
* rmtree
|
||||||
|
*
|
||||||
|
* Delete a directory tree recursively.
|
||||||
|
* Assumes path points to a valid directory.
|
||||||
|
* Deletes everything under path.
|
||||||
|
* If rmtopdir is true deletes the directory too.
|
||||||
|
* Returns true if successful, false if there was any problem.
|
||||||
|
* (The details of the problem are reported already, so caller
|
||||||
|
* doesn't really have to say anything more, but most do.)
|
||||||
|
*/
|
||||||
|
bool
|
||||||
|
rmtree(const char *path, bool rmtopdir)
|
||||||
|
{
|
||||||
|
bool result = true;
|
||||||
|
char pathbuf[MAXPGPATH];
|
||||||
|
char **filenames;
|
||||||
|
char **filename;
|
||||||
|
struct stat statbuf;
|
||||||
|
|
||||||
|
/*
|
||||||
|
* we copy all the names out of the directory before we start modifying
|
||||||
|
* it.
|
||||||
|
*/
|
||||||
|
filenames = pgfnames(path);
|
||||||
|
|
||||||
|
if (filenames == NULL)
|
||||||
|
return false;
|
||||||
|
|
||||||
|
/* now we have the names we can start removing things */
|
||||||
|
for (filename = filenames; *filename; filename++)
|
||||||
|
{
|
||||||
|
snprintf(pathbuf, MAXPGPATH, "%s/%s", path, *filename);
|
||||||
|
|
||||||
|
/*
|
||||||
|
* It's ok if the file is not there anymore; we were just about to
|
||||||
|
* delete it anyway.
|
||||||
|
*
|
||||||
|
* This is not an academic possibility. One scenario where this
|
||||||
|
* happens is when bgwriter has a pending unlink request for a file in
|
||||||
|
* a database that's being dropped. In dropdb(), we call
|
||||||
|
* ForgetDatabaseFsyncRequests() to flush out any such pending unlink
|
||||||
|
* requests, but because that's asynchronous, it's not guaranteed that
|
||||||
|
* the bgwriter receives the message in time.
|
||||||
|
*/
|
||||||
|
if (lstat(pathbuf, &statbuf) != 0)
|
||||||
|
{
|
||||||
|
if (errno != ENOENT)
|
||||||
|
{
|
||||||
|
result = false;
|
||||||
|
}
|
||||||
|
continue;
|
||||||
|
}
|
||||||
|
|
||||||
|
if (S_ISDIR(statbuf.st_mode))
|
||||||
|
{
|
||||||
|
/* call ourselves recursively for a directory */
|
||||||
|
if (!rmtree(pathbuf, true))
|
||||||
|
{
|
||||||
|
/* we already reported the error */
|
||||||
|
result = false;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
if (unlink(pathbuf) != 0)
|
||||||
|
{
|
||||||
|
if (errno != ENOENT)
|
||||||
|
{
|
||||||
|
result = false;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
if (rmtopdir)
|
||||||
|
{
|
||||||
|
if (rmdir(path) != 0)
|
||||||
|
{
|
||||||
|
result = false;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pgfnames_cleanup(filenames);
|
||||||
|
|
||||||
|
return result;
|
||||||
|
}
|
||||||
|
|
||||||
23
dirmod.h
Normal file
23
dirmod.h
Normal file
@@ -0,0 +1,23 @@
|
|||||||
|
/*
|
||||||
|
* dirmod.h
|
||||||
|
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
|
*
|
||||||
|
* This program is free software: you can redistribute it and/or modify
|
||||||
|
* it under the terms of the GNU General Public License as published by
|
||||||
|
* the Free Software Foundation, either version 3 of the License, or
|
||||||
|
* (at your option) any later version.
|
||||||
|
*
|
||||||
|
* This program is distributed in the hope that it will be useful,
|
||||||
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
* GNU General Public License for more details.
|
||||||
|
*
|
||||||
|
* You should have received a copy of the GNU General Public License
|
||||||
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||||
|
*
|
||||||
|
*/
|
||||||
|
|
||||||
|
#ifndef _DIRMOD_H_
|
||||||
|
#define _DIRMOD_H_
|
||||||
|
|
||||||
|
#endif
|
||||||
75
docs/repmgrd-failover-mechanism.md
Normal file
75
docs/repmgrd-failover-mechanism.md
Normal file
@@ -0,0 +1,75 @@
|
|||||||
|
repmgrd's failover algorithm
|
||||||
|
============================
|
||||||
|
|
||||||
|
When implementing automatic failover, there are two factors which are critical in
|
||||||
|
ensuring the desired result is achieved:
|
||||||
|
|
||||||
|
- has the master node genuinely failed?
|
||||||
|
- which is the best node to promote to the new master?
|
||||||
|
|
||||||
|
This document outlines repmgrd's decision-making process during automatic failover
|
||||||
|
for standbys directly connected to the master node.
|
||||||
|
|
||||||
|
|
||||||
|
Master node failure detection
|
||||||
|
-----------------------------
|
||||||
|
|
||||||
|
If a `repmgrd` instance running on a PostgreSQL standby node is unable to connect to
|
||||||
|
the master node, this doesn't necessarily mean that the master is down and a
|
||||||
|
failover is required. Factors such as network connectivity issues could mean that
|
||||||
|
even though the standby node is isolated, the replication cluster as a whole
|
||||||
|
is functioning correctly, and promoting the standby without further verification
|
||||||
|
could result in a "split-brain" situation.
|
||||||
|
|
||||||
|
In the event that `repmgrd` is unable to connect to the master node, it will attempt
|
||||||
|
to reconnect to the master server several times (as defined by the `reconnect_attempts`
|
||||||
|
parameter in `repmgr.conf`), with reconnection attempts occurring at the interval
|
||||||
|
specified by `reconnect_interval`. This happens to verify that the master is definitively
|
||||||
|
not accessible (e.g. that connection was not lost due to a brief network glitch).
|
||||||
|
|
||||||
|
Appropriate values for these settings will depend very much on the replication
|
||||||
|
cluster environment. There will necessarily be a trade-off between the time it
|
||||||
|
takes to assume the master is not reachable, and the reliability of that conclusion.
|
||||||
|
A standby in a different physical location to the master will probably need a longer
|
||||||
|
check interval to rule out possible network issues, whereas one located in the same
|
||||||
|
rack with a direct connection between servers could perform the check very quickly.
|
||||||
|
|
||||||
|
Note that it's possible the master comes back online after this point is reached,
|
||||||
|
but before a new master has been selected; in this case it will be noticed
|
||||||
|
during the selection of a new master and no actual failover will take place.
|
||||||
|
|
||||||
|
Promotion candidate selection
|
||||||
|
-----------------------------
|
||||||
|
|
||||||
|
Once `repmgrd` has decided the master is definitively unreachable, the following checks
|
||||||
|
will be carried out:
|
||||||
|
|
||||||
|
* attempts to connect to all other nodes in the cluster (including the witness
|
||||||
|
node, if defined) to establish the state of the cluster, including their
|
||||||
|
current LSN
|
||||||
|
|
||||||
|
* If less than half of the nodes are visible (from the viewpoint
|
||||||
|
of this node), `repmgrd` will not take any further action. This is to ensure that
|
||||||
|
e.g. if a replication cluster is spread over multiple data centres, a split-brain
|
||||||
|
situation does not occur if there is a network failure between data centres. Note
|
||||||
|
that if nodes are split evenly between data centres, a witness server can be
|
||||||
|
used to establish the "majority" data centre.
|
||||||
|
|
||||||
|
* `repmgrd` polls all visible servers and waits for each node to return a valid LSN;
|
||||||
|
it updates the LSN previously stored for this node if it has increased since
|
||||||
|
the initial check
|
||||||
|
|
||||||
|
* once all LSNs have been retrieved, `repmgrd` will check for the highest LSN; if
|
||||||
|
its own node has the highest LSN, it will attempt to promote itself (using the
|
||||||
|
command defined in `promote_command` in `repmgr.conf`). Note that if using
|
||||||
|
`repmgr standby promote` as the promotion command, and the original master becomes available
|
||||||
|
before the promotion takes effect, `repmgr` will return an error and no promotion
|
||||||
|
will take place, and `repmgrd` will resume monitoring as usual.
|
||||||
|
|
||||||
|
* if the node is not the promotion candidate, `repmgrd` will execute the
|
||||||
|
`follow_command` defined in `repmgr.conf`. If using `repmgr standby follow` here,
|
||||||
|
`repmgr` will attempt to detect the new master node and attach to that.
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
152
docs/repmgrd-node-fencing.md
Normal file
152
docs/repmgrd-node-fencing.md
Normal file
@@ -0,0 +1,152 @@
|
|||||||
|
Fencing a failed master node with repmgrd and pgbouncer
|
||||||
|
=======================================================
|
||||||
|
|
||||||
|
With automatic failover, it's essential to ensure that a failed master
|
||||||
|
remains inaccessible to your application, even if it comes back online
|
||||||
|
again, to avoid a split-brain situation.
|
||||||
|
|
||||||
|
By using `pgbouncer` together with `repmgrd`, it's possible to combine
|
||||||
|
automatic failover with a process to isolate the failed master from
|
||||||
|
your application and ensure that all connections which should go to
|
||||||
|
the master are directed there smoothly without having to reconfigure
|
||||||
|
your application. (Note that as a connection pooler, `pgbouncer` can
|
||||||
|
benefit your application in other ways, but those are beyond the scope
|
||||||
|
of this document).
|
||||||
|
|
||||||
|
* * *
|
||||||
|
|
||||||
|
> *WARNING*: automatic failover is tricky to get right. This document
|
||||||
|
> demonstrates one possible implementation method; however, you should
|
||||||
|
> carefully configure and test any setup to suit the needs of your own
|
||||||
|
> replication cluster/application.
|
||||||
|
|
||||||
|
* * *
|
||||||
|
|
||||||
|
In a failover situation, `repmgrd` promotes a standby to master by executing
|
||||||
|
the command defined in `promote_command`. Normally this would be something like:
|
||||||
|
|
||||||
|
repmgr standby promote -f /etc/repmgr.conf
|
||||||
|
|
||||||
|
By wrapping this in a custom script which adjusts the `pgbouncer` configuration
|
||||||
|
on all nodes, it's possible to fence the failed master and redirect write
|
||||||
|
connections to the new master.
|
||||||
|
|
||||||
|
The script consists of three sections:
|
||||||
|
|
||||||
|
* commands to pause `pgbouncer` on all nodes
|
||||||
|
* the promotion command itself
|
||||||
|
* commands to reconfigure and restart `pgbouncer` on all nodes
|
||||||
|
|
||||||
|
Note that it requires password-less SSH access between all nodes to be able to
|
||||||
|
update the `pgbouncer` configuration files.
|
||||||
|
|
||||||
|
For the purposes of this demonstration, we'll assume there are 3 nodes (master
|
||||||
|
and two standbys), with `pgbouncer` listening on port 6432 handling connections
|
||||||
|
to a database called `appdb`. The `postgres` system user must have write
|
||||||
|
access to the `pgbouncer` configuration files on all nodes. We'll assume
|
||||||
|
there's a main `pgbouncer` configuration file, `/etc/pgbouncer.ini`, which uses
|
||||||
|
the `%include` directive (available from PgBouncer 1.6) to include a separate
|
||||||
|
configuration file, `/etc/pgbouncer.database.ini`, which will be modified by
|
||||||
|
`repmgr`.
|
||||||
|
|
||||||
|
`/etc/pgbouncer.ini` should look something like this:
|
||||||
|
|
||||||
|
[pgbouncer]
|
||||||
|
|
||||||
|
logfile = /var/log/pgbouncer/pgbouncer.log
|
||||||
|
pidfile = /var/run/pgbouncer/pgbouncer.pid
|
||||||
|
|
||||||
|
listen_addr = *
|
||||||
|
listen_port = 6432
|
||||||
|
unix_socket_dir = /tmp
|
||||||
|
|
||||||
|
auth_type = trust
|
||||||
|
auth_file = /etc/pgbouncer.auth
|
||||||
|
|
||||||
|
admin_users = postgres
|
||||||
|
stats_users = postgres
|
||||||
|
|
||||||
|
pool_mode = transaction
|
||||||
|
|
||||||
|
max_client_conn = 100
|
||||||
|
default_pool_size = 20
|
||||||
|
min_pool_size = 5
|
||||||
|
reserve_pool_size = 5
|
||||||
|
reserve_pool_timeout = 3
|
||||||
|
|
||||||
|
log_connections = 1
|
||||||
|
log_disconnections = 1
|
||||||
|
log_pooler_errors = 1
|
||||||
|
|
||||||
|
%include /etc/pgbouncer.database.ini
|
||||||
|
|
||||||
|
The actual script is as follows; adjust the configurable items as appropriate:
|
||||||
|
|
||||||
|
`/var/lib/postgres/repmgr/promote.sh`
|
||||||
|
|
||||||
|
|
||||||
|
#!/usr/bin/env bash
|
||||||
|
set -u
|
||||||
|
set -e
|
||||||
|
|
||||||
|
# Configurable items
|
||||||
|
PGBOUNCER_HOSTS="node1 node2 node3"
|
||||||
|
PGBOUNCER_DATABASE_INI="/etc/pgbouncer.database.ini"
|
||||||
|
PGBOUNCER_DATABASE="appdb"
|
||||||
|
PGBOUNCER_PORT=6432
|
||||||
|
|
||||||
|
REPMGR_DB="repmgr"
|
||||||
|
REPMGR_USER="repmgr"
|
||||||
|
REPMGR_SCHEMA="repmgr_test"
|
||||||
|
|
||||||
|
# 1. Pause running pgbouncer instances
|
||||||
|
for HOST in $PGBOUNCER_HOSTS
|
||||||
|
do
|
||||||
|
psql -t -c "pause" -h $HOST -p $PGBOUNCER_PORT -U postgres pgbouncer
|
||||||
|
done
|
||||||
|
|
||||||
|
# 2. Promote this node from standby to master
|
||||||
|
|
||||||
|
repmgr standby promote -f /etc/repmgr.conf
|
||||||
|
|
||||||
|
# 3. Reconfigure pgbouncer instances
|
||||||
|
|
||||||
|
PGBOUNCER_DATABASE_INI_NEW="/tmp/pgbouncer.database.ini"
|
||||||
|
|
||||||
|
for HOST in $PGBOUNCER_HOSTS
|
||||||
|
do
|
||||||
|
# Recreate the pgbouncer config file
|
||||||
|
echo -e "[databases]\n" > $PGBOUNCER_DATABASE_INI_NEW
|
||||||
|
|
||||||
|
psql -d $REPMGR_DB -U $REPMGR_USER -t -A \
|
||||||
|
-c "SELECT '${PGBOUNCER_DATABASE}-rw= ' || conninfo || ' application_name=pgbouncer_${HOST}' \
|
||||||
|
FROM ${REPMGR_SCHEMA}.repl_nodes \
|
||||||
|
WHERE active = TRUE AND type='master'" >> $PGBOUNCER_DATABASE_INI_NEW
|
||||||
|
|
||||||
|
psql -d $REPMGR_DB -U $REPMGR_USER -t -A \
|
||||||
|
-c "SELECT '${PGBOUNCER_DATABASE}-ro= ' || conninfo || ' application_name=pgbouncer_${HOST}' \
|
||||||
|
FROM $REPMGR_SCHEMA.repl_nodes \
|
||||||
|
WHERE node_name='${HOST}'" >> $PGBOUNCER_DATABASE_INI_NEW
|
||||||
|
|
||||||
|
rsync $PGBOUNCER_DATABASE_INI_NEW $HOST:$PGBOUNCER_DATABASE_INI
|
||||||
|
|
||||||
|
psql -tc "reload" -h $HOST -p $PGBOUNCER_PORT -U postgres pgbouncer
|
||||||
|
psql -tc "resume" -h $HOST -p $PGBOUNCER_PORT -U postgres pgbouncer
|
||||||
|
|
||||||
|
done
|
||||||
|
|
||||||
|
# Clean up generated file
|
||||||
|
rm $PGBOUNCER_DATABASE_INI_NEW
|
||||||
|
|
||||||
|
echo "Reconfiguration of pgbouncer complete"
|
||||||
|
|
||||||
|
Script and template file should be installed on each node where
|
||||||
|
`repmgrd` is running.
|
||||||
|
|
||||||
|
Finally, set `promote_command` in `repmgr.conf` on each node to
|
||||||
|
point to the custom promote script:
|
||||||
|
|
||||||
|
promote_command=/var/lib/postgres/repmgr/promote.sh
|
||||||
|
|
||||||
|
and reload/restart any running `repmgrd` instances for the changes to take
|
||||||
|
effect.
|
||||||
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* errcode.h
|
* errcode.h
|
||||||
* Copyright (C) 2ndQuadrant, 2010-2015
|
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -29,7 +29,6 @@
|
|||||||
#define ERR_DB_CON 6
|
#define ERR_DB_CON 6
|
||||||
#define ERR_DB_QUERY 7
|
#define ERR_DB_QUERY 7
|
||||||
#define ERR_PROMOTED 8
|
#define ERR_PROMOTED 8
|
||||||
#define ERR_BAD_PASSWORD 9
|
|
||||||
#define ERR_STR_OVERFLOW 10
|
#define ERR_STR_OVERFLOW 10
|
||||||
#define ERR_FAILOVER_FAIL 11
|
#define ERR_FAILOVER_FAIL 11
|
||||||
#define ERR_BAD_SSH 12
|
#define ERR_BAD_SSH 12
|
||||||
@@ -37,5 +36,10 @@
|
|||||||
#define ERR_BAD_BASEBACKUP 14
|
#define ERR_BAD_BASEBACKUP 14
|
||||||
#define ERR_INTERNAL 15
|
#define ERR_INTERNAL 15
|
||||||
#define ERR_MONITORING_FAIL 16
|
#define ERR_MONITORING_FAIL 16
|
||||||
|
#define ERR_BAD_BACKUP_LABEL 17
|
||||||
|
#define ERR_SWITCHOVER_FAIL 18
|
||||||
|
#define ERR_BARMAN 19
|
||||||
|
#define ERR_REGISTRATION_SYNC 20
|
||||||
|
|
||||||
|
|
||||||
#endif /* _ERRCODE_H_ */
|
#endif /* _ERRCODE_H_ */
|
||||||
|
|||||||
18
expected/repmgr_funcs.out
Normal file
18
expected/repmgr_funcs.out
Normal file
@@ -0,0 +1,18 @@
|
|||||||
|
/*
|
||||||
|
* repmgr_function.sql
|
||||||
|
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
|
*
|
||||||
|
*/
|
||||||
|
-- SET SEARCH_PATH TO 'repmgr';
|
||||||
|
CREATE FUNCTION repmgr_update_standby_location(text) RETURNS boolean
|
||||||
|
AS '$libdir/repmgr_funcs', 'repmgr_update_standby_location'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
CREATE FUNCTION repmgr_get_last_standby_location() RETURNS text
|
||||||
|
AS '$libdir/repmgr_funcs', 'repmgr_get_last_standby_location'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
CREATE FUNCTION repmgr_update_last_updated() RETURNS TIMESTAMP WITH TIME ZONE
|
||||||
|
AS '$libdir/repmgr_funcs', 'repmgr_update_last_updated'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
|
CREATE FUNCTION repmgr_get_last_updated() RETURNS TIMESTAMP WITH TIME ZONE
|
||||||
|
AS '$libdir/repmgr_funcs', 'repmgr_get_last_updated'
|
||||||
|
LANGUAGE C STRICT;
|
||||||
24
expected/repmgr_test.out
Normal file
24
expected/repmgr_test.out
Normal file
@@ -0,0 +1,24 @@
|
|||||||
|
select * from repmgr_update_standby_location('');
|
||||||
|
repmgr_update_standby_location
|
||||||
|
--------------------------------
|
||||||
|
f
|
||||||
|
(1 row)
|
||||||
|
|
||||||
|
select * from repmgr_get_last_standby_location();
|
||||||
|
repmgr_get_last_standby_location
|
||||||
|
----------------------------------
|
||||||
|
|
||||||
|
(1 row)
|
||||||
|
|
||||||
|
select * from repmgr_update_last_updated();
|
||||||
|
repmgr_update_last_updated
|
||||||
|
----------------------------
|
||||||
|
|
||||||
|
(1 row)
|
||||||
|
|
||||||
|
select * from repmgr_get_last_updated();
|
||||||
|
repmgr_get_last_updated
|
||||||
|
-------------------------
|
||||||
|
|
||||||
|
(1 row)
|
||||||
|
|
||||||
67
log.c
67
log.c
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* log.c - Logging methods
|
* log.c - Logging methods
|
||||||
* Copyright (C) 2ndQuadrant, 2010-2015
|
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
*
|
*
|
||||||
* This module is a set of methods for logging (currently only syslog)
|
* This module is a set of methods for logging (currently only syslog)
|
||||||
*
|
*
|
||||||
@@ -40,15 +40,21 @@
|
|||||||
/* #define REPMGR_DEBUG */
|
/* #define REPMGR_DEBUG */
|
||||||
|
|
||||||
static int detect_log_facility(const char *facility);
|
static int detect_log_facility(const char *facility);
|
||||||
static void _stderr_log_with_level(const char *level_name, int level, const char *fmt, va_list ap);
|
static void _stderr_log_with_level(const char *level_name, int level, const char *fmt, va_list ap)
|
||||||
|
__attribute__((format(PG_PRINTF_ATTRIBUTE, 3, 0)));
|
||||||
|
|
||||||
int log_type = REPMGR_STDERR;
|
int log_type = REPMGR_STDERR;
|
||||||
int log_level = LOG_NOTICE;
|
int log_level = LOG_NOTICE;
|
||||||
int last_log_level = LOG_NOTICE;
|
int last_log_level = LOG_NOTICE;
|
||||||
int verbose_logging = false;
|
int verbose_logging = false;
|
||||||
int terse_logging = false;
|
int terse_logging = false;
|
||||||
|
/*
|
||||||
|
* Global variable to be set by the main application to ensure any log output
|
||||||
|
* emitted before logger_init is called, is output in the correct format
|
||||||
|
*/
|
||||||
|
int logger_output_mode = OM_DAEMON;
|
||||||
|
|
||||||
void
|
extern void
|
||||||
stderr_log_with_level(const char *level_name, int level, const char *fmt, ...)
|
stderr_log_with_level(const char *level_name, int level, const char *fmt, ...)
|
||||||
{
|
{
|
||||||
va_list arglist;
|
va_list arglist;
|
||||||
@@ -61,22 +67,31 @@ stderr_log_with_level(const char *level_name, int level, const char *fmt, ...)
|
|||||||
static void
|
static void
|
||||||
_stderr_log_with_level(const char *level_name, int level, const char *fmt, va_list ap)
|
_stderr_log_with_level(const char *level_name, int level, const char *fmt, va_list ap)
|
||||||
{
|
{
|
||||||
time_t t;
|
char buf[100];
|
||||||
struct tm *tm;
|
|
||||||
char buff[100];
|
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* Store the requested level so that if there's a subsequent
|
* Store the requested level so that if there's a subsequent
|
||||||
* log_hint(), we can suppress that if appropriate.
|
* log_hint() or log_detail(), we can suppress that if appropriate.
|
||||||
*/
|
*/
|
||||||
last_log_level = level;
|
last_log_level = level;
|
||||||
|
|
||||||
if (log_level >= level)
|
if (log_level >= level)
|
||||||
{
|
{
|
||||||
time(&t);
|
|
||||||
tm = localtime(&t);
|
/* Format log line prefix with timestamp if in daemon mode */
|
||||||
strftime(buff, 100, "[%Y-%m-%d %H:%M:%S]", tm);
|
if (logger_output_mode == OM_DAEMON)
|
||||||
fprintf(stderr, "%s [%s] ", buff, level_name);
|
{
|
||||||
|
time_t t;
|
||||||
|
struct tm *tm;
|
||||||
|
time(&t);
|
||||||
|
tm = localtime(&t);
|
||||||
|
strftime(buf, 100, "[%Y-%m-%d %H:%M:%S]", tm);
|
||||||
|
fprintf(stderr, "%s [%s] ", buf, level_name);
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
fprintf(stderr, "%s: ", level_name);
|
||||||
|
}
|
||||||
|
|
||||||
vfprintf(stderr, fmt, ap);
|
vfprintf(stderr, fmt, ap);
|
||||||
|
|
||||||
@@ -98,6 +113,20 @@ log_hint(const char *fmt, ...)
|
|||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
void
|
||||||
|
log_detail(const char *fmt, ...)
|
||||||
|
{
|
||||||
|
va_list ap;
|
||||||
|
|
||||||
|
if (terse_logging == false)
|
||||||
|
{
|
||||||
|
va_start(ap, fmt);
|
||||||
|
_stderr_log_with_level("DETAIL", last_log_level, fmt, ap);
|
||||||
|
va_end(ap);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
void
|
void
|
||||||
log_verbose(int level, const char *fmt, ...)
|
log_verbose(int level, const char *fmt, ...)
|
||||||
{
|
{
|
||||||
@@ -141,7 +170,7 @@ log_verbose(int level, const char *fmt, ...)
|
|||||||
|
|
||||||
|
|
||||||
bool
|
bool
|
||||||
logger_init(t_configuration_options * opts, const char *ident)
|
logger_init(t_configuration_options *opts, const char *ident)
|
||||||
{
|
{
|
||||||
char *level = opts->loglevel;
|
char *level = opts->loglevel;
|
||||||
char *facility = opts->logfacility;
|
char *facility = opts->logfacility;
|
||||||
@@ -175,6 +204,13 @@ logger_init(t_configuration_options * opts, const char *ident)
|
|||||||
stderr_log_warning(_("Invalid log level \"%s\" (available values: DEBUG, INFO, NOTICE, WARNING, ERR, ALERT, CRIT or EMERG)\n"), level);
|
stderr_log_warning(_("Invalid log level \"%s\" (available values: DEBUG, INFO, NOTICE, WARNING, ERR, ALERT, CRIT or EMERG)\n"), level);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/*
|
||||||
|
* STDERR only logging requested - finish here without setting up any further
|
||||||
|
* logging facility.
|
||||||
|
*/
|
||||||
|
if (logger_output_mode == OM_COMMAND_LINE)
|
||||||
|
return true;
|
||||||
|
|
||||||
if (facility && *facility)
|
if (facility && *facility)
|
||||||
{
|
{
|
||||||
|
|
||||||
@@ -235,9 +271,10 @@ logger_init(t_configuration_options * opts, const char *ident)
|
|||||||
stderr_log_notice(_("Redirecting logging output to '%s'\n"), opts->logfile);
|
stderr_log_notice(_("Redirecting logging output to '%s'\n"), opts->logfile);
|
||||||
fd = freopen(opts->logfile, "a", stderr);
|
fd = freopen(opts->logfile, "a", stderr);
|
||||||
|
|
||||||
/* It's possible freopen() may still fail due to e.g. a race condition;
|
/*
|
||||||
as it's not feasible to restore stderr after a failed freopen(),
|
* It's possible freopen() may still fail due to e.g. a race condition;
|
||||||
we'll write to stdout as a last resort.
|
* as it's not feasible to restore stderr after a failed freopen(),
|
||||||
|
* we'll write to stdout as a last resort.
|
||||||
*/
|
*/
|
||||||
if (fd == NULL)
|
if (fd == NULL)
|
||||||
{
|
{
|
||||||
|
|||||||
20
log.h
20
log.h
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* log.h
|
* log.h
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2015
|
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -25,7 +25,10 @@
|
|||||||
#define REPMGR_SYSLOG 1
|
#define REPMGR_SYSLOG 1
|
||||||
#define REPMGR_STDERR 2
|
#define REPMGR_STDERR 2
|
||||||
|
|
||||||
void
|
#define OM_COMMAND_LINE 1
|
||||||
|
#define OM_DAEMON 2
|
||||||
|
|
||||||
|
extern void
|
||||||
stderr_log_with_level(const char *level_name, int level, const char *fmt,...)
|
stderr_log_with_level(const char *level_name, int level, const char *fmt,...)
|
||||||
__attribute__((format(PG_PRINTF_ATTRIBUTE, 3, 4)));
|
__attribute__((format(PG_PRINTF_ATTRIBUTE, 3, 4)));
|
||||||
|
|
||||||
@@ -123,10 +126,17 @@ bool logger_shutdown(void);
|
|||||||
void logger_set_verbose(void);
|
void logger_set_verbose(void);
|
||||||
void logger_set_terse(void);
|
void logger_set_terse(void);
|
||||||
|
|
||||||
void log_hint(const char *fmt, ...);
|
void log_detail(const char *fmt, ...)
|
||||||
void log_verbose(int level, const char *fmt, ...);
|
__attribute__((format(PG_PRINTF_ATTRIBUTE, 1, 2)));
|
||||||
|
void log_hint(const char *fmt, ...)
|
||||||
|
__attribute__((format(PG_PRINTF_ATTRIBUTE, 1, 2)));
|
||||||
|
void log_verbose(int level, const char *fmt, ...)
|
||||||
|
__attribute__((format(PG_PRINTF_ATTRIBUTE, 2, 3)));
|
||||||
|
|
||||||
extern int log_type;
|
extern int log_type;
|
||||||
extern int log_level;
|
extern int log_level;
|
||||||
|
extern int verbose_logging;
|
||||||
|
extern int terse_logging;
|
||||||
|
extern int logger_output_mode;
|
||||||
|
|
||||||
#endif
|
#endif /* _REPMGR_LOG_H_ */
|
||||||
|
|||||||
@@ -2,6 +2,10 @@
|
|||||||
# Replication Manager sample configuration file
|
# Replication Manager sample configuration file
|
||||||
###################################################
|
###################################################
|
||||||
|
|
||||||
|
# Some configuration items will be set with a default value; this
|
||||||
|
# is noted for each item. Where no default value is shown, the
|
||||||
|
# parameter will be treated as empty or false.
|
||||||
|
|
||||||
# Required configuration items
|
# Required configuration items
|
||||||
# ============================
|
# ============================
|
||||||
#
|
#
|
||||||
@@ -11,21 +15,29 @@
|
|||||||
# schema (pattern: "repmgr_{cluster}"); while this name will be quoted
|
# schema (pattern: "repmgr_{cluster}"); while this name will be quoted
|
||||||
# to preserve case, we recommend using lower case and avoiding whitespace
|
# to preserve case, we recommend using lower case and avoiding whitespace
|
||||||
# to facilitate easier querying of the repmgr views and tables.
|
# to facilitate easier querying of the repmgr views and tables.
|
||||||
cluster=example_cluster
|
#cluster=example_cluster
|
||||||
|
|
||||||
# Node ID and name
|
# Node ID and name
|
||||||
# (Note: we recommend to avoid naming nodes after their initial
|
# (Note: we recommend to avoid naming nodes after their initial
|
||||||
# replication funcion, as this will cause confusion when e.g.
|
# replication function, as this will cause confusion when e.g.
|
||||||
# "standby2" is promoted to primary)
|
# "standby2" is promoted to primary)
|
||||||
node=2 # a unique integer
|
#node=2 # a unique integer
|
||||||
node_name=node2 # an arbitrary (but unique) string; we recommend using
|
#node_name=node2 # an arbitrary (but unique) string; we recommend using
|
||||||
# the server's hostname or another identifier unambiguously
|
# the server's hostname or another identifier unambiguously
|
||||||
# associated with the server to avoid confusion
|
# associated with the server to avoid confusion
|
||||||
|
|
||||||
# Database connection information as a conninfo string
|
# Database connection information as a conninfo string
|
||||||
# This must be accessible to all servers in the cluster; for details see:
|
# This must be accessible to all servers in the cluster; for details see:
|
||||||
# http://www.postgresql.org/docs/current/static/libpq-connect.html#LIBPQ-CONNSTRING
|
#
|
||||||
conninfo='host=192.168.204.104 dbname=repmgr_db user=repmgr_usr'
|
# https://www.postgresql.org/docs/current/static/libpq-connect.html#LIBPQ-CONNSTRING
|
||||||
|
#
|
||||||
|
#conninfo='host=192.168.204.104 dbname=repmgr user=repmgr'
|
||||||
|
#
|
||||||
|
# If repmgrd is in use, consider explicitly setting `connect_timeout` in the
|
||||||
|
# conninfo string to determine the length of time which elapses before
|
||||||
|
# a network connection attempt is abandoned; for details see:
|
||||||
|
#
|
||||||
|
# https://www.postgresql.org/docs/current/static/libpq-connect.html#LIBPQ-CONNECT-CONNECT-TIMEOUT
|
||||||
|
|
||||||
# Optional configuration items
|
# Optional configuration items
|
||||||
# ============================
|
# ============================
|
||||||
@@ -33,18 +45,17 @@ conninfo='host=192.168.204.104 dbname=repmgr_db user=repmgr_usr'
|
|||||||
# Replication settings
|
# Replication settings
|
||||||
# ---------------------
|
# ---------------------
|
||||||
|
|
||||||
# when using cascading replication and a standby is to be connected to an
|
# When using cascading replication, a standby can connect to another
|
||||||
# upstream standby, specify that node's ID with 'upstream_node'. The node
|
# upstream standby node which is specified by setting 'upstream_node'.
|
||||||
# must exist before the new standby can be registered. If a standby is
|
# In that case, the upstream node must exist before the new standby
|
||||||
# to connect directly to a primary node, this parameter is not required.
|
# can be registered. If 'upstream_node' is not set, then the standby
|
||||||
#
|
# will connect directly to the primary node.
|
||||||
# upstream_node=1
|
#upstream_node=1
|
||||||
|
|
||||||
# physical replication slots - PostgreSQL 9.4 and later only
|
# use physical replication slots - PostgreSQL 9.4 and later only
|
||||||
# (default: 0)
|
# (default: 0)
|
||||||
#
|
#use_replication_slots=0
|
||||||
# use_replication_slots=0
|
|
||||||
#
|
|
||||||
# NOTE: 'max_replication_slots' should be configured for at least the
|
# NOTE: 'max_replication_slots' should be configured for at least the
|
||||||
# number of standbys which will connect to the primary.
|
# number of standbys which will connect to the primary.
|
||||||
|
|
||||||
@@ -53,15 +64,21 @@ conninfo='host=192.168.204.104 dbname=repmgr_db user=repmgr_usr'
|
|||||||
|
|
||||||
# Log level: possible values are DEBUG, INFO, NOTICE, WARNING, ERR, ALERT, CRIT or EMERG
|
# Log level: possible values are DEBUG, INFO, NOTICE, WARNING, ERR, ALERT, CRIT or EMERG
|
||||||
# (default: NOTICE)
|
# (default: NOTICE)
|
||||||
loglevel=NOTICE
|
#loglevel=NOTICE
|
||||||
|
|
||||||
|
# Note that logging facility settings will only apply to `repmgrd` by default;
|
||||||
|
# `repmgr` will always write to STDERR unless the switch `--log-to-file` is
|
||||||
|
# supplied, in which case it will log to the same destination as `repmgrd`.
|
||||||
|
# This is mainly intended for those cases when `repmgr` is executed directly
|
||||||
|
# by `repmgrd`.
|
||||||
|
|
||||||
# Logging facility: possible values are STDERR or - for Syslog integration - one of LOCAL0, LOCAL1, ..., LOCAL7, USER
|
# Logging facility: possible values are STDERR or - for Syslog integration - one of LOCAL0, LOCAL1, ..., LOCAL7, USER
|
||||||
# (default: STDERR)
|
# (default: STDERR)
|
||||||
logfacility=STDERR
|
#logfacility=STDERR
|
||||||
|
|
||||||
# stderr can be redirected to an arbitrary file:
|
# stderr can be redirected to an arbitrary file:
|
||||||
#
|
#
|
||||||
# logfile='/var/log/repmgr.log'
|
#logfile='/var/log/repmgr/repmgr.log'
|
||||||
|
|
||||||
# event notifications can be passed to an arbitrary external program
|
# event notifications can be passed to an arbitrary external program
|
||||||
# together with the following parameters:
|
# together with the following parameters:
|
||||||
@@ -75,12 +92,12 @@ logfacility=STDERR
|
|||||||
# the values provided for "%t" and "%d" will probably contain spaces,
|
# the values provided for "%t" and "%d" will probably contain spaces,
|
||||||
# so should be quoted in the provided command configuration, e.g.:
|
# so should be quoted in the provided command configuration, e.g.:
|
||||||
#
|
#
|
||||||
# event_notification_command='/path/to/some/script %n %e %s "%t" "%d"'
|
#event_notification_command='/path/to/some/script %n %e %s "%t" "%d"'
|
||||||
|
|
||||||
# By default, all notifications will be passed; the notification types
|
# By default, all notifications will be passed; the notification types
|
||||||
# can be filtered to explicitly named ones:
|
# can be filtered to explicitly named ones:
|
||||||
#
|
#
|
||||||
# event_notifications=master_register,standby_register,witness_create
|
#event_notifications=master_register,standby_register,witness_create
|
||||||
|
|
||||||
|
|
||||||
# Environment/command settings
|
# Environment/command settings
|
||||||
@@ -88,18 +105,53 @@ logfacility=STDERR
|
|||||||
|
|
||||||
# path to PostgreSQL binary directory (location of pg_ctl, pg_basebackup etc.)
|
# path to PostgreSQL binary directory (location of pg_ctl, pg_basebackup etc.)
|
||||||
# (if not provided, defaults to system $PATH)
|
# (if not provided, defaults to system $PATH)
|
||||||
# pg_bindir=/usr/bin/
|
#pg_bindir=/usr/bin/
|
||||||
|
#
|
||||||
|
# Debian/Ubuntu users: you will probably need to set this to the directory
|
||||||
|
# where `pg_ctl` is located, e.g. /usr/lib/postgresql/9.5/bin/
|
||||||
|
|
||||||
|
# service control commands
|
||||||
|
#
|
||||||
|
# repmgr provides options to override the default pg_ctl commands
|
||||||
|
# used to stop, start, restart, reload and promote the PostgreSQL cluster
|
||||||
|
#
|
||||||
|
# NOTE: These commands must be runnable on remote nodes as well for switchover
|
||||||
|
# to function correctly.
|
||||||
|
#
|
||||||
|
# If you use sudo, the user repmgr runs as (usually 'postgres') must have
|
||||||
|
# passwordless sudo access to execute the command
|
||||||
|
#
|
||||||
|
# For example, to use systemd, you may use the following configuration:
|
||||||
|
#
|
||||||
|
# # this is required when running sudo over ssh without -t:
|
||||||
|
# Defaults:postgres !requiretty
|
||||||
|
# postgres ALL = NOPASSWD: /usr/bin/systemctl stop postgresql-9.5, \
|
||||||
|
# /usr/bin/systemctl start postgresql-9.5, \
|
||||||
|
# /usr/bin/systemctl restart postgresql-9.5
|
||||||
|
#
|
||||||
|
# service_start_command = systemctl start postgresql-9.5
|
||||||
|
# service_stop_command = systemctl stop postgresql-9.5
|
||||||
|
# service_restart_command = systemctl restart postgresql-9.5
|
||||||
|
# service_reload_command = pg_ctlcluster 9.5 main reload
|
||||||
|
# service_promote_command = pg_ctlcluster 9.5 main promote
|
||||||
|
|
||||||
# external command options
|
# external command options
|
||||||
|
|
||||||
# rsync_options=--archive --checksum --compress --progress --rsh="ssh -o \"StrictHostKeyChecking no\""
|
#rsync_options=--archive --checksum --compress --progress --rsh="ssh -o \"StrictHostKeyChecking no\""
|
||||||
# ssh_options=-o "StrictHostKeyChecking no"
|
#ssh_options=-o "StrictHostKeyChecking no"
|
||||||
|
|
||||||
# external command arguments
|
# external command arguments. Values shown are examples.
|
||||||
|
|
||||||
# pg_ctl_options='-s'
|
#pg_ctl_options='-s'
|
||||||
# pg_basebackup_options='--xlog-method=s'
|
#pg_basebackup_options='--label=repmgr_backup'
|
||||||
|
|
||||||
|
# This is the host name of the barman server, which is used for connecting via ssh
|
||||||
|
# to the barman server (passwordless ssh keys should be in place)
|
||||||
|
#barman_server='backup_server'
|
||||||
|
# If you are placing the barman.conf file in a non-standard path, or using
|
||||||
|
# a name other than barman.conf, use this parameter to specify the path and
|
||||||
|
# name of the barman configuration file.
|
||||||
|
#barman_config='/path/to/barman.conf'
|
||||||
|
|
||||||
# Standby clone settings
|
# Standby clone settings
|
||||||
# ----------------------
|
# ----------------------
|
||||||
@@ -110,35 +162,51 @@ logfacility=STDERR
|
|||||||
#
|
#
|
||||||
# tablespace_mapping=/path/to/original/tablespace=/path/to/new/tablespace
|
# tablespace_mapping=/path/to/original/tablespace=/path/to/new/tablespace
|
||||||
|
|
||||||
|
# You can specify a restore_command to be used in the recovery.conf that
|
||||||
|
# will be placed in the cloned standby
|
||||||
|
#
|
||||||
|
# restore_command = cp /path/to/archived/wals/%f %p
|
||||||
|
|
||||||
# Failover settings (repmgrd)
|
# Failover settings (repmgrd)
|
||||||
# ---------------------------
|
# ---------------------------
|
||||||
#
|
#
|
||||||
# These settings are only applied when repmgrd is running.
|
# These settings are only applied when repmgrd is running. Values shown
|
||||||
|
# are defaults.
|
||||||
# Number of seconds to wait for a response from the primary server before
|
|
||||||
# deciding it has failed
|
|
||||||
|
|
||||||
master_response_timeout=60
|
|
||||||
|
|
||||||
# Number of times to try and reconnect to the primary before starting
|
|
||||||
# the failover procedure
|
|
||||||
reconnect_attempts=6
|
|
||||||
reconnect_interval=10
|
|
||||||
|
|
||||||
# Autofailover options
|
|
||||||
failover=automatic # one of 'automatic', 'manual'
|
|
||||||
priority=100 # a value of zero or less prevents the node being promoted to primary
|
|
||||||
promote_command='repmgr standby promote -f /path/to/repmgr.conf'
|
|
||||||
follow_command='repmgr standby follow -f /path/to/repmgr.conf -W'
|
|
||||||
|
|
||||||
# monitoring interval in seconds; default is 2
|
# monitoring interval in seconds; default is 2
|
||||||
#
|
#monitor_interval_secs=2
|
||||||
# monitor_interval_secs=2
|
|
||||||
|
# Maximum number of seconds to wait for a response from the primary server
|
||||||
|
# before deciding it has failed.
|
||||||
|
#master_response_timeout=60
|
||||||
|
|
||||||
|
# Number of attempts at what interval (in seconds) to try and
|
||||||
|
# connect to a server to establish its status (e.g. master
|
||||||
|
# during failover)
|
||||||
|
#reconnect_attempts=6
|
||||||
|
#reconnect_interval=10
|
||||||
|
|
||||||
|
# Autofailover options
|
||||||
|
#failover=manual # one of 'automatic', 'manual' (default: manual)
|
||||||
|
# defines the action to take in the event of upstream failure
|
||||||
|
#
|
||||||
|
# 'automatic': repmgrd will automatically attempt to promote the
|
||||||
|
# node or follow the new upstream node
|
||||||
|
# 'manual': repmgrd will take no action and the node will require
|
||||||
|
# manual attention to reattach it to replication
|
||||||
|
|
||||||
|
#priority=100 # indicate a preferred priority for promoting nodes
|
||||||
|
# a value of zero or less prevents the node being promoted to primary
|
||||||
|
# (default: 100)
|
||||||
|
|
||||||
|
#promote_command='repmgr standby promote -f /path/to/repmgr.conf'
|
||||||
|
#follow_command='repmgr standby follow -f /path/to/repmgr.conf -W'
|
||||||
|
|
||||||
# change wait time for primary; before we bail out and exit when the primary
|
# change wait time for primary; before we bail out and exit when the primary
|
||||||
# disappears, we wait 'reconnect_attempts' * 'retry_promote_interval_secs'
|
# disappears, we wait 'reconnect_attempts' * 'retry_promote_interval_secs'
|
||||||
# seconds; by default this would be half an hour, as 'retry_promote_interval_secs'
|
# seconds; by default this would be half an hour, as 'retry_promote_interval_secs'
|
||||||
# default value is 300)
|
# default value is 300)
|
||||||
#
|
#retry_promote_interval_secs=300
|
||||||
# retry_promote_interval_secs=300
|
|
||||||
|
# Number of seconds after which the witness server resyncs the repl_nodes table
|
||||||
|
#witness_repl_nodes_sync_interval_secs=15
|
||||||
|
|||||||
210
repmgr.h
210
repmgr.h
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* repmgr.h
|
* repmgr.h
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2015
|
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -23,23 +23,21 @@
|
|||||||
#include <libpq-fe.h>
|
#include <libpq-fe.h>
|
||||||
#include <postgres_fe.h>
|
#include <postgres_fe.h>
|
||||||
#include <getopt_long.h>
|
#include <getopt_long.h>
|
||||||
|
#include "pqexpbuffer.h"
|
||||||
|
|
||||||
#include "strutil.h"
|
#include "strutil.h"
|
||||||
#include "dbutils.h"
|
#include "dbutils.h"
|
||||||
#include "errcode.h"
|
#include "errcode.h"
|
||||||
#include "config.h"
|
#include "config.h"
|
||||||
|
#include "dirmod.h"
|
||||||
|
|
||||||
#define MIN_SUPPORTED_VERSION "9.3"
|
#define MIN_SUPPORTED_VERSION "9.3"
|
||||||
#define MIN_SUPPORTED_VERSION_NUM 90300
|
#define MIN_SUPPORTED_VERSION_NUM 90300
|
||||||
|
|
||||||
#include "config.h"
|
|
||||||
#define MAXFILENAME 1024
|
|
||||||
#define ERRBUFF_SIZE 512
|
#define ERRBUFF_SIZE 512
|
||||||
|
|
||||||
#define DEFAULT_WAL_KEEP_SEGMENTS "5000"
|
#define DEFAULT_WAL_KEEP_SEGMENTS "0"
|
||||||
#define DEFAULT_DEST_DIR "."
|
#define DEFAULT_DEST_DIR "."
|
||||||
#define DEFAULT_MASTER_PORT "5432"
|
|
||||||
#define DEFAULT_DBNAME "postgres"
|
|
||||||
#define DEFAULT_REPMGR_SCHEMA_PREFIX "repmgr_"
|
#define DEFAULT_REPMGR_SCHEMA_PREFIX "repmgr_"
|
||||||
#define DEFAULT_PRIORITY 100
|
#define DEFAULT_PRIORITY 100
|
||||||
#define FAILOVER_NODES_MAX_CHECK 50
|
#define FAILOVER_NODES_MAX_CHECK 50
|
||||||
@@ -50,44 +48,200 @@
|
|||||||
#define NO_UPSTREAM_NODE -1
|
#define NO_UPSTREAM_NODE -1
|
||||||
#define UNKNOWN_NODE_ID -1
|
#define UNKNOWN_NODE_ID -1
|
||||||
|
|
||||||
|
/* command line options without short versions */
|
||||||
|
#define OPT_HELP 1
|
||||||
|
#define OPT_CHECK_UPSTREAM_CONFIG 2
|
||||||
|
#define OPT_RECOVERY_MIN_APPLY_DELAY 3
|
||||||
|
#define OPT_COPY_EXTERNAL_CONFIG_FILES 4
|
||||||
|
#define OPT_CONFIG_ARCHIVE_DIR 5
|
||||||
|
#define OPT_PG_REWIND 6
|
||||||
|
#define OPT_CSV 8
|
||||||
|
#define OPT_NODE 9
|
||||||
|
#define OPT_WITHOUT_BARMAN 10
|
||||||
|
#define OPT_NO_UPSTREAM_CONNECTION 11
|
||||||
|
#define OPT_REGISTER_WAIT 12
|
||||||
|
#define OPT_CLUSTER 13
|
||||||
|
#define OPT_LOG_TO_FILE 14
|
||||||
|
#define OPT_UPSTREAM_CONNINFO 15
|
||||||
|
#define OPT_NO_CONNINFO_PASSWORD 16
|
||||||
|
#define OPT_REPLICATION_USER 17
|
||||||
|
|
||||||
|
/* deprecated command line options */
|
||||||
|
#define OPT_INITDB_NO_PWPROMPT 998
|
||||||
|
#define OPT_IGNORE_EXTERNAL_CONFIG_FILES 999
|
||||||
|
|
||||||
|
/* values for --copy-external-config-files */
|
||||||
|
#define CONFIG_FILE_SAMEPATH 1
|
||||||
|
#define CONFIG_FILE_PGDATA 2
|
||||||
|
|
||||||
|
|
||||||
/* Run time options type */
|
/* Run time options type */
|
||||||
typedef struct
|
typedef struct
|
||||||
{
|
{
|
||||||
|
/* general repmgr options */
|
||||||
char dbname[MAXLEN];
|
char config_file[MAXPGPATH];
|
||||||
char host[MAXLEN];
|
|
||||||
char username[MAXLEN];
|
|
||||||
char dest_dir[MAXFILENAME];
|
|
||||||
char config_file[MAXFILENAME];
|
|
||||||
char remote_user[MAXLEN];
|
|
||||||
char superuser[MAXLEN];
|
|
||||||
char wal_keep_segments[MAXLEN];
|
|
||||||
bool verbose;
|
bool verbose;
|
||||||
bool terse;
|
bool terse;
|
||||||
bool force;
|
bool force;
|
||||||
bool wait_for_master;
|
char pg_bindir[MAXLEN]; /* overrides setting in repmgr.conf */
|
||||||
|
|
||||||
|
/* logging parameters */
|
||||||
|
char loglevel[MAXLEN]; /* overrides setting in repmgr.conf */
|
||||||
|
bool log_to_file;
|
||||||
|
|
||||||
|
/* connection parameters */
|
||||||
|
char dbname[MAXLEN];
|
||||||
|
char host[MAXLEN];
|
||||||
|
char username[MAXLEN];
|
||||||
|
char dest_dir[MAXPGPATH];
|
||||||
|
char remote_user[MAXLEN];
|
||||||
|
char superuser[MAXLEN];
|
||||||
|
char masterport[MAXLEN];
|
||||||
|
bool conninfo_provided;
|
||||||
|
bool connection_param_provided;
|
||||||
|
bool host_param_provided;
|
||||||
|
|
||||||
|
/* standby clone parameters */
|
||||||
|
bool wal_keep_segments_used;
|
||||||
|
char wal_keep_segments[MAXLEN];
|
||||||
bool ignore_rsync_warn;
|
bool ignore_rsync_warn;
|
||||||
bool initdb_no_pwprompt;
|
|
||||||
bool rsync_only;
|
bool rsync_only;
|
||||||
bool fast_checkpoint;
|
bool fast_checkpoint;
|
||||||
bool ignore_external_config_files;
|
bool without_barman;
|
||||||
char masterport[MAXLEN];
|
bool no_upstream_connection;
|
||||||
char localport[MAXLEN];
|
bool no_conninfo_password;
|
||||||
char loglevel[MAXLEN];
|
bool copy_external_config_files;
|
||||||
|
int copy_external_config_files_destination;
|
||||||
/* parameter used by CLUSTER CLEANUP */
|
char upstream_conninfo[MAXLEN];
|
||||||
int keep_history;
|
char replication_user[MAXLEN];
|
||||||
|
|
||||||
char pg_bindir[MAXLEN];
|
|
||||||
|
|
||||||
char recovery_min_apply_delay[MAXLEN];
|
char recovery_min_apply_delay[MAXLEN];
|
||||||
|
|
||||||
|
/* standby register parameters */
|
||||||
|
bool wait_register_sync;
|
||||||
|
int wait_register_sync_seconds;
|
||||||
|
|
||||||
|
/* witness create parameters */
|
||||||
|
bool witness_pwprompt;
|
||||||
|
|
||||||
|
/* standby follow parameters */
|
||||||
|
bool wait_for_master;
|
||||||
|
|
||||||
|
/* cluster {show|matrix|crosscheck} parameters */
|
||||||
|
bool csv_mode;
|
||||||
|
|
||||||
|
/* cluster cleanup parameters */
|
||||||
|
int keep_history;
|
||||||
|
|
||||||
|
/* standby switchover parameters */
|
||||||
|
char remote_config_file[MAXLEN];
|
||||||
|
bool pg_rewind_supplied;
|
||||||
|
char pg_rewind[MAXPGPATH];
|
||||||
|
char pg_ctl_mode[MAXLEN];
|
||||||
|
|
||||||
|
/* standby {archive_config | restore_config} parameters */
|
||||||
|
char config_archive_dir[MAXLEN];
|
||||||
|
|
||||||
|
/* {standby|witness} unregister parameters */
|
||||||
|
int node;
|
||||||
|
|
||||||
} t_runtime_options;
|
} t_runtime_options;
|
||||||
|
|
||||||
#define T_RUNTIME_OPTIONS_INITIALIZER { "", "", "", "", "", "", "", DEFAULT_WAL_KEEP_SEGMENTS, false, false, false, false, false, false, false, false, false, "", "", "", 0, "", "" }
|
#define T_RUNTIME_OPTIONS_INITIALIZER { \
|
||||||
|
/* general repmgr options */ \
|
||||||
|
"", false, false, false, "", \
|
||||||
|
/* logging parameters */ \
|
||||||
|
"", false, \
|
||||||
|
/* connection parameters */ \
|
||||||
|
"", "", "", "", "", "", "", \
|
||||||
|
false, false, false, \
|
||||||
|
/* standby clone parameters */ \
|
||||||
|
false, DEFAULT_WAL_KEEP_SEGMENTS, false, false, false, false, false, false, \
|
||||||
|
false, CONFIG_FILE_SAMEPATH, "", "", "", \
|
||||||
|
/* standby register parameters */ \
|
||||||
|
false, 0, \
|
||||||
|
/* witness create parameters */ \
|
||||||
|
false, \
|
||||||
|
/* standby follow parameters */ \
|
||||||
|
false, \
|
||||||
|
/* cluster {show|matrix|crosscheck} parameters */ \
|
||||||
|
false, \
|
||||||
|
/* cluster cleanup parameters */ \
|
||||||
|
0, \
|
||||||
|
/* standby switchover parameters */ \
|
||||||
|
"", false, "", "fast", \
|
||||||
|
/* standby {archive_config | restore_config} parameters */ \
|
||||||
|
"", \
|
||||||
|
/* {standby|witness} unregister parameters */ \
|
||||||
|
UNKNOWN_NODE_ID }
|
||||||
|
|
||||||
|
struct BackupLabel
|
||||||
|
{
|
||||||
|
XLogRecPtr start_wal_location;
|
||||||
|
char start_wal_file[MAXLEN];
|
||||||
|
XLogRecPtr checkpoint_location;
|
||||||
|
char backup_from[MAXLEN];
|
||||||
|
char backup_method[MAXLEN];
|
||||||
|
char start_time[MAXLEN];
|
||||||
|
char label[MAXLEN];
|
||||||
|
XLogRecPtr min_failover_slot_lsn;
|
||||||
|
};
|
||||||
|
|
||||||
|
|
||||||
|
typedef struct
|
||||||
|
{
|
||||||
|
char slot[MAXLEN];
|
||||||
|
char xlog_method[MAXLEN];
|
||||||
|
bool no_slot; /* from PostgreSQL 10 */
|
||||||
|
} t_basebackup_options;
|
||||||
|
|
||||||
|
#define T_BASEBACKUP_OPTIONS_INITIALIZER { "", "", false }
|
||||||
|
|
||||||
|
typedef struct
|
||||||
|
{
|
||||||
|
int size;
|
||||||
|
char **keywords;
|
||||||
|
char **values;
|
||||||
|
} t_conninfo_param_list;
|
||||||
|
|
||||||
|
typedef struct
|
||||||
|
{
|
||||||
|
char filepath[MAXPGPATH];
|
||||||
|
char filename[MAXPGPATH];
|
||||||
|
bool in_data_directory;
|
||||||
|
} t_configfile_info;
|
||||||
|
|
||||||
|
|
||||||
|
typedef struct
|
||||||
|
{
|
||||||
|
int size;
|
||||||
|
int entries;
|
||||||
|
t_configfile_info **files;
|
||||||
|
} t_configfile_list;
|
||||||
|
|
||||||
|
#define T_CONFIGFILE_LIST_INITIALIZER { 0, 0, NULL }
|
||||||
|
|
||||||
|
|
||||||
|
typedef struct
|
||||||
|
{
|
||||||
|
int node_id;
|
||||||
|
int node_status;
|
||||||
|
} t_node_status_rec;
|
||||||
|
|
||||||
|
typedef struct
|
||||||
|
{
|
||||||
|
int node_id;
|
||||||
|
char node_name[MAXLEN];
|
||||||
|
t_node_status_rec **node_status_list;
|
||||||
|
} t_node_matrix_rec;
|
||||||
|
|
||||||
|
typedef struct
|
||||||
|
{
|
||||||
|
int node_id;
|
||||||
|
char node_name[MAXLEN];
|
||||||
|
t_node_matrix_rec **matrix_list_rec;
|
||||||
|
} t_node_status_cube;
|
||||||
|
|
||||||
extern char repmgr_schema[MAXLEN];
|
|
||||||
|
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|||||||
11
repmgr.sql
11
repmgr.sql
@@ -1,7 +1,7 @@
|
|||||||
/*
|
/*
|
||||||
* repmgr.sql
|
* repmgr.sql
|
||||||
*
|
*
|
||||||
* Copyright (C) 2ndQuadrant, 2010-2015
|
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
*
|
*
|
||||||
*/
|
*/
|
||||||
|
|
||||||
@@ -59,3 +59,12 @@ WHERE (standby_node, last_monitor_time) IN (SELECT standby_node, MAX(last_monito
|
|||||||
ALTER VIEW repl_status OWNER TO repmgr;
|
ALTER VIEW repl_status OWNER TO repmgr;
|
||||||
|
|
||||||
CREATE INDEX idx_repl_status_sort ON repl_monitor(last_monitor_time, standby_node);
|
CREATE INDEX idx_repl_status_sort ON repl_monitor(last_monitor_time, standby_node);
|
||||||
|
|
||||||
|
/*
|
||||||
|
* This view shows the list of nodes with the information of which one is the upstream
|
||||||
|
* in each case (when applicable)
|
||||||
|
*/
|
||||||
|
CREATE VIEW repl_show_nodes AS
|
||||||
|
SELECT rn.id, rn.conninfo, rn.type, rn.name, rn.cluster,
|
||||||
|
rn.priority, rn.active, sq.name AS upstream_node_name
|
||||||
|
FROM repl_nodes as rn LEFT JOIN repl_nodes AS sq ON sq.id=rn.upstream_node_id;
|
||||||
|
|||||||
@@ -1,7 +1,7 @@
|
|||||||
#
|
#
|
||||||
# Makefile
|
# Makefile
|
||||||
#
|
#
|
||||||
# Copyright (c) 2ndQuadrant, 2010-2015
|
# Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
#
|
#
|
||||||
|
|
||||||
MODULE_big = repmgr_funcs
|
MODULE_big = repmgr_funcs
|
||||||
|
|||||||
@@ -63,6 +63,15 @@ UPDATE repl_nodes SET type = 'master' WHERE id = $master_id;
|
|||||||
|
|
||||||
-- UPDATE repl_nodes SET active = FALSE WHERE id IN (...);
|
-- UPDATE repl_nodes SET active = FALSE WHERE id IN (...);
|
||||||
|
|
||||||
|
/* There's also an event table which we need to create */
|
||||||
|
CREATE TABLE repl_events (
|
||||||
|
node_id INTEGER NOT NULL,
|
||||||
|
event TEXT NOT NULL,
|
||||||
|
successful BOOLEAN NOT NULL DEFAULT TRUE,
|
||||||
|
event_timestamp TIMESTAMP WITH TIME ZONE NOT NULL DEFAULT CURRENT_TIMESTAMP,
|
||||||
|
details TEXT NULL
|
||||||
|
);
|
||||||
|
|
||||||
/* When you're sure of your changes, commit them */
|
/* When you're sure of your changes, commit them */
|
||||||
|
|
||||||
-- COMMIT;
|
-- COMMIT;
|
||||||
|
|||||||
35
sql/repmgr3.0_repmgr3.1.sql
Normal file
35
sql/repmgr3.0_repmgr3.1.sql
Normal file
@@ -0,0 +1,35 @@
|
|||||||
|
/*
|
||||||
|
* Update a repmgr 3.0 installation to repmgr 3.1
|
||||||
|
* ----------------------------------------------
|
||||||
|
*
|
||||||
|
* The new repmgr package should be installed first. Then
|
||||||
|
* carry out these steps:
|
||||||
|
*
|
||||||
|
* 1. (If repmgrd is used) stop any running repmgrd instances
|
||||||
|
* 2. On the master node, execute the SQL statements listed below
|
||||||
|
* 3. (If repmgrd is used) restart repmgrd
|
||||||
|
*/
|
||||||
|
|
||||||
|
/*
|
||||||
|
* If your repmgr installation is not included in your repmgr
|
||||||
|
* user's search path, please set the search path to the name
|
||||||
|
* of the repmgr schema to ensure objects are installed in
|
||||||
|
* the correct location.
|
||||||
|
*
|
||||||
|
* The repmgr schema is "repmgr_" + the cluster name defined in
|
||||||
|
* 'repmgr.conf'.
|
||||||
|
*/
|
||||||
|
|
||||||
|
-- SET search_path TO 'name_of_repmgr_schema';
|
||||||
|
|
||||||
|
BEGIN;
|
||||||
|
|
||||||
|
-- New view "repl_show_nodes" which also displays the server's
|
||||||
|
-- upstream node
|
||||||
|
|
||||||
|
CREATE VIEW repl_show_nodes AS
|
||||||
|
SELECT rn.id, rn.conninfo, rn.type, rn.name, rn.cluster,
|
||||||
|
rn.priority, rn.active, sq.name AS upstream_node_name
|
||||||
|
FROM repl_nodes as rn LEFT JOIN repl_nodes AS sq ON sq.id=rn.upstream_node_id;
|
||||||
|
|
||||||
|
COMMIT;
|
||||||
32
sql/repmgr3.1.1_repmgr3.1.2.sql
Normal file
32
sql/repmgr3.1.1_repmgr3.1.2.sql
Normal file
@@ -0,0 +1,32 @@
|
|||||||
|
/*
|
||||||
|
* Update a repmgr 3.1.1 installation to repmgr 3.1.2
|
||||||
|
* --------------------------------------------------
|
||||||
|
*
|
||||||
|
* This update is only required if repmgrd is being used in conjunction
|
||||||
|
* with a witness server.
|
||||||
|
*
|
||||||
|
* The new repmgr package should be installed first. Then
|
||||||
|
* carry out these steps:
|
||||||
|
*
|
||||||
|
* 1. (If repmgrd is used) stop any running repmgrd instances
|
||||||
|
* 2. On the master node, execute the SQL statement listed below
|
||||||
|
* 3. (If repmgrd is used) restart repmgrd
|
||||||
|
*/
|
||||||
|
|
||||||
|
/*
|
||||||
|
* If your repmgr installation is not included in your repmgr
|
||||||
|
* user's search path, please set the search path to the name
|
||||||
|
* of the repmgr schema to ensure objects are installed in
|
||||||
|
* the correct location.
|
||||||
|
*
|
||||||
|
* The repmgr schema is "repmgr_" + the cluster name defined in
|
||||||
|
* 'repmgr.conf'.
|
||||||
|
*/
|
||||||
|
|
||||||
|
-- SET search_path TO 'name_of_repmgr_schema';
|
||||||
|
|
||||||
|
BEGIN;
|
||||||
|
|
||||||
|
ALTER TABLE repl_nodes DROP CONSTRAINT repl_nodes_upstream_node_id_fkey,
|
||||||
|
ADD CONSTRAINT repl_nodes_upstream_node_id_fkey FOREIGN KEY (upstream_node_id) REFERENCES repl_nodes(id) DEFERRABLE;
|
||||||
|
COMMIT;
|
||||||
@@ -83,7 +83,12 @@ _PG_init(void)
|
|||||||
* resources in repmgr_shmem_startup().
|
* resources in repmgr_shmem_startup().
|
||||||
*/
|
*/
|
||||||
RequestAddinShmemSpace(repmgr_memsize());
|
RequestAddinShmemSpace(repmgr_memsize());
|
||||||
|
|
||||||
|
#if (PG_VERSION_NUM >= 90600)
|
||||||
|
RequestNamedLWLockTranche("repmgr", 1);
|
||||||
|
#else
|
||||||
RequestAddinLWLocks(1);
|
RequestAddinLWLocks(1);
|
||||||
|
#endif
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* Install hooks.
|
* Install hooks.
|
||||||
@@ -128,7 +133,11 @@ repmgr_shmem_startup(void)
|
|||||||
if (!found)
|
if (!found)
|
||||||
{
|
{
|
||||||
/* First time through ... */
|
/* First time through ... */
|
||||||
|
#if (PG_VERSION_NUM >= 90600)
|
||||||
|
shared_state->lock = &(GetNamedLWLockTranche("repmgr"))->lock;
|
||||||
|
#else
|
||||||
shared_state->lock = LWLockAssign();
|
shared_state->lock = LWLockAssign();
|
||||||
|
#endif
|
||||||
snprintf(shared_state->location,
|
snprintf(shared_state->location,
|
||||||
sizeof(shared_state->location), "%X/%X", 0, 0);
|
sizeof(shared_state->location), "%X/%X", 0, 0);
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* repmgr_function.sql
|
* repmgr_function.sql
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2015
|
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
*
|
*
|
||||||
*/
|
*/
|
||||||
|
|
||||||
|
|||||||
4
sql/repmgr_test.sql
Normal file
4
sql/repmgr_test.sql
Normal file
@@ -0,0 +1,4 @@
|
|||||||
|
select * from repmgr_update_standby_location('');
|
||||||
|
select * from repmgr_get_last_standby_location();
|
||||||
|
select * from repmgr_update_last_updated();
|
||||||
|
select * from repmgr_get_last_updated();
|
||||||
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* uninstall_repmgr_funcs.sql
|
* uninstall_repmgr_funcs.sql
|
||||||
* Copyright (c) 2ndQuadrant, 2010-2015
|
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
*
|
*
|
||||||
*/
|
*/
|
||||||
|
|
||||||
|
|||||||
20
strutil.c
20
strutil.c
@@ -1,7 +1,7 @@
|
|||||||
/*
|
/*
|
||||||
* strutil.c
|
* strutil.c
|
||||||
*
|
*
|
||||||
* Copyright (C) 2ndQuadrant, 2010-2015
|
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
* it under the terms of the GNU General Public License as published by
|
* it under the terms of the GNU General Public License as published by
|
||||||
@@ -87,3 +87,21 @@ maxlen_snprintf(char *str, const char *format,...)
|
|||||||
|
|
||||||
return retval;
|
return retval;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Escape a string for use as a parameter in recovery.conf
|
||||||
|
* Caller must free returned value
|
||||||
|
*/
|
||||||
|
char *
|
||||||
|
escape_recovery_conf_value(const char *src)
|
||||||
|
{
|
||||||
|
char *result = escape_single_quotes_ascii(src);
|
||||||
|
|
||||||
|
if (!result)
|
||||||
|
{
|
||||||
|
fprintf(stderr, _("%s: out of memory\n"), progname());
|
||||||
|
exit(ERR_INTERNAL);
|
||||||
|
}
|
||||||
|
return result;
|
||||||
|
}
|
||||||
|
|||||||
10
strutil.h
10
strutil.h
@@ -1,6 +1,6 @@
|
|||||||
/*
|
/*
|
||||||
* strutil.h
|
* strutil.h
|
||||||
* Copyright (C) 2ndQuadrant, 2010-2015
|
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
*
|
*
|
||||||
*
|
*
|
||||||
* This program is free software: you can redistribute it and/or modify
|
* This program is free software: you can redistribute it and/or modify
|
||||||
@@ -22,14 +22,20 @@
|
|||||||
#define _STRUTIL_H_
|
#define _STRUTIL_H_
|
||||||
|
|
||||||
#include <stdlib.h>
|
#include <stdlib.h>
|
||||||
|
#include "pqexpbuffer.h"
|
||||||
#include "errcode.h"
|
#include "errcode.h"
|
||||||
|
|
||||||
|
|
||||||
#define QUERY_STR_LEN 8192
|
#define QUERY_STR_LEN 8192
|
||||||
#define MAXLEN 1024
|
#define MAXLEN 1024
|
||||||
#define MAXLINELENGTH 4096
|
#define MAXLINELENGTH 4096
|
||||||
#define MAXVERSIONSTR 16
|
#define MAXVERSIONSTR 16
|
||||||
#define MAXCONNINFO 1024
|
#define MAXCONNINFO 1024
|
||||||
|
|
||||||
|
/* Why? http://stackoverflow.com/a/5459929/398670 */
|
||||||
|
#define STR(x) CppAsString(x)
|
||||||
|
|
||||||
|
#define MAXLEN_STR STR(MAXLEN)
|
||||||
|
|
||||||
extern int
|
extern int
|
||||||
xsnprintf(char *str, size_t size, const char *format,...)
|
xsnprintf(char *str, size_t size, const char *format,...)
|
||||||
@@ -43,4 +49,6 @@ extern int
|
|||||||
maxlen_snprintf(char *str, const char *format,...)
|
maxlen_snprintf(char *str, const char *format,...)
|
||||||
__attribute__((format(PG_PRINTF_ATTRIBUTE, 2, 3)));
|
__attribute__((format(PG_PRINTF_ATTRIBUTE, 2, 3)));
|
||||||
|
|
||||||
|
extern char *
|
||||||
|
escape_recovery_conf_value(const char *src);
|
||||||
#endif /* _STRUTIL_H_ */
|
#endif /* _STRUTIL_H_ */
|
||||||
|
|||||||
@@ -1,7 +1,7 @@
|
|||||||
/*
|
/*
|
||||||
* uninstall_repmgr.sql
|
* uninstall_repmgr.sql
|
||||||
*
|
*
|
||||||
* Copyright (C) 2ndQuadrant, 2010-2015
|
* Copyright (c) 2ndQuadrant, 2010-2017
|
||||||
*
|
*
|
||||||
*/
|
*/
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user