mirror of
https://github.com/EnterpriseDB/repmgr.git
synced 2026-03-22 22:56:29 +00:00
1859 lines
42 KiB
C
1859 lines
42 KiB
C
/*
|
|
* dbutils.c - Database connection/management functions
|
|
* Copyright (C) 2ndQuadrant, 2010-2016
|
|
*
|
|
* This program is free software: you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation, either version 3 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
*
|
|
*/
|
|
|
|
#include <unistd.h>
|
|
#include <time.h>
|
|
#include <sys/time.h>
|
|
|
|
#include "repmgr.h"
|
|
#include "config.h"
|
|
#include "strutil.h"
|
|
#include "log.h"
|
|
|
|
#include "catalog/pg_control.h"
|
|
|
|
char repmgr_schema[MAXLEN] = "";
|
|
char repmgr_schema_quoted[MAXLEN] = "";
|
|
|
|
static int _get_node_record(PGconn *conn, char *cluster, char *sqlquery, t_node_info *node_info);
|
|
|
|
PGconn *
|
|
_establish_db_connection(const char *conninfo, const bool exit_on_error, const bool log_notice)
|
|
{
|
|
/* Make a connection to the database */
|
|
PGconn *conn = NULL;
|
|
char connection_string[MAXLEN];
|
|
|
|
strcpy(connection_string, conninfo);
|
|
strcat(connection_string, " fallback_application_name='repmgr'");
|
|
|
|
log_debug(_("connecting to: '%s'\n"), connection_string);
|
|
|
|
conn = PQconnectdb(connection_string);
|
|
|
|
/* Check to see that the backend connection was successfully made */
|
|
if ((PQstatus(conn) != CONNECTION_OK))
|
|
{
|
|
if (log_notice)
|
|
{
|
|
log_notice(_("connection to database failed: %s\n"),
|
|
PQerrorMessage(conn));
|
|
}
|
|
else
|
|
{
|
|
log_err(_("connection to database failed: %s\n"),
|
|
PQerrorMessage(conn));
|
|
}
|
|
|
|
if (exit_on_error)
|
|
{
|
|
PQfinish(conn);
|
|
exit(ERR_DB_CON);
|
|
}
|
|
}
|
|
|
|
return conn;
|
|
}
|
|
|
|
PGconn *
|
|
establish_db_connection(const char *conninfo, const bool exit_on_error)
|
|
{
|
|
return _establish_db_connection(conninfo, exit_on_error, false);
|
|
}
|
|
|
|
PGconn *
|
|
test_db_connection(const char *conninfo, const bool exit_on_error)
|
|
{
|
|
return _establish_db_connection(conninfo, exit_on_error, true);
|
|
}
|
|
|
|
|
|
PGconn *
|
|
establish_db_connection_by_params(const char *keywords[], const char *values[],
|
|
const bool exit_on_error)
|
|
{
|
|
/* Make a connection to the database */
|
|
PGconn *conn = PQconnectdbParams(keywords, values, true);
|
|
|
|
/* Check to see that the backend connection was successfully made */
|
|
if ((PQstatus(conn) != CONNECTION_OK))
|
|
{
|
|
log_err(_("connection to database failed: %s\n"),
|
|
PQerrorMessage(conn));
|
|
if (exit_on_error)
|
|
{
|
|
PQfinish(conn);
|
|
exit(ERR_DB_CON);
|
|
}
|
|
}
|
|
|
|
return conn;
|
|
}
|
|
|
|
|
|
bool
|
|
begin_transaction(PGconn *conn)
|
|
{
|
|
PGresult *res;
|
|
|
|
log_verbose(LOG_DEBUG, "begin_transaction()\n");
|
|
|
|
res = PQexec(conn, "BEGIN");
|
|
|
|
if (PQresultStatus(res) != PGRES_COMMAND_OK)
|
|
{
|
|
log_err(_("Unable to begin transaction: %s\n"),
|
|
PQerrorMessage(conn));
|
|
|
|
PQclear(res);
|
|
return false;
|
|
}
|
|
|
|
PQclear(res);
|
|
|
|
return true;
|
|
}
|
|
|
|
|
|
bool
|
|
commit_transaction(PGconn *conn)
|
|
{
|
|
PGresult *res;
|
|
|
|
log_verbose(LOG_DEBUG, "commit_transaction()\n");
|
|
|
|
res = PQexec(conn, "COMMIT");
|
|
|
|
if (PQresultStatus(res) != PGRES_COMMAND_OK)
|
|
{
|
|
log_err(_("Unable to commit transaction: %s\n"),
|
|
PQerrorMessage(conn));
|
|
PQclear(res);
|
|
|
|
return false;
|
|
}
|
|
|
|
PQclear(res);
|
|
|
|
return true;
|
|
}
|
|
|
|
|
|
bool
|
|
rollback_transaction(PGconn *conn)
|
|
{
|
|
PGresult *res;
|
|
|
|
log_verbose(LOG_DEBUG, "rollback_transaction()\n");
|
|
|
|
res = PQexec(conn, "ROLLBACK");
|
|
|
|
if (PQresultStatus(res) != PGRES_COMMAND_OK)
|
|
{
|
|
log_err(_("Unable to rollback transaction: %s\n"),
|
|
PQerrorMessage(conn));
|
|
PQclear(res);
|
|
|
|
return false;
|
|
}
|
|
|
|
PQclear(res);
|
|
|
|
return true;
|
|
}
|
|
|
|
|
|
bool
|
|
check_cluster_schema(PGconn *conn)
|
|
{
|
|
PGresult *res;
|
|
char sqlquery[QUERY_STR_LEN];
|
|
|
|
sqlquery_snprintf(sqlquery,
|
|
"SELECT 1 FROM pg_namespace WHERE nspname = '%s'",
|
|
get_repmgr_schema());
|
|
|
|
log_verbose(LOG_DEBUG, "check_cluster_schema(): %s\n", sqlquery);
|
|
|
|
res = PQexec(conn, sqlquery);
|
|
if (PQresultStatus(res) != PGRES_TUPLES_OK)
|
|
{
|
|
log_err(_("check_cluster_schema(): unable to check cluster schema: %s\n"),
|
|
PQerrorMessage(conn));
|
|
PQclear(res);
|
|
return false;
|
|
}
|
|
|
|
if (PQntuples(res) == 0)
|
|
{
|
|
/* schema doesn't exist */
|
|
log_debug(_("check_cluster_schema(): schema '%s' doesn't exist\n"), get_repmgr_schema());
|
|
PQclear(res);
|
|
|
|
return false;
|
|
}
|
|
|
|
PQclear(res);
|
|
|
|
return true;
|
|
}
|
|
|
|
|
|
int
|
|
is_standby(PGconn *conn)
|
|
{
|
|
PGresult *res;
|
|
int result = 0;
|
|
char *sqlquery = "SELECT pg_catalog.pg_is_in_recovery()";
|
|
|
|
log_verbose(LOG_DEBUG, "is_standby(): %s\n", sqlquery);
|
|
|
|
res = PQexec(conn, sqlquery);
|
|
|
|
if (res == NULL || PQresultStatus(res) != PGRES_TUPLES_OK)
|
|
{
|
|
log_err(_("Unable to query server mode: %s\n"),
|
|
PQerrorMessage(conn));
|
|
result = -1;
|
|
}
|
|
else if (PQntuples(res) == 1 && strcmp(PQgetvalue(res, 0, 0), "t") == 0)
|
|
{
|
|
result = 1;
|
|
}
|
|
|
|
PQclear(res);
|
|
return result;
|
|
}
|
|
|
|
|
|
/* check the PQStatus and try to 'select 1' to confirm good connection */
|
|
bool
|
|
is_pgup(PGconn *conn, int timeout)
|
|
{
|
|
char sqlquery[QUERY_STR_LEN];
|
|
|
|
/* Check the connection status twice in case it changes after reset */
|
|
bool twice = false;
|
|
|
|
/* Check the connection status twice in case it changes after reset */
|
|
for (;;)
|
|
{
|
|
if (PQstatus(conn) != CONNECTION_OK)
|
|
{
|
|
if (twice)
|
|
return false;
|
|
PQreset(conn); /* reconnect */
|
|
twice = true;
|
|
}
|
|
else
|
|
{
|
|
/*
|
|
* Send a SELECT 1 just to check if the connection is OK
|
|
*/
|
|
if (!cancel_query(conn, timeout))
|
|
goto failed;
|
|
if (wait_connection_availability(conn, timeout) != 1)
|
|
goto failed;
|
|
|
|
sqlquery_snprintf(sqlquery, "SELECT 1");
|
|
if (PQsendQuery(conn, sqlquery) == 0)
|
|
{
|
|
log_warning(_("PQsendQuery: Query could not be sent to primary. %s\n"),
|
|
PQerrorMessage(conn));
|
|
goto failed;
|
|
}
|
|
if (wait_connection_availability(conn, timeout) != 1)
|
|
goto failed;
|
|
|
|
break;
|
|
|
|
failed:
|
|
|
|
/*
|
|
* we need to retry, because we might just have lost the
|
|
* connection once
|
|
*/
|
|
if (twice)
|
|
return false;
|
|
PQreset(conn); /* reconnect */
|
|
twice = true;
|
|
}
|
|
}
|
|
return true;
|
|
}
|
|
|
|
|
|
/*
|
|
* Return the id of the active master node, or NODE_NOT_FOUND if no
|
|
* record available.
|
|
*
|
|
* This reports the value stored in the database only and
|
|
* does not verify whether the node is actually available
|
|
*/
|
|
int
|
|
get_master_node_id(PGconn *conn, char *cluster)
|
|
{
|
|
char sqlquery[QUERY_STR_LEN];
|
|
PGresult *res;
|
|
int retval;
|
|
|
|
sqlquery_snprintf(sqlquery,
|
|
"SELECT id "
|
|
" FROM %s.repl_nodes "
|
|
" WHERE cluster = '%s' "
|
|
" AND type = 'master' "
|
|
" AND active IS TRUE ",
|
|
get_repmgr_schema_quoted(conn),
|
|
cluster);
|
|
|
|
log_verbose(LOG_DEBUG, "get_master_node_id():\n%s\n", sqlquery);
|
|
|
|
res = PQexec(conn, sqlquery);
|
|
if (PQresultStatus(res) != PGRES_TUPLES_OK)
|
|
{
|
|
log_err(_("get_master_node_id(): query failed\n%s\n"),
|
|
PQerrorMessage(conn));
|
|
retval = NODE_NOT_FOUND;
|
|
}
|
|
else if (PQntuples(res) == 0)
|
|
{
|
|
log_verbose(LOG_WARNING, _("get_master_node_id(): no active primary found\n"));
|
|
retval = NODE_NOT_FOUND;
|
|
}
|
|
else
|
|
{
|
|
retval = atoi(PQgetvalue(res, 0, 0));
|
|
}
|
|
PQclear(res);
|
|
|
|
return retval;
|
|
}
|
|
|
|
|
|
/*
|
|
* Return the server version number for the connection provided
|
|
*/
|
|
int
|
|
get_server_version(PGconn *conn, char *server_version)
|
|
{
|
|
PGresult *res;
|
|
res = PQexec(conn,
|
|
"SELECT current_setting('server_version_num'), "
|
|
" current_setting('server_version')");
|
|
|
|
if (PQresultStatus(res) != PGRES_TUPLES_OK)
|
|
{
|
|
log_err(_("unable to determine server version number:\n%s"),
|
|
PQerrorMessage(conn));
|
|
PQclear(res);
|
|
return -1;
|
|
}
|
|
|
|
if (server_version != NULL)
|
|
strcpy(server_version, PQgetvalue(res, 0, 0));
|
|
|
|
return atoi(PQgetvalue(res, 0, 0));
|
|
}
|
|
|
|
|
|
int
|
|
guc_set(PGconn *conn, const char *parameter, const char *op,
|
|
const char *value)
|
|
{
|
|
PGresult *res;
|
|
char sqlquery[QUERY_STR_LEN];
|
|
int retval = 1;
|
|
|
|
sqlquery_snprintf(sqlquery,
|
|
"SELECT true FROM pg_settings "
|
|
" WHERE name = '%s' AND setting %s '%s'",
|
|
parameter, op, value);
|
|
|
|
log_verbose(LOG_DEBUG, "guc_set():\n%s\n", sqlquery);
|
|
|
|
res = PQexec(conn, sqlquery);
|
|
if (PQresultStatus(res) != PGRES_TUPLES_OK)
|
|
{
|
|
log_err(_("guc_set(): unable to execute query\n%s\n"),
|
|
PQerrorMessage(conn));
|
|
retval = -1;
|
|
}
|
|
else if (PQntuples(res) == 0)
|
|
{
|
|
retval = 0;
|
|
}
|
|
|
|
PQclear(res);
|
|
|
|
return retval;
|
|
}
|
|
|
|
/**
|
|
* Just like guc_set except with an extra parameter containing the name of
|
|
* the pg datatype so that the comparison can be done properly.
|
|
*/
|
|
int
|
|
guc_set_typed(PGconn *conn, const char *parameter, const char *op,
|
|
const char *value, const char *datatype)
|
|
{
|
|
PGresult *res;
|
|
char sqlquery[QUERY_STR_LEN];
|
|
int retval = 1;
|
|
|
|
sqlquery_snprintf(sqlquery,
|
|
"SELECT true FROM pg_settings "
|
|
" WHERE name = '%s' AND setting::%s %s '%s'::%s",
|
|
parameter, datatype, op, value, datatype);
|
|
|
|
log_verbose(LOG_DEBUG, "guc_set_typed():\n%s\n", sqlquery);
|
|
|
|
res = PQexec(conn, sqlquery);
|
|
if (PQresultStatus(res) != PGRES_TUPLES_OK)
|
|
{
|
|
log_err(_("guc_set_typed(): unable to execute query\n%s\n"),
|
|
PQerrorMessage(conn));
|
|
retval = -1;
|
|
}
|
|
else if (PQntuples(res) == 0)
|
|
{
|
|
retval = 0;
|
|
}
|
|
|
|
PQclear(res);
|
|
|
|
return retval;
|
|
}
|
|
|
|
|
|
bool
|
|
get_cluster_size(PGconn *conn, char *size)
|
|
{
|
|
PGresult *res;
|
|
char sqlquery[QUERY_STR_LEN];
|
|
|
|
sqlquery_snprintf(sqlquery,
|
|
"SELECT pg_catalog.pg_size_pretty(SUM(pg_catalog.pg_database_size(oid))::bigint) "
|
|
" FROM pg_database ");
|
|
|
|
log_verbose(LOG_DEBUG, "get_cluster_size():\n%s\n", sqlquery);
|
|
|
|
res = PQexec(conn, sqlquery);
|
|
if (res == NULL || PQresultStatus(res) != PGRES_TUPLES_OK)
|
|
{
|
|
log_err(_("get_cluster_size(): unable to execute query\n%s\n"),
|
|
PQerrorMessage(conn));
|
|
|
|
PQclear(res);
|
|
return false;
|
|
}
|
|
|
|
strncpy(size, PQgetvalue(res, 0, 0), MAXLEN);
|
|
|
|
PQclear(res);
|
|
return true;
|
|
}
|
|
|
|
|
|
bool
|
|
get_pg_setting(PGconn *conn, const char *setting, char *output)
|
|
{
|
|
char sqlquery[QUERY_STR_LEN];
|
|
PGresult *res;
|
|
int i;
|
|
bool success = true;
|
|
|
|
sqlquery_snprintf(sqlquery,
|
|
"SELECT name, setting "
|
|
" FROM pg_settings WHERE name = '%s'",
|
|
setting);
|
|
|
|
log_verbose(LOG_DEBUG, "get_pg_setting(): %s\n", sqlquery);
|
|
|
|
res = PQexec(conn, sqlquery);
|
|
|
|
if (res == NULL || PQresultStatus(res) != PGRES_TUPLES_OK)
|
|
{
|
|
log_err(_("get_pg_setting() - PQexec failed: %s"),
|
|
PQerrorMessage(conn));
|
|
PQclear(res);
|
|
return false;
|
|
}
|
|
|
|
for (i = 0; i < PQntuples(res); i++)
|
|
{
|
|
if (strcmp(PQgetvalue(res, i, 0), setting) == 0)
|
|
{
|
|
strncpy(output, PQgetvalue(res, i, 1), MAXLEN);
|
|
success = true;
|
|
break;
|
|
}
|
|
else
|
|
{
|
|
/* XXX highly unlikely this would ever happen */
|
|
log_err(_("get_pg_setting(): unknown parameter \"%s\""), PQgetvalue(res, i, 0));
|
|
}
|
|
}
|
|
|
|
if (success == true)
|
|
{
|
|
log_verbose(LOG_DEBUG, _("get_pg_setting(): returned value is \"%s\"\n"), output);
|
|
}
|
|
|
|
PQclear(res);
|
|
|
|
return success;
|
|
}
|
|
|
|
|
|
/*
|
|
* get_conninfo_value()
|
|
*
|
|
* Extract the value represented by 'keyword' in 'conninfo' and copy
|
|
* it to the 'output' buffer.
|
|
*
|
|
* Returns true on success, or false on failure (conninfo string could
|
|
* not be parsed, or provided keyword not found).
|
|
*/
|
|
|
|
bool
|
|
get_conninfo_value(const char *conninfo, const char *keyword, char *output)
|
|
{
|
|
PQconninfoOption *conninfo_options;
|
|
PQconninfoOption *conninfo_option;
|
|
|
|
conninfo_options = PQconninfoParse(conninfo, NULL);
|
|
|
|
if (conninfo_options == NULL)
|
|
{
|
|
log_err(_("Unable to parse provided conninfo string \"%s\""), conninfo);
|
|
return false;
|
|
}
|
|
|
|
for (conninfo_option = conninfo_options; conninfo_option->keyword != NULL; conninfo_option++)
|
|
{
|
|
if (strcmp(conninfo_option->keyword, keyword) == 0)
|
|
{
|
|
if (conninfo_option->val != NULL && conninfo_option->val[0] != '\0')
|
|
{
|
|
strncpy(output, conninfo_option->val, MAXLEN);
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
PQconninfoFree(conninfo_options);
|
|
|
|
return true;
|
|
}
|
|
|
|
|
|
/*
|
|
* get_upstream_connection()
|
|
*
|
|
* Returns connection to node's upstream node
|
|
*
|
|
* NOTE: will attempt to connect even if node is marked as inactive
|
|
*/
|
|
PGconn *
|
|
get_upstream_connection(PGconn *standby_conn, char *cluster, int node_id,
|
|
int *upstream_node_id_ptr, char *upstream_conninfo_out)
|
|
{
|
|
PGconn *upstream_conn = NULL;
|
|
PGresult *res;
|
|
char sqlquery[QUERY_STR_LEN];
|
|
char upstream_conninfo_stack[MAXCONNINFO];
|
|
char *upstream_conninfo = &*upstream_conninfo_stack;
|
|
|
|
/*
|
|
* If the caller wanted to get a copy of the connection info string, sub
|
|
* out the local stack pointer for the pointer passed by the caller.
|
|
*/
|
|
if (upstream_conninfo_out != NULL)
|
|
upstream_conninfo = upstream_conninfo_out;
|
|
|
|
sqlquery_snprintf(sqlquery,
|
|
" SELECT un.conninfo, un.id "
|
|
" FROM %s.repl_nodes un "
|
|
"INNER JOIN %s.repl_nodes n "
|
|
" ON (un.id = n.upstream_node_id AND un.cluster = n.cluster)"
|
|
" WHERE n.cluster = '%s' "
|
|
" AND n.id = %i ",
|
|
get_repmgr_schema_quoted(standby_conn),
|
|
get_repmgr_schema_quoted(standby_conn),
|
|
cluster,
|
|
node_id);
|
|
|
|
log_verbose(LOG_DEBUG, "get_upstream_connection():\n%s\n", sqlquery);
|
|
|
|
res = PQexec(standby_conn, sqlquery);
|
|
|
|
if (PQresultStatus(res) != PGRES_TUPLES_OK)
|
|
{
|
|
log_err(_("error when attempting to find upstream server\n%s\n"),
|
|
PQerrorMessage(standby_conn));
|
|
PQclear(res);
|
|
return NULL;
|
|
}
|
|
|
|
if (!PQntuples(res))
|
|
{
|
|
PQclear(res);
|
|
log_debug("no record found for upstream server\n");
|
|
|
|
sqlquery_snprintf(sqlquery,
|
|
" SELECT un.conninfo, un.id "
|
|
" FROM %s.repl_nodes un "
|
|
" WHERE un.cluster = '%s' "
|
|
" AND un.type='master' "
|
|
" AND un.active IS TRUE",
|
|
get_repmgr_schema_quoted(standby_conn),
|
|
cluster);
|
|
res = PQexec(standby_conn, sqlquery);
|
|
|
|
if (PQresultStatus(res) != PGRES_TUPLES_OK)
|
|
{
|
|
log_err(_("error when attempting to find active master server\n%s\n"),
|
|
PQerrorMessage(standby_conn));
|
|
PQclear(res);
|
|
return NULL;
|
|
}
|
|
|
|
if (!PQntuples(res))
|
|
{
|
|
PQclear(res);
|
|
log_notice(_("no record found for active master server\n"));
|
|
|
|
return NULL;
|
|
}
|
|
|
|
log_debug("record found for active master server\n");
|
|
}
|
|
|
|
strncpy(upstream_conninfo, PQgetvalue(res, 0, 0), MAXCONNINFO);
|
|
|
|
if (upstream_node_id_ptr != NULL)
|
|
*upstream_node_id_ptr = atoi(PQgetvalue(res, 0, 1));
|
|
|
|
PQclear(res);
|
|
|
|
log_verbose(LOG_DEBUG, "get_upstream_connection(): conninfo is \"%s\"\n", upstream_conninfo);
|
|
upstream_conn = establish_db_connection(upstream_conninfo, false);
|
|
|
|
if (PQstatus(upstream_conn) != CONNECTION_OK)
|
|
{
|
|
log_err(_("unable to connect to upstream node: %s\n"),
|
|
PQerrorMessage(upstream_conn));
|
|
return NULL;
|
|
}
|
|
|
|
return upstream_conn;
|
|
}
|
|
|
|
|
|
/*
|
|
* Read the node list from the local node and attempt to connect to each node
|
|
* in turn to definitely establish if it's the cluster primary.
|
|
*
|
|
* The node list is returned in the order which makes it likely that the
|
|
* current primary will be returned first, reducing the number of speculative
|
|
* connections which need to be made to other nodes.
|
|
*
|
|
* If master_conninfo_out points to allocated memory of MAXCONNINFO in length,
|
|
* the primary server's conninfo string will be copied there.
|
|
*/
|
|
|
|
PGconn *
|
|
get_master_connection(PGconn *standby_conn, char *cluster,
|
|
int *master_id, char *master_conninfo_out)
|
|
{
|
|
PGconn *remote_conn = NULL;
|
|
PGresult *res;
|
|
char sqlquery[QUERY_STR_LEN];
|
|
char remote_conninfo_stack[MAXCONNINFO];
|
|
char *remote_conninfo = &*remote_conninfo_stack;
|
|
|
|
int i,
|
|
node_id;
|
|
|
|
/*
|
|
* If the caller wanted to get a copy of the connection info string, sub
|
|
* out the local stack pointer for the pointer passed by the caller.
|
|
*/
|
|
if (master_conninfo_out != NULL)
|
|
remote_conninfo = master_conninfo_out;
|
|
|
|
if (master_id != NULL)
|
|
{
|
|
*master_id = NODE_NOT_FOUND;
|
|
}
|
|
|
|
/* find all nodes belonging to this cluster */
|
|
log_info(_("retrieving node list for cluster '%s'\n"),
|
|
cluster);
|
|
|
|
sqlquery_snprintf(sqlquery,
|
|
" SELECT id, conninfo, "
|
|
" CASE WHEN type = 'master' THEN 1 ELSE 2 END AS type_priority"
|
|
" FROM %s.repl_nodes "
|
|
" WHERE cluster = '%s' "
|
|
" AND type != 'witness' "
|
|
"ORDER BY active DESC, type_priority, priority, id",
|
|
get_repmgr_schema_quoted(standby_conn),
|
|
cluster);
|
|
|
|
log_verbose(LOG_DEBUG, "get_master_connection():\n%s\n", sqlquery);
|
|
|
|
res = PQexec(standby_conn, sqlquery);
|
|
if (PQresultStatus(res) != PGRES_TUPLES_OK)
|
|
{
|
|
log_err(_("unable to retrieve node records: %s\n"),
|
|
PQerrorMessage(standby_conn));
|
|
PQclear(res);
|
|
return NULL;
|
|
}
|
|
|
|
for (i = 0; i < PQntuples(res); i++)
|
|
{
|
|
int is_node_standby;
|
|
|
|
/* initialize with the values of the current node being processed */
|
|
node_id = atoi(PQgetvalue(res, i, 0));
|
|
strncpy(remote_conninfo, PQgetvalue(res, i, 1), MAXCONNINFO);
|
|
log_verbose(LOG_INFO,
|
|
_("checking role of cluster node '%i'\n"),
|
|
node_id);
|
|
remote_conn = establish_db_connection(remote_conninfo, false);
|
|
|
|
if (PQstatus(remote_conn) != CONNECTION_OK)
|
|
continue;
|
|
|
|
is_node_standby = is_standby(remote_conn);
|
|
|
|
if (is_node_standby == -1)
|
|
{
|
|
log_err(_("unable to retrieve recovery state from node %i:\n%s\n"),
|
|
node_id,
|
|
PQerrorMessage(remote_conn));
|
|
PQfinish(remote_conn);
|
|
continue;
|
|
}
|
|
|
|
/* if is_standby() returns 0, queried node is the master */
|
|
if (is_node_standby == 0)
|
|
{
|
|
PQclear(res);
|
|
log_debug(_("get_master_connection(): current master node is %i\n"), node_id);
|
|
|
|
if (master_id != NULL)
|
|
{
|
|
*master_id = node_id;
|
|
}
|
|
|
|
return remote_conn;
|
|
}
|
|
|
|
|
|
/* if it is a standby, clear connection info and continue*/
|
|
PQfinish(remote_conn);
|
|
}
|
|
|
|
/*
|
|
* If we finish this loop without finding a master then we doesn't have
|
|
* the info or the master has failed (or we reached max_connections or
|
|
* superuser_reserved_connections, anything else I'm missing?).
|
|
*
|
|
* Probably we will need to check the error to know if we need to start
|
|
* failover procedure or just fix some situation on the standby.
|
|
*/
|
|
PQclear(res);
|
|
return NULL;
|
|
}
|
|
|
|
|
|
/*
|
|
* wait until current query finishes ignoring any results, this could be an
|
|
* async command or a cancelation of a query
|
|
* return 1 if Ok; 0 if any error ocurred; -1 if timeout reached
|
|
*/
|
|
int
|
|
wait_connection_availability(PGconn *conn, long long timeout)
|
|
{
|
|
PGresult *res;
|
|
fd_set read_set;
|
|
int sock = PQsocket(conn);
|
|
struct timeval tmout,
|
|
before,
|
|
after;
|
|
struct timezone tz;
|
|
|
|
/* recalc to microseconds */
|
|
timeout *= 1000000;
|
|
|
|
while (timeout > 0)
|
|
{
|
|
if (PQconsumeInput(conn) == 0)
|
|
{
|
|
log_warning(_("wait_connection_availability(): could not receive data from connection. %s\n"),
|
|
PQerrorMessage(conn));
|
|
return 0;
|
|
}
|
|
|
|
if (PQisBusy(conn) == 0)
|
|
{
|
|
do
|
|
{
|
|
res = PQgetResult(conn);
|
|
PQclear(res);
|
|
} while (res != NULL);
|
|
|
|
break;
|
|
}
|
|
|
|
|
|
tmout.tv_sec = 0;
|
|
tmout.tv_usec = 250000;
|
|
|
|
FD_ZERO(&read_set);
|
|
FD_SET(sock, &read_set);
|
|
|
|
gettimeofday(&before, &tz);
|
|
if (select(sock, &read_set, NULL, NULL, &tmout) == -1)
|
|
{
|
|
log_warning(
|
|
_("wait_connection_availability(): select() returned with error\n%s\n"),
|
|
strerror(errno));
|
|
return -1;
|
|
}
|
|
gettimeofday(&after, &tz);
|
|
|
|
timeout -= (after.tv_sec * 1000000 + after.tv_usec) -
|
|
(before.tv_sec * 1000000 + before.tv_usec);
|
|
}
|
|
|
|
|
|
if (timeout >= 0)
|
|
{
|
|
return 1;
|
|
}
|
|
|
|
log_warning(_("wait_connection_availability(): timeout reached"));
|
|
return -1;
|
|
}
|
|
|
|
|
|
bool
|
|
cancel_query(PGconn *conn, int timeout)
|
|
{
|
|
char errbuf[ERRBUFF_SIZE];
|
|
PGcancel *pgcancel;
|
|
|
|
if (wait_connection_availability(conn, timeout) != 1)
|
|
return false;
|
|
|
|
pgcancel = PQgetCancel(conn);
|
|
|
|
if (pgcancel == NULL)
|
|
return false;
|
|
|
|
/*
|
|
* PQcancel can only return 0 if socket()/connect()/send() fails, in any
|
|
* of those cases we can assume something bad happened to the connection
|
|
*/
|
|
if (PQcancel(pgcancel, errbuf, ERRBUFF_SIZE) == 0)
|
|
{
|
|
log_warning(_("Can't stop current query: %s\n"), errbuf);
|
|
PQfreeCancel(pgcancel);
|
|
return false;
|
|
}
|
|
|
|
PQfreeCancel(pgcancel);
|
|
|
|
return true;
|
|
}
|
|
|
|
|
|
/* Return the repmgr schema as an unmodified string
|
|
* This is useful for displaying the schema name in log messages,
|
|
* however inclusion in SQL statements, get_repmgr_schema_quoted() should
|
|
* always be used.
|
|
*/
|
|
char *
|
|
get_repmgr_schema(void)
|
|
{
|
|
return repmgr_schema;
|
|
}
|
|
|
|
|
|
char *
|
|
get_repmgr_schema_quoted(PGconn *conn)
|
|
{
|
|
if (strcmp(repmgr_schema_quoted, "") == 0)
|
|
{
|
|
char *identifier = PQescapeIdentifier(conn, repmgr_schema,
|
|
strlen(repmgr_schema));
|
|
|
|
maxlen_snprintf(repmgr_schema_quoted, "%s", identifier);
|
|
PQfreemem(identifier);
|
|
}
|
|
|
|
return repmgr_schema_quoted;
|
|
}
|
|
|
|
|
|
bool
|
|
create_replication_slot(PGconn *conn, char *slot_name, int server_version_num)
|
|
{
|
|
char sqlquery[QUERY_STR_LEN];
|
|
int query_res;
|
|
PGresult *res;
|
|
t_replication_slot slot_info;
|
|
|
|
/*
|
|
* Check whether slot exists already; if it exists and is active, that
|
|
* means another active standby is using it, which creates an error situation;
|
|
* if not we can reuse it as-is
|
|
*/
|
|
|
|
query_res = get_slot_record(conn, slot_name, &slot_info);
|
|
|
|
if (query_res)
|
|
{
|
|
if (strcmp(slot_info.slot_type, "physical") != 0)
|
|
{
|
|
log_err(_("Slot '%s' exists and is not a physical slot\n"),
|
|
slot_name);
|
|
return false;
|
|
}
|
|
|
|
if (slot_info.active == false)
|
|
{
|
|
log_debug("Replication slot '%s' exists but is inactive; reusing\n",
|
|
slot_name);
|
|
|
|
return true;
|
|
}
|
|
|
|
log_err(_("Slot '%s' already exists as an active slot\n"),
|
|
slot_name);
|
|
return false;
|
|
}
|
|
|
|
/* In 9.6 and later, reserve the LSN straight away */
|
|
if (server_version_num >= 90600)
|
|
{
|
|
sqlquery_snprintf(sqlquery,
|
|
"SELECT * FROM pg_create_physical_replication_slot('%s', TRUE)",
|
|
slot_name);
|
|
}
|
|
else
|
|
{
|
|
sqlquery_snprintf(sqlquery,
|
|
"SELECT * FROM pg_create_physical_replication_slot('%s')",
|
|
slot_name);
|
|
}
|
|
|
|
log_debug(_("create_replication_slot(): Creating slot '%s' on primary\n"), slot_name);
|
|
log_verbose(LOG_DEBUG, "create_replication_slot():\n%s\n", sqlquery);
|
|
|
|
res = PQexec(conn, sqlquery);
|
|
if (!res || PQresultStatus(res) != PGRES_TUPLES_OK)
|
|
{
|
|
log_err(_("unable to create slot '%s' on the primary node: %s\n"),
|
|
slot_name,
|
|
PQerrorMessage(conn));
|
|
PQclear(res);
|
|
return false;
|
|
}
|
|
|
|
PQclear(res);
|
|
return true;
|
|
}
|
|
|
|
|
|
int
|
|
get_slot_record(PGconn *conn, char *slot_name, t_replication_slot *record)
|
|
{
|
|
char sqlquery[QUERY_STR_LEN];
|
|
PGresult *res;
|
|
|
|
sqlquery_snprintf(sqlquery,
|
|
"SELECT slot_name, slot_type, active "
|
|
" FROM pg_replication_slots "
|
|
" WHERE slot_name = '%s' ",
|
|
slot_name);
|
|
|
|
log_verbose(LOG_DEBUG, "get_slot_record():\n%s\n", sqlquery);
|
|
|
|
res = PQexec(conn, sqlquery);
|
|
if (!res || PQresultStatus(res) != PGRES_TUPLES_OK)
|
|
{
|
|
log_err(_("unable to query pg_replication_slots: %s\n"),
|
|
PQerrorMessage(conn));
|
|
PQclear(res);
|
|
return -1;
|
|
}
|
|
|
|
if (!PQntuples(res))
|
|
{
|
|
return 0;
|
|
}
|
|
|
|
strncpy(record->slot_name, PQgetvalue(res, 0, 0), MAXLEN);
|
|
strncpy(record->slot_type, PQgetvalue(res, 0, 1), MAXLEN);
|
|
record->active = (strcmp(PQgetvalue(res, 0, 2), "t") == 0)
|
|
? true
|
|
: false;
|
|
|
|
PQclear(res);
|
|
|
|
return 1;
|
|
}
|
|
|
|
bool
|
|
drop_replication_slot(PGconn *conn, char *slot_name)
|
|
{
|
|
char sqlquery[QUERY_STR_LEN];
|
|
PGresult *res;
|
|
sqlquery_snprintf(sqlquery,
|
|
"SELECT pg_drop_replication_slot('%s')",
|
|
slot_name);
|
|
|
|
log_verbose(LOG_DEBUG, "drop_replication_slot():\n%s\n", sqlquery);
|
|
|
|
res = PQexec(conn, sqlquery);
|
|
if (!res || PQresultStatus(res) != PGRES_TUPLES_OK)
|
|
{
|
|
log_err(_("unable to drop replication slot \"%s\":\n %s\n"),
|
|
slot_name,
|
|
PQerrorMessage(conn));
|
|
PQclear(res);
|
|
return false;
|
|
}
|
|
|
|
log_verbose(LOG_DEBUG, "replication slot \"%s\" successfully dropped\n",
|
|
slot_name);
|
|
|
|
return true;
|
|
}
|
|
|
|
|
|
bool
|
|
start_backup(PGconn *conn, char *first_wal_segment, bool fast_checkpoint)
|
|
{
|
|
char sqlquery[QUERY_STR_LEN];
|
|
PGresult *res;
|
|
|
|
sqlquery_snprintf(sqlquery,
|
|
"SELECT pg_catalog.pg_xlogfile_name(pg_catalog.pg_start_backup('repmgr_standby_clone_%ld', %s))",
|
|
time(NULL),
|
|
fast_checkpoint ? "TRUE" : "FALSE");
|
|
|
|
log_verbose(LOG_DEBUG, "start_backup():\n%s\n", sqlquery);
|
|
|
|
res = PQexec(conn, sqlquery);
|
|
if (PQresultStatus(res) != PGRES_TUPLES_OK)
|
|
{
|
|
log_err(_("unable to start backup: %s\n"), PQerrorMessage(conn));
|
|
PQclear(res);
|
|
return false;
|
|
}
|
|
|
|
if (first_wal_segment != NULL)
|
|
{
|
|
char *first_wal_seg_pq = PQgetvalue(res, 0, 0);
|
|
size_t buf_sz = strlen(first_wal_seg_pq);
|
|
|
|
first_wal_segment = pg_malloc0(buf_sz + 1);
|
|
xsnprintf(first_wal_segment, buf_sz + 1, "%s", first_wal_seg_pq);
|
|
}
|
|
|
|
PQclear(res);
|
|
|
|
return true;
|
|
}
|
|
|
|
|
|
bool
|
|
stop_backup(PGconn *conn, char *last_wal_segment)
|
|
{
|
|
char sqlquery[QUERY_STR_LEN];
|
|
PGresult *res;
|
|
|
|
sqlquery_snprintf(sqlquery, "SELECT pg_catalog.pg_xlogfile_name(pg_catalog.pg_stop_backup())");
|
|
|
|
res = PQexec(conn, sqlquery);
|
|
if (PQresultStatus(res) != PGRES_TUPLES_OK)
|
|
{
|
|
log_err(_("unable to stop backup: %s\n"), PQerrorMessage(conn));
|
|
PQclear(res);
|
|
return false;
|
|
}
|
|
|
|
if (last_wal_segment != NULL)
|
|
{
|
|
char *last_wal_seg_pq = PQgetvalue(res, 0, 0);
|
|
size_t buf_sz = strlen(last_wal_seg_pq);
|
|
|
|
last_wal_segment = pg_malloc0(buf_sz + 1);
|
|
xsnprintf(last_wal_segment, buf_sz + 1, "%s", last_wal_seg_pq);
|
|
}
|
|
|
|
PQclear(res);
|
|
|
|
return true;
|
|
}
|
|
|
|
|
|
bool
|
|
set_config_bool(PGconn *conn, const char *config_param, bool state)
|
|
{
|
|
char sqlquery[QUERY_STR_LEN];
|
|
PGresult *res;
|
|
|
|
sqlquery_snprintf(sqlquery,
|
|
"SET %s TO %s",
|
|
config_param,
|
|
state ? "TRUE" : "FALSE");
|
|
|
|
log_verbose(LOG_DEBUG, "set_config_bool():\n%s\n", sqlquery);
|
|
|
|
res = PQexec(conn, sqlquery);
|
|
|
|
if (PQresultStatus(res) != PGRES_COMMAND_OK)
|
|
{
|
|
log_err("unable to set '%s': %s\n", config_param, PQerrorMessage(conn));
|
|
PQclear(res);
|
|
return false;
|
|
}
|
|
|
|
PQclear(res);
|
|
|
|
return true;
|
|
}
|
|
|
|
|
|
/*
|
|
* witness_copy_node_records()
|
|
*
|
|
* Copy records in master's `repl_nodes` table to witness database
|
|
*
|
|
* This is used by `repmgr` when setting up the witness database, and
|
|
* `repmgrd` after a failover event occurs
|
|
*/
|
|
bool
|
|
witness_copy_node_records(PGconn *masterconn, PGconn *witnessconn, char *cluster_name)
|
|
{
|
|
char sqlquery[MAXLEN];
|
|
PGresult *res;
|
|
int i;
|
|
|
|
begin_transaction(witnessconn);
|
|
|
|
/* Defer constraints */
|
|
sqlquery_snprintf(sqlquery, "SET CONSTRAINTS ALL DEFERRED;");
|
|
log_verbose(LOG_DEBUG, "witness_copy_node_records():\n%s\n", sqlquery);
|
|
|
|
res = PQexec(witnessconn, sqlquery);
|
|
if (!res || PQresultStatus(res) != PGRES_COMMAND_OK)
|
|
{
|
|
log_err(_("Unable to defer constraints:\n%s\n"),
|
|
PQerrorMessage(witnessconn));
|
|
rollback_transaction(witnessconn);
|
|
|
|
return false;
|
|
}
|
|
|
|
/* Truncate existing records */
|
|
sqlquery_snprintf(sqlquery, "TRUNCATE TABLE %s.repl_nodes", get_repmgr_schema_quoted(witnessconn));
|
|
|
|
log_verbose(LOG_DEBUG, "witness_copy_node_records():\n%s\n", sqlquery);
|
|
|
|
res = PQexec(witnessconn, sqlquery);
|
|
if (!res || PQresultStatus(res) != PGRES_COMMAND_OK)
|
|
{
|
|
log_err(_("Unable to truncate witness servers's repl_nodes table:\n%s\n"),
|
|
PQerrorMessage(witnessconn));
|
|
rollback_transaction(witnessconn);
|
|
|
|
return false;
|
|
}
|
|
|
|
/* Get current records from primary */
|
|
sqlquery_snprintf(sqlquery,
|
|
"SELECT id, type, upstream_node_id, name, conninfo, priority, slot_name, active FROM %s.repl_nodes",
|
|
get_repmgr_schema_quoted(masterconn));
|
|
|
|
log_verbose(LOG_DEBUG, "witness_copy_node_records():\n%s\n", sqlquery);
|
|
|
|
res = PQexec(masterconn, sqlquery);
|
|
if (PQresultStatus(res) != PGRES_TUPLES_OK)
|
|
{
|
|
log_err("Unable to retrieve node records from master:\n%s\n",
|
|
PQerrorMessage(masterconn));
|
|
PQclear(res);
|
|
rollback_transaction(witnessconn);
|
|
|
|
return false;
|
|
}
|
|
|
|
/* Insert primary records into witness table */
|
|
for (i = 0; i < PQntuples(res); i++)
|
|
{
|
|
bool node_record_created;
|
|
|
|
log_verbose(LOG_DEBUG,
|
|
"witness_copy_node_records(): writing node record for node %s (id: %s)\n",
|
|
PQgetvalue(res, i, 3),
|
|
PQgetvalue(res, i, 0));
|
|
|
|
node_record_created = create_node_record(witnessconn,
|
|
"witness_copy_node_records",
|
|
atoi(PQgetvalue(res, i, 0)),
|
|
PQgetvalue(res, i, 1),
|
|
strlen(PQgetvalue(res, i, 2))
|
|
? atoi(PQgetvalue(res, i, 2))
|
|
: NO_UPSTREAM_NODE,
|
|
cluster_name,
|
|
PQgetvalue(res, i, 3),
|
|
PQgetvalue(res, i, 4),
|
|
atoi(PQgetvalue(res, i, 5)),
|
|
strlen(PQgetvalue(res, i, 6))
|
|
? PQgetvalue(res, i, 6)
|
|
: NULL,
|
|
(strcmp(PQgetvalue(res, i, 7), "t") == 0)
|
|
? true
|
|
: false
|
|
);
|
|
|
|
if (node_record_created == false)
|
|
{
|
|
PQclear(res);
|
|
|
|
log_err("Unable to copy node record to witness database\n%s\n",
|
|
PQerrorMessage(witnessconn));
|
|
rollback_transaction(witnessconn);
|
|
|
|
return false;
|
|
}
|
|
}
|
|
PQclear(res);
|
|
|
|
/* And finished */
|
|
commit_transaction(witnessconn);
|
|
|
|
return true;
|
|
}
|
|
|
|
|
|
/*
|
|
* create_node_record()
|
|
*
|
|
* Create an entry in the `repl_nodes` table.
|
|
*
|
|
* XXX we should pass the record parameters as a struct.
|
|
*/
|
|
bool
|
|
create_node_record(PGconn *conn, char *action, int node, char *type, int upstream_node, char *cluster_name, char *node_name, char *conninfo, int priority, char *slot_name, bool active)
|
|
{
|
|
char sqlquery[QUERY_STR_LEN];
|
|
char upstream_node_id[MAXLEN];
|
|
char slot_name_buf[MAXLEN];
|
|
PGresult *res;
|
|
|
|
if (upstream_node == NO_UPSTREAM_NODE)
|
|
{
|
|
/*
|
|
* No explicit upstream node id provided for standby - attempt to
|
|
* get primary node id
|
|
*/
|
|
if (strcmp(type, "standby") == 0)
|
|
{
|
|
int primary_node_id = get_master_node_id(conn, cluster_name);
|
|
maxlen_snprintf(upstream_node_id, "%i", primary_node_id);
|
|
}
|
|
else
|
|
{
|
|
maxlen_snprintf(upstream_node_id, "%s", "NULL");
|
|
}
|
|
}
|
|
else
|
|
{
|
|
maxlen_snprintf(upstream_node_id, "%i", upstream_node);
|
|
}
|
|
|
|
if (slot_name != NULL && slot_name[0])
|
|
{
|
|
maxlen_snprintf(slot_name_buf, "'%s'", slot_name);
|
|
}
|
|
else
|
|
{
|
|
maxlen_snprintf(slot_name_buf, "%s", "NULL");
|
|
}
|
|
|
|
/* XXX convert to placeholder query */
|
|
sqlquery_snprintf(sqlquery,
|
|
"INSERT INTO %s.repl_nodes "
|
|
" (id, type, upstream_node_id, cluster, "
|
|
" name, conninfo, slot_name, priority, active) "
|
|
"VALUES (%i, '%s', %s, '%s', '%s', '%s', %s, %i, %s) ",
|
|
get_repmgr_schema_quoted(conn),
|
|
node,
|
|
type,
|
|
upstream_node_id,
|
|
cluster_name,
|
|
node_name,
|
|
conninfo,
|
|
slot_name_buf,
|
|
priority,
|
|
active == true ? "TRUE" : "FALSE");
|
|
|
|
log_verbose(LOG_DEBUG, "create_node_record(): %s\n", sqlquery);
|
|
|
|
if (action != NULL)
|
|
{
|
|
log_verbose(LOG_DEBUG, "create_node_record(): action is \"%s\"\n", action);
|
|
}
|
|
|
|
res = PQexec(conn, sqlquery);
|
|
if (!res || PQresultStatus(res) != PGRES_COMMAND_OK)
|
|
{
|
|
log_err(_("Unable to create node record\n%s\n"),
|
|
PQerrorMessage(conn));
|
|
PQclear(res);
|
|
return false;
|
|
}
|
|
|
|
PQclear(res);
|
|
|
|
return true;
|
|
}
|
|
|
|
|
|
bool
|
|
delete_node_record(PGconn *conn, int node, char *action)
|
|
{
|
|
char sqlquery[QUERY_STR_LEN];
|
|
PGresult *res;
|
|
|
|
sqlquery_snprintf(sqlquery,
|
|
"DELETE FROM %s.repl_nodes "
|
|
" WHERE id = %d",
|
|
get_repmgr_schema_quoted(conn),
|
|
node);
|
|
|
|
log_verbose(LOG_DEBUG, "delete_node_record(): %s\n", sqlquery);
|
|
|
|
if (action != NULL)
|
|
{
|
|
log_verbose(LOG_DEBUG, "delete_node_record(): action is \"%s\"\n", action);
|
|
}
|
|
|
|
res = PQexec(conn, sqlquery);
|
|
if (!res || PQresultStatus(res) != PGRES_COMMAND_OK)
|
|
{
|
|
log_err(_("Unable to delete node record: %s\n"),
|
|
PQerrorMessage(conn));
|
|
PQclear(res);
|
|
return false;
|
|
}
|
|
|
|
PQclear(res);
|
|
return true;
|
|
}
|
|
|
|
|
|
/*
|
|
* create_event_record()
|
|
*
|
|
* If `conn` is not NULL, insert a record into the events table.
|
|
*
|
|
* If configuration parameter `event_notification_command` is set, also
|
|
* attempt to execute that command.
|
|
*
|
|
* Returns true if all operations succeeded, false if one or more failed.
|
|
*
|
|
* Note this function may be called with `conn` set to NULL in cases where
|
|
* the master node is not available and it's therefore not possible to write
|
|
* an event record. In this case, if `event_notification_command` is set, a
|
|
* user-defined notification to be generated; if not, this function will have
|
|
* no effect.
|
|
*/
|
|
|
|
bool
|
|
create_event_record(PGconn *conn, t_configuration_options *options, int node_id, char *event, bool successful, char *details)
|
|
{
|
|
char sqlquery[QUERY_STR_LEN];
|
|
PGresult *res;
|
|
char event_timestamp[MAXLEN] = "";
|
|
bool success = true;
|
|
struct tm ts;
|
|
|
|
/* Only attempt to write a record if a connection handle was provided.
|
|
Also check that the repmgr schema has been properly intialised - if
|
|
not it means no configuration file was provided, which can happen with
|
|
e.g. `repmgr standby clone`, and we won't know which schema to write to.
|
|
*/
|
|
if (conn != NULL && strcmp(repmgr_schema, DEFAULT_REPMGR_SCHEMA_PREFIX) != 0)
|
|
{
|
|
int n_node_id = htonl(node_id);
|
|
char *t_successful = successful ? "TRUE" : "FALSE";
|
|
|
|
const char *values[4] = { (char *)&n_node_id,
|
|
event,
|
|
t_successful,
|
|
details
|
|
};
|
|
|
|
int lengths[4] = { sizeof(n_node_id),
|
|
0,
|
|
0,
|
|
0
|
|
};
|
|
|
|
int binary[4] = {1, 0, 0, 0};
|
|
|
|
sqlquery_snprintf(sqlquery,
|
|
" INSERT INTO %s.repl_events ( "
|
|
" node_id, "
|
|
" event, "
|
|
" successful, "
|
|
" details "
|
|
" ) "
|
|
" VALUES ($1, $2, $3, $4) "
|
|
" RETURNING event_timestamp ",
|
|
get_repmgr_schema_quoted(conn));
|
|
|
|
log_verbose(LOG_DEBUG, "create_event_record():\n%s\n", sqlquery);
|
|
|
|
res = PQexecParams(conn,
|
|
sqlquery,
|
|
4,
|
|
NULL,
|
|
values,
|
|
lengths,
|
|
binary,
|
|
0);
|
|
|
|
if (!res || PQresultStatus(res) != PGRES_TUPLES_OK)
|
|
{
|
|
log_warning(_("Unable to create event record: %s\n"),
|
|
PQerrorMessage(conn));
|
|
|
|
success = false;
|
|
|
|
}
|
|
else
|
|
{
|
|
/* Store timestamp to send to the notification command */
|
|
strncpy(event_timestamp, PQgetvalue(res, 0, 0), MAXLEN);
|
|
log_verbose(LOG_DEBUG, "create_event_record(): Event timestamp is \"%s\"\n", event_timestamp);
|
|
}
|
|
|
|
PQclear(res);
|
|
}
|
|
|
|
/*
|
|
* If no database connection provided, or the query failed, generate a
|
|
* current timestamp ourselves. This isn't quite the same
|
|
* format as PostgreSQL, but is close enough for diagnostic use.
|
|
*/
|
|
if (!strlen(event_timestamp))
|
|
{
|
|
time_t now;
|
|
|
|
time(&now);
|
|
ts = *localtime(&now);
|
|
strftime(event_timestamp, MAXLEN, "%Y-%m-%d %H:%M:%S%z", &ts);
|
|
}
|
|
|
|
/* an event notification command was provided - parse and execute it */
|
|
if (strlen(options->event_notification_command))
|
|
{
|
|
char parsed_command[MAXPGPATH];
|
|
const char *src_ptr;
|
|
char *dst_ptr;
|
|
char *end_ptr;
|
|
int r;
|
|
|
|
/*
|
|
* If configuration option 'event_notifications' was provided,
|
|
* check if this event is one of the ones listed; if not listed,
|
|
* don't execute the notification script.
|
|
*
|
|
* (If 'event_notifications' was not provided, we assume the script
|
|
* should be executed for all events).
|
|
*/
|
|
if (options->event_notifications.head != NULL)
|
|
{
|
|
EventNotificationListCell *cell;
|
|
bool notify_ok = false;
|
|
|
|
for (cell = options->event_notifications.head; cell; cell = cell->next)
|
|
{
|
|
if (strcmp(event, cell->event_type) == 0)
|
|
{
|
|
notify_ok = true;
|
|
break;
|
|
}
|
|
}
|
|
|
|
/*
|
|
* Event type not found in the 'event_notifications' list - return early
|
|
*/
|
|
if (notify_ok == false)
|
|
{
|
|
log_debug(_("Not executing notification script for event type '%s'\n"), event);
|
|
return success;
|
|
}
|
|
}
|
|
|
|
dst_ptr = parsed_command;
|
|
end_ptr = parsed_command + MAXPGPATH - 1;
|
|
*end_ptr = '\0';
|
|
|
|
for(src_ptr = options->event_notification_command; *src_ptr; src_ptr++)
|
|
{
|
|
if (*src_ptr == '%')
|
|
{
|
|
switch (src_ptr[1])
|
|
{
|
|
case 'n':
|
|
/* %n: node id */
|
|
src_ptr++;
|
|
snprintf(dst_ptr, end_ptr - dst_ptr, "%i", node_id);
|
|
dst_ptr += strlen(dst_ptr);
|
|
break;
|
|
case 'e':
|
|
/* %e: event type */
|
|
src_ptr++;
|
|
strlcpy(dst_ptr, event, end_ptr - dst_ptr);
|
|
dst_ptr += strlen(dst_ptr);
|
|
break;
|
|
case 'd':
|
|
/* %d: details */
|
|
src_ptr++;
|
|
if (details != NULL)
|
|
{
|
|
strlcpy(dst_ptr, details, end_ptr - dst_ptr);
|
|
dst_ptr += strlen(dst_ptr);
|
|
}
|
|
break;
|
|
case 's':
|
|
/* %s: successful */
|
|
src_ptr++;
|
|
strlcpy(dst_ptr, successful ? "1" : "0", end_ptr - dst_ptr);
|
|
dst_ptr += strlen(dst_ptr);
|
|
break;
|
|
case 't':
|
|
/* %: timestamp */
|
|
src_ptr++;
|
|
strlcpy(dst_ptr, event_timestamp, end_ptr - dst_ptr);
|
|
dst_ptr += strlen(dst_ptr);
|
|
break;
|
|
default:
|
|
/* otherwise treat the % as not special */
|
|
if (dst_ptr < end_ptr)
|
|
*dst_ptr++ = *src_ptr;
|
|
break;
|
|
}
|
|
}
|
|
else
|
|
{
|
|
if (dst_ptr < end_ptr)
|
|
*dst_ptr++ = *src_ptr;
|
|
}
|
|
}
|
|
|
|
*dst_ptr = '\0';
|
|
|
|
log_debug("create_event_record(): executing\n%s\n", parsed_command);
|
|
|
|
r = system(parsed_command);
|
|
if (r != 0)
|
|
{
|
|
log_warning(_("Unable to execute event notification command\n"));
|
|
log_info(_("Parsed event notification command was:\n%s\n"), parsed_command);
|
|
success = false;
|
|
}
|
|
}
|
|
|
|
return success;
|
|
}
|
|
|
|
|
|
/*
|
|
* Update node record following change of status
|
|
* (e.g. inactive primary converted to standby)
|
|
*/
|
|
bool
|
|
update_node_record_status(PGconn *conn, char *cluster_name, int this_node_id, char *type, int upstream_node_id, bool active)
|
|
{
|
|
PGresult *res;
|
|
char sqlquery[QUERY_STR_LEN];
|
|
|
|
sqlquery_snprintf(sqlquery,
|
|
" UPDATE %s.repl_nodes "
|
|
" SET type = '%s', "
|
|
" upstream_node_id = %i, "
|
|
" active = %s "
|
|
" WHERE cluster = '%s' "
|
|
" AND id = %i ",
|
|
get_repmgr_schema_quoted(conn),
|
|
type,
|
|
upstream_node_id,
|
|
active ? "TRUE" : "FALSE",
|
|
cluster_name,
|
|
this_node_id);
|
|
|
|
log_verbose(LOG_DEBUG, "update_node_record_status():\n%s\n", sqlquery);
|
|
|
|
res = PQexec(conn, sqlquery);
|
|
|
|
if (PQresultStatus(res) != PGRES_COMMAND_OK)
|
|
{
|
|
log_err(_("Unable to update node record: %s\n"),
|
|
PQerrorMessage(conn));
|
|
PQclear(res);
|
|
|
|
return false;
|
|
}
|
|
|
|
PQclear(res);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
bool
|
|
update_node_record_set_upstream(PGconn *conn, char *cluster_name, int this_node_id, int new_upstream_node_id)
|
|
{
|
|
PGresult *res;
|
|
char sqlquery[QUERY_STR_LEN];
|
|
|
|
log_debug(_("update_node_record_set_upstream(): Updating node %i's upstream node to %i\n"), this_node_id, new_upstream_node_id);
|
|
|
|
sqlquery_snprintf(sqlquery,
|
|
" UPDATE %s.repl_nodes "
|
|
" SET upstream_node_id = %i "
|
|
" WHERE cluster = '%s' "
|
|
" AND id = %i ",
|
|
get_repmgr_schema_quoted(conn),
|
|
new_upstream_node_id,
|
|
cluster_name,
|
|
this_node_id);
|
|
|
|
log_verbose(LOG_DEBUG, "update_node_record_set_upstream():\n%s\n", sqlquery);
|
|
|
|
res = PQexec(conn, sqlquery);
|
|
|
|
if (PQresultStatus(res) != PGRES_COMMAND_OK)
|
|
{
|
|
log_err(_("Unable to set new upstream node id: %s\n"),
|
|
PQerrorMessage(conn));
|
|
PQclear(res);
|
|
|
|
return false;
|
|
}
|
|
|
|
PQclear(res);
|
|
|
|
return true;
|
|
}
|
|
|
|
|
|
int
|
|
get_node_record(PGconn *conn, char *cluster, int node_id, t_node_info *node_info)
|
|
{
|
|
char sqlquery[QUERY_STR_LEN];
|
|
int result;
|
|
|
|
sqlquery_snprintf(
|
|
sqlquery,
|
|
"SELECT id, type, upstream_node_id, name, conninfo, slot_name, priority, active"
|
|
" FROM %s.repl_nodes "
|
|
" WHERE cluster = '%s' "
|
|
" AND id = %i",
|
|
get_repmgr_schema_quoted(conn),
|
|
cluster,
|
|
node_id);
|
|
|
|
log_verbose(LOG_DEBUG, "get_node_record():\n%s\n", sqlquery);
|
|
|
|
result = _get_node_record(conn, cluster, sqlquery, node_info);
|
|
|
|
if (result == 0)
|
|
{
|
|
log_verbose(LOG_DEBUG, "get_node_record(): no record found for node %i\n", node_id);
|
|
}
|
|
|
|
return result;
|
|
}
|
|
|
|
int
|
|
get_node_record_by_name(PGconn *conn, char *cluster, const char *node_name, t_node_info *node_info)
|
|
{
|
|
char sqlquery[QUERY_STR_LEN];
|
|
int result;
|
|
|
|
sqlquery_snprintf(
|
|
sqlquery,
|
|
"SELECT id, type, upstream_node_id, name, conninfo, slot_name, priority, active"
|
|
" FROM %s.repl_nodes "
|
|
" WHERE cluster = '%s' "
|
|
" AND name = '%s'",
|
|
get_repmgr_schema_quoted(conn),
|
|
cluster,
|
|
node_name);
|
|
|
|
log_verbose(LOG_DEBUG, "get_node_record_by_name():\n%s\n", sqlquery);
|
|
|
|
result = _get_node_record(conn, cluster, sqlquery, node_info);
|
|
|
|
if (result == 0)
|
|
{
|
|
log_verbose(LOG_DEBUG, "get_node_record(): no record found for node %s\n", node_name);
|
|
}
|
|
|
|
return result;
|
|
}
|
|
|
|
|
|
static int
|
|
_get_node_record(PGconn *conn, char *cluster, char *sqlquery, t_node_info *node_info)
|
|
{
|
|
int ntuples;
|
|
PGresult *res;
|
|
|
|
res = PQexec(conn, sqlquery);
|
|
if (PQresultStatus(res) != PGRES_TUPLES_OK)
|
|
{
|
|
return -1;
|
|
}
|
|
|
|
ntuples = PQntuples(res);
|
|
|
|
if (ntuples == 0)
|
|
{
|
|
return 0;
|
|
}
|
|
|
|
node_info->node_id = atoi(PQgetvalue(res, 0, 0));
|
|
node_info->type = parse_node_type(PQgetvalue(res, 0, 1));
|
|
node_info->upstream_node_id = atoi(PQgetvalue(res, 0, 2));
|
|
strncpy(node_info->name, PQgetvalue(res, 0, 3), MAXLEN);
|
|
strncpy(node_info->conninfo_str, PQgetvalue(res, 0, 4), MAXLEN);
|
|
strncpy(node_info->slot_name, PQgetvalue(res, 0, 5), MAXLEN);
|
|
node_info->priority = atoi(PQgetvalue(res, 0, 6));
|
|
node_info->active = (strcmp(PQgetvalue(res, 0, 7), "t") == 0)
|
|
? true
|
|
: false;
|
|
|
|
PQclear(res);
|
|
|
|
return ntuples;
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
int
|
|
get_node_replication_state(PGconn *conn, char *node_name, char *output)
|
|
{
|
|
char sqlquery[QUERY_STR_LEN];
|
|
PGresult * res;
|
|
|
|
sqlquery_snprintf(
|
|
sqlquery,
|
|
" SELECT state "
|
|
" FROM pg_catalog.pg_stat_replication"
|
|
" WHERE application_name = '%s'",
|
|
node_name
|
|
);
|
|
|
|
res = PQexec(conn, sqlquery);
|
|
|
|
if (PQresultStatus(res) != PGRES_TUPLES_OK)
|
|
{
|
|
PQclear(res);
|
|
return -1;
|
|
}
|
|
|
|
if (PQntuples(res) == 0)
|
|
{
|
|
PQclear(res);
|
|
return 0;
|
|
}
|
|
|
|
strncpy(output, PQgetvalue(res, 0, 0), MAXLEN);
|
|
PQclear(res);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
t_server_type
|
|
parse_node_type(const char *type)
|
|
{
|
|
if (strcmp(type, "master") == 0)
|
|
{
|
|
return MASTER;
|
|
}
|
|
else if (strcmp(type, "standby") == 0)
|
|
{
|
|
return STANDBY;
|
|
}
|
|
else if (strcmp(type, "witness") == 0)
|
|
{
|
|
return WITNESS;
|
|
}
|
|
|
|
return UNKNOWN;
|
|
}
|
|
|
|
|
|
int
|
|
get_data_checksum_version(const char *data_directory)
|
|
{
|
|
ControlFileData control_file;
|
|
int fd;
|
|
char control_file_path[MAXPGPATH];
|
|
|
|
snprintf(control_file_path, MAXPGPATH, "%s/global/pg_control", data_directory);
|
|
if ((fd = open(control_file_path, O_RDONLY | PG_BINARY, 0)) == -1)
|
|
{
|
|
log_err(_("Unable to open control file \"%s\" for reading: %s\n"),
|
|
control_file_path, strerror(errno));
|
|
return -1;
|
|
}
|
|
|
|
if (read(fd, &control_file, sizeof(ControlFileData)) != sizeof(ControlFileData))
|
|
{
|
|
log_err(_("could not read file \"%s\": %s\n"),
|
|
control_file_path, strerror(errno));
|
|
close(fd);
|
|
return -1;
|
|
}
|
|
|
|
close(fd);
|
|
|
|
return (int)control_file.data_checksum_version;
|
|
}
|