
Tracking how many times the monitor has performed its monitoring allows the test framework to consistently wait for an event instead of waiting for a hard-coded time period. The MaxCtrl `api get` command can be used to easily extract the numeric value.
367 lines
9.1 KiB
C++
367 lines
9.1 KiB
C++
/*
|
|
* Copyright (c) 2016 MariaDB Corporation Ab
|
|
*
|
|
* Use of this software is governed by the Business Source License included
|
|
* in the LICENSE.TXT file and at www.mariadb.com/bsl11.
|
|
*
|
|
* Change Date: 2020-01-01
|
|
*
|
|
* On the date above, in accordance with the Business Source License, use
|
|
* of this software will be governed by version 2 or later of the General
|
|
* Public License.
|
|
*/
|
|
|
|
/**
|
|
* @file A MySQL Group Replication cluster monitor
|
|
*/
|
|
|
|
#define MXS_MODULE_NAME "grmon"
|
|
|
|
#include <maxscale/cppdefs.hh>
|
|
|
|
#include <new>
|
|
#include <string>
|
|
|
|
#include <maxscale/monitor.h>
|
|
#include <maxscale/thread.h>
|
|
#include <maxscale/protocol/mysql.h>
|
|
#include <mysqld_error.h>
|
|
|
|
/**
|
|
* The instance of a Group Replication Monitor
|
|
*/
|
|
struct GRMon
|
|
{
|
|
GRMon(const GRMon&);
|
|
GRMon& operator&(const GRMon&);
|
|
public:
|
|
static GRMon* create(MXS_MONITOR* monitor, const MXS_CONFIG_PARAMETER* params);
|
|
void stop();
|
|
~GRMon();
|
|
|
|
private:
|
|
THREAD m_thread; /**< Monitor thread */
|
|
int m_shutdown; /**< Flag to shutdown the monitor thread */
|
|
MXS_MONITORED_SERVER* m_master; /**< The master server */
|
|
std::string m_script;
|
|
uint64_t m_events; /**< Enabled events */
|
|
MXS_MONITOR* m_monitor;
|
|
|
|
GRMon(MXS_MONITOR* monitor, const MXS_CONFIG_PARAMETER *params);
|
|
|
|
void main();
|
|
static void main(void* data);
|
|
};
|
|
|
|
GRMon::GRMon(MXS_MONITOR* monitor, const MXS_CONFIG_PARAMETER* params):
|
|
m_shutdown(0),
|
|
m_master(NULL),
|
|
m_script(config_get_string(params, "script")),
|
|
m_events(config_get_enum(params, "events", mxs_monitor_event_enum_values)),
|
|
m_monitor(monitor)
|
|
{
|
|
}
|
|
|
|
GRMon::~GRMon()
|
|
{
|
|
}
|
|
|
|
GRMon* GRMon::create(MXS_MONITOR* monitor, const MXS_CONFIG_PARAMETER* params)
|
|
{
|
|
GRMon* mon;
|
|
MXS_EXCEPTION_GUARD(mon = new GRMon(monitor, params));
|
|
|
|
if (mon && thread_start(&mon->m_thread, GRMon::main, mon, 0) == NULL)
|
|
{
|
|
delete mon;
|
|
mon = NULL;
|
|
}
|
|
|
|
return mon;
|
|
}
|
|
|
|
void GRMon::main(void* data)
|
|
{
|
|
GRMon* mon = (GRMon*)data;
|
|
mon->main();
|
|
}
|
|
|
|
void GRMon::stop()
|
|
{
|
|
atomic_store_int32(&m_shutdown, 1);
|
|
thread_wait(m_thread);
|
|
}
|
|
|
|
/**
|
|
* Start the instance of the monitor, returning a handle on the monitor.
|
|
*
|
|
* This function creates a thread to execute the actual monitoring.
|
|
*
|
|
* @return A handle to use when interacting with the monitor
|
|
*/
|
|
static void *
|
|
startMonitor(MXS_MONITOR *mon, const MXS_CONFIG_PARAMETER *params)
|
|
{
|
|
return GRMon::create(mon, params);
|
|
}
|
|
|
|
/**
|
|
* Stop a running monitor
|
|
*
|
|
* @param arg Handle on thr running monior
|
|
*/
|
|
static void
|
|
stopMonitor(MXS_MONITOR *mon)
|
|
{
|
|
GRMon *handle = (GRMon *) mon->handle;
|
|
handle->stop();
|
|
delete handle;
|
|
mon->handle = NULL;
|
|
}
|
|
|
|
/**
|
|
* Diagnostic interface
|
|
*
|
|
* @param dcb DCB to send output
|
|
* @param arg The monitor handle
|
|
*/
|
|
static void
|
|
diagnostics(DCB *dcb, const MXS_MONITOR *mon)
|
|
{
|
|
}
|
|
|
|
/**
|
|
* Diagnostic interface
|
|
*
|
|
* @param arg The monitor handle
|
|
*/
|
|
static json_t* diagnostics_json(const MXS_MONITOR *mon)
|
|
{
|
|
return NULL;
|
|
}
|
|
|
|
static inline bool is_false(const char* value)
|
|
{
|
|
return strcasecmp(value, "0") == 0 ||
|
|
strcasecmp(value, "no") == 0 ||
|
|
strcasecmp(value, "off") == 0 ||
|
|
strcasecmp(value, "false") == 0;
|
|
}
|
|
|
|
static bool is_master(MXS_MONITORED_SERVER* server)
|
|
{
|
|
bool rval = false;
|
|
MYSQL_RES* result;
|
|
const char* master_query =
|
|
"SELECT VARIABLE_VALUE, @@server_uuid, @@read_only FROM performance_schema.global_status "
|
|
"WHERE VARIABLE_NAME= 'group_replication_primary_member'";
|
|
|
|
if (mysql_query(server->con, master_query) == 0 && (result = mysql_store_result(server->con)))
|
|
{
|
|
for (MYSQL_ROW row = mysql_fetch_row(result); row; row = mysql_fetch_row(result))
|
|
{
|
|
if (strcasecmp(row[0], row[1]) == 0 && is_false(row[2]))
|
|
{
|
|
rval = true;
|
|
}
|
|
}
|
|
mysql_free_result(result);
|
|
}
|
|
else
|
|
{
|
|
mon_report_query_error(server);
|
|
}
|
|
|
|
return rval;
|
|
}
|
|
|
|
static bool is_slave(MXS_MONITORED_SERVER* server)
|
|
{
|
|
bool rval = false;
|
|
MYSQL_RES* result;
|
|
const char slave_query[] = "SELECT MEMBER_STATE FROM "
|
|
"performance_schema.replication_group_members "
|
|
"WHERE MEMBER_ID = @@server_uuid";
|
|
|
|
if (mysql_query(server->con, slave_query) == 0 && (result = mysql_store_result(server->con)))
|
|
{
|
|
for (MYSQL_ROW row = mysql_fetch_row(result); row; row = mysql_fetch_row(result))
|
|
{
|
|
if (strcasecmp(row[0], "ONLINE") == 0)
|
|
{
|
|
rval = true;
|
|
}
|
|
}
|
|
mysql_free_result(result);
|
|
}
|
|
else
|
|
{
|
|
mon_report_query_error(server);
|
|
}
|
|
|
|
return rval;
|
|
}
|
|
|
|
static void update_server_status(MXS_MONITOR* monitor, MXS_MONITORED_SERVER* server)
|
|
{
|
|
/* Don't even probe server flagged as in maintenance */
|
|
if (SERVER_IN_MAINT(server->server))
|
|
{
|
|
return;
|
|
}
|
|
|
|
/** Store previous status */
|
|
server->mon_prev_status = server->server->status;
|
|
|
|
mxs_connect_result_t rval = mon_ping_or_connect_to_db(monitor, server);
|
|
|
|
if (rval != MONITOR_CONN_OK)
|
|
{
|
|
if (mysql_errno(server->con) == ER_ACCESS_DENIED_ERROR)
|
|
{
|
|
server_set_status_nolock(server->server, SERVER_AUTH_ERROR);
|
|
}
|
|
else
|
|
{
|
|
server_clear_status_nolock(server->server, SERVER_AUTH_ERROR);
|
|
}
|
|
|
|
server->server->node_id = -1;
|
|
|
|
server_clear_status_nolock(server->server, SERVER_RUNNING);
|
|
|
|
if (mon_status_changed(server) && mon_print_fail_status(server))
|
|
{
|
|
mon_log_connect_error(server, rval);
|
|
}
|
|
}
|
|
else
|
|
{
|
|
/* If we get this far then we have a working connection */
|
|
server_set_status_nolock(server->server, SERVER_RUNNING);
|
|
}
|
|
|
|
if (is_master(server))
|
|
{
|
|
server_set_status_nolock(server->server, SERVER_MASTER);
|
|
server_clear_status_nolock(server->server, SERVER_SLAVE);
|
|
}
|
|
else if (is_slave(server))
|
|
{
|
|
server_set_status_nolock(server->server, SERVER_SLAVE);
|
|
server_clear_status_nolock(server->server, SERVER_MASTER);
|
|
}
|
|
else
|
|
{
|
|
server_clear_status_nolock(server->server, SERVER_SLAVE);
|
|
server_clear_status_nolock(server->server, SERVER_MASTER);
|
|
}
|
|
}
|
|
|
|
void GRMon::main()
|
|
{
|
|
if (mysql_thread_init())
|
|
{
|
|
MXS_ERROR("mysql_thread_init failed. Exiting.");
|
|
return;
|
|
}
|
|
|
|
load_server_journal(m_monitor, NULL);
|
|
|
|
while (!m_shutdown)
|
|
{
|
|
atomic_add_uint64(&m_monitor->ticks, 1);
|
|
lock_monitor_servers(m_monitor);
|
|
servers_status_pending_to_current(m_monitor);
|
|
|
|
for (MXS_MONITORED_SERVER *ptr = m_monitor->monitored_servers; ptr; ptr = ptr->next)
|
|
{
|
|
update_server_status(m_monitor, ptr);
|
|
}
|
|
|
|
mon_hangup_failed_servers(m_monitor);
|
|
/**
|
|
* After updating the status of all servers, check if monitor events
|
|
* need to be launched.
|
|
*/
|
|
mon_process_state_changes(m_monitor,
|
|
m_script.empty() ? NULL : m_script.c_str(),
|
|
m_events);
|
|
|
|
servers_status_current_to_pending(m_monitor);
|
|
store_server_journal(m_monitor, NULL);
|
|
release_monitor_servers(m_monitor);
|
|
|
|
/** Sleep until the next monitoring interval */
|
|
size_t ms = 0;
|
|
while (ms < m_monitor->interval && !m_shutdown)
|
|
{
|
|
if (m_monitor->server_pending_changes)
|
|
{
|
|
// Admin has changed something, skip sleep
|
|
break;
|
|
}
|
|
thread_millisleep(MXS_MON_BASE_INTERVAL_MS);
|
|
ms += MXS_MON_BASE_INTERVAL_MS;
|
|
}
|
|
}
|
|
|
|
mysql_thread_end();
|
|
}
|
|
|
|
extern "C"
|
|
{
|
|
/**
|
|
* The module entry point routine. It is this routine that
|
|
* must populate the structure that is referred to as the
|
|
* "module object", this is a structure with the set of
|
|
* external entry points for this module.
|
|
*
|
|
* @return The module object
|
|
*/
|
|
MXS_MODULE* MXS_CREATE_MODULE()
|
|
{
|
|
static MXS_MONITOR_OBJECT MyObject =
|
|
{
|
|
startMonitor,
|
|
stopMonitor,
|
|
diagnostics,
|
|
diagnostics_json
|
|
};
|
|
|
|
static MXS_MODULE info =
|
|
{
|
|
MXS_MODULE_API_MONITOR,
|
|
MXS_MODULE_GA,
|
|
MXS_MONITOR_VERSION,
|
|
"A Group Replication cluster monitor",
|
|
"V1.0.0",
|
|
MXS_NO_MODULE_CAPABILITIES,
|
|
&MyObject,
|
|
NULL, /* Process init. */
|
|
NULL, /* Process finish. */
|
|
NULL, /* Thread init. */
|
|
NULL, /* Thread finish. */
|
|
{
|
|
{
|
|
"script",
|
|
MXS_MODULE_PARAM_PATH,
|
|
NULL,
|
|
MXS_MODULE_OPT_PATH_X_OK
|
|
},
|
|
{
|
|
"events",
|
|
MXS_MODULE_PARAM_ENUM,
|
|
MXS_MONITOR_EVENT_DEFAULT_VALUE,
|
|
MXS_MODULE_OPT_NONE,
|
|
mxs_monitor_event_enum_values
|
|
},
|
|
{MXS_END_MODULE_PARAMS}
|
|
}
|
|
};
|
|
|
|
return &info;
|
|
}
|
|
|
|
}
|