Esa Korhonen b29bae6e84 MXS-1865 Update server version only when (re)connecting
Updating it every iteration is needless.
2018-05-16 13:55:45 +03:00

332 lines
8.4 KiB
C++

/*
* Copyright (c) 2016 MariaDB Corporation Ab
*
* Use of this software is governed by the Business Source License included
* in the LICENSE.TXT file and at www.mariadb.com/bsl11.
*
* Change Date: 2020-01-01
*
* On the date above, in accordance with the Business Source License, use
* of this software will be governed by version 2 or later of the General
* Public License.
*/
/**
* @file A MySQL Group Replication cluster monitor
*/
#define MXS_MODULE_NAME "grmon"
#include <maxscale/cppdefs.hh>
#include <new>
#include <string>
#include <maxscale/monitor.hh>
#include <maxscale/thread.h>
#include <maxscale/protocol/mysql.h>
#include <mysqld_error.h>
/**
* The instance of a Group Replication Monitor
*/
struct GRMon : public MXS_MONITOR_INSTANCE
{
GRMon(const GRMon&);
GRMon& operator&(const GRMon&);
public:
static GRMon* create(MXS_MONITOR* monitor);
static void destroy(GRMon* monitor);
bool start(const MXS_CONFIG_PARAMETER* params);
void stop();
void diagnostics(DCB* dcb) const;
json_t* diagnostics_json() const;
private:
THREAD m_thread; /**< Monitor thread */
int m_shutdown; /**< Flag to shutdown the monitor thread */
MXS_MONITORED_SERVER* m_master; /**< The master server */
std::string m_script;
uint64_t m_events; /**< Enabled events */
MXS_MONITOR* m_monitor;
GRMon(MXS_MONITOR* monitor);
~GRMon();
void main();
static void main(void* data);
};
GRMon::GRMon(MXS_MONITOR* monitor):
m_shutdown(0),
m_master(NULL),
m_script(NULL),
m_events(0),
m_monitor(monitor)
{
}
GRMon::~GRMon()
{
}
GRMon* GRMon::create(MXS_MONITOR* monitor)
{
return new GRMon(monitor);
}
bool GRMon::start(const MXS_CONFIG_PARAMETER* params)
{
bool started = false;
m_shutdown = 0;
m_master = NULL;
m_script = config_get_string(params, "script");
m_events = config_get_enum(params, "events", mxs_monitor_event_enum_values);
m_thread = 0;
if (thread_start(&m_thread, GRMon::main, this, 0) != NULL)
{
started = true;
}
return started;
}
void GRMon::main(void* data)
{
GRMon* mon = (GRMon*)data;
mon->main();
}
void GRMon::stop()
{
ss_dassert(m_thread);
atomic_store_int32(&m_shutdown, 1);
thread_wait(m_thread);
m_thread = 0;
m_shutdown = 0;
}
void GRMon::diagnostics(DCB* dcb) const
{
}
json_t* GRMon::diagnostics_json() const
{
return NULL;
}
static inline bool is_false(const char* value)
{
return strcasecmp(value, "0") == 0 ||
strcasecmp(value, "no") == 0 ||
strcasecmp(value, "off") == 0 ||
strcasecmp(value, "false") == 0;
}
static bool is_master(MXS_MONITORED_SERVER* server)
{
bool rval = false;
MYSQL_RES* result;
const char* master_query =
"SELECT VARIABLE_VALUE, @@server_uuid, @@read_only FROM performance_schema.global_status "
"WHERE VARIABLE_NAME= 'group_replication_primary_member'";
if (mysql_query(server->con, master_query) == 0 && (result = mysql_store_result(server->con)))
{
for (MYSQL_ROW row = mysql_fetch_row(result); row; row = mysql_fetch_row(result))
{
if (strcasecmp(row[0], row[1]) == 0 && is_false(row[2]))
{
rval = true;
}
}
mysql_free_result(result);
}
else
{
mon_report_query_error(server);
}
return rval;
}
static bool is_slave(MXS_MONITORED_SERVER* server)
{
bool rval = false;
MYSQL_RES* result;
const char slave_query[] = "SELECT MEMBER_STATE FROM "
"performance_schema.replication_group_members "
"WHERE MEMBER_ID = @@server_uuid";
if (mysql_query(server->con, slave_query) == 0 && (result = mysql_store_result(server->con)))
{
for (MYSQL_ROW row = mysql_fetch_row(result); row; row = mysql_fetch_row(result))
{
if (strcasecmp(row[0], "ONLINE") == 0)
{
rval = true;
}
}
mysql_free_result(result);
}
else
{
mon_report_query_error(server);
}
return rval;
}
static void update_server_status(MXS_MONITOR* monitor, MXS_MONITORED_SERVER* server)
{
/* Don't even probe server flagged as in maintenance */
if (SERVER_IN_MAINT(server->server))
{
return;
}
/** Store previous status */
server->mon_prev_status = server->server->status;
mxs_connect_result_t rval = mon_ping_or_connect_to_db(monitor, server);
if (!mon_connection_is_ok(rval))
{
if (mysql_errno(server->con) == ER_ACCESS_DENIED_ERROR)
{
server_set_status_nolock(server->server, SERVER_AUTH_ERROR);
}
else
{
server_clear_status_nolock(server->server, SERVER_AUTH_ERROR);
}
server->server->node_id = -1;
server_clear_status_nolock(server->server, SERVER_RUNNING);
if (mon_status_changed(server) && mon_print_fail_status(server))
{
mon_log_connect_error(server, rval);
}
}
else
{
/* If we get this far then we have a working connection */
server_set_status_nolock(server->server, SERVER_RUNNING);
}
if (is_master(server))
{
server_set_status_nolock(server->server, SERVER_MASTER);
server_clear_status_nolock(server->server, SERVER_SLAVE);
}
else if (is_slave(server))
{
server_set_status_nolock(server->server, SERVER_SLAVE);
server_clear_status_nolock(server->server, SERVER_MASTER);
}
else
{
server_clear_status_nolock(server->server, SERVER_SLAVE);
server_clear_status_nolock(server->server, SERVER_MASTER);
}
}
void GRMon::main()
{
if (mysql_thread_init())
{
MXS_ERROR("mysql_thread_init failed. Exiting.");
return;
}
load_server_journal(m_monitor, NULL);
while (!m_shutdown)
{
lock_monitor_servers(m_monitor);
servers_status_pending_to_current(m_monitor);
for (MXS_MONITORED_SERVER *ptr = m_monitor->monitored_servers; ptr; ptr = ptr->next)
{
update_server_status(m_monitor, ptr);
}
mon_hangup_failed_servers(m_monitor);
/**
* After updating the status of all servers, check if monitor events
* need to be launched.
*/
mon_process_state_changes(m_monitor,
m_script.empty() ? NULL : m_script.c_str(),
m_events);
servers_status_current_to_pending(m_monitor);
store_server_journal(m_monitor, NULL);
release_monitor_servers(m_monitor);
/** Sleep until the next monitoring interval */
size_t ms = 0;
while (ms < m_monitor->interval && !m_shutdown)
{
if (m_monitor->server_pending_changes)
{
// Admin has changed something, skip sleep
break;
}
thread_millisleep(MXS_MON_BASE_INTERVAL_MS);
ms += MXS_MON_BASE_INTERVAL_MS;
}
}
mysql_thread_end();
}
/**
* The module entry point routine. It is this routine that
* must populate the structure that is referred to as the
* "module object", this is a structure with the set of
* external entry points for this module.
*
* @return The module object
*/
extern "C" MXS_MODULE* MXS_CREATE_MODULE()
{
static MXS_MODULE info =
{
MXS_MODULE_API_MONITOR,
MXS_MODULE_GA,
MXS_MONITOR_VERSION,
"A Group Replication cluster monitor",
"V1.0.0",
MXS_NO_MODULE_CAPABILITIES,
&maxscale::MonitorApi<GRMon>::s_api,
NULL, /* Process init. */
NULL, /* Process finish. */
NULL, /* Thread init. */
NULL, /* Thread finish. */
{
{
"script",
MXS_MODULE_PARAM_PATH,
NULL,
MXS_MODULE_OPT_PATH_X_OK
},
{
"events",
MXS_MODULE_PARAM_ENUM,
MXS_MONITOR_EVENT_DEFAULT_VALUE,
MXS_MODULE_OPT_NONE,
mxs_monitor_event_enum_values
},
{MXS_END_MODULE_PARAMS}
}
};
return &info;
}