
It is now possible to [un]softfail a Clustrix node via MaxScale using a Clustrix monitor module command. In case a node is successfully softfailed, the `Being Drained` bit will automatically turned on. Similarly, if a node is successfully unsoftfailed, the `Being Drained` bit will be cleared.
119 lines
3.1 KiB
C++
119 lines
3.1 KiB
C++
/*
|
|
* Copyright (c) 2018 MariaDB Corporation Ab
|
|
*
|
|
* Use of this software is governed by the Business Source License included
|
|
* in the LICENSE.TXT file and at www.mariadb.com/bsl11.
|
|
*
|
|
* Change Date: 2022-01-01
|
|
*
|
|
* On the date above, in accordance with the Business Source License, use
|
|
* of this software will be governed by version 2 or later of the General
|
|
* Public License.
|
|
*/
|
|
#pragma once
|
|
|
|
#include "clustrixmon.hh"
|
|
#include <map>
|
|
#include <maxscale/monitor.hh>
|
|
#include <maxbase/http.hh>
|
|
#include "clustrixmembership.hh"
|
|
#include "clustrixnode.hh"
|
|
|
|
class ClustrixMonitor : public maxscale::MonitorWorker
|
|
{
|
|
ClustrixMonitor(const ClustrixMonitor&) = delete;
|
|
ClustrixMonitor& operator=(const ClustrixMonitor&) = delete;
|
|
public:
|
|
class Config
|
|
{
|
|
public:
|
|
Config()
|
|
: m_cluster_monitor_interval(DEFAULT_CLUSTER_MONITOR_INTERVAL_VALUE)
|
|
, m_health_check_threshold(DEFAULT_HEALTH_CHECK_THRESHOLD_VALUE)
|
|
{
|
|
};
|
|
|
|
long cluster_monitor_interval() const
|
|
{
|
|
return m_cluster_monitor_interval;
|
|
}
|
|
|
|
void set_cluster_monitor_interval(long l)
|
|
{
|
|
m_cluster_monitor_interval = l;
|
|
}
|
|
|
|
long health_check_threshold() const
|
|
{
|
|
return m_health_check_threshold;
|
|
}
|
|
|
|
void set_health_check_threshold(long l)
|
|
{
|
|
m_health_check_threshold = l;
|
|
}
|
|
|
|
private:
|
|
long m_cluster_monitor_interval;
|
|
long m_health_check_threshold;
|
|
};
|
|
|
|
~ClustrixMonitor();
|
|
|
|
static ClustrixMonitor* create(const std::string& name, const std::string& module);
|
|
|
|
bool configure(const MXS_CONFIG_PARAMETER* pParams) override;
|
|
|
|
bool softfail(SERVER* pServer, json_t** ppError);
|
|
bool unsoftfail(SERVER* pServer, json_t** ppError);
|
|
|
|
private:
|
|
ClustrixMonitor(const std::string& name, const std::string& module);
|
|
|
|
void pre_loop() override;
|
|
void post_loop() override;
|
|
|
|
void tick() override;
|
|
|
|
void check_hub_and_refresh_nodes();
|
|
void check_hub();
|
|
void choose_hub();
|
|
void refresh_nodes();
|
|
bool check_cluster_membership(std::map<int, ClustrixMembership>* pMemberships);
|
|
|
|
void update_server_statuses();
|
|
|
|
void make_health_check();
|
|
void initiate_delayed_http_check();
|
|
bool check_http(Call::action_t action);
|
|
|
|
bool perform_softfail(SERVER* pServer, json_t** ppError);
|
|
bool perform_unsoftfail(SERVER* pServer, json_t** ppError);
|
|
|
|
enum class Operation
|
|
{
|
|
SOFTFAIL,
|
|
UNSOFTFAIL,
|
|
};
|
|
|
|
bool perform_operation(Operation operation,
|
|
SERVER* pServer,
|
|
json_t** ppError);
|
|
|
|
|
|
static long now()
|
|
{
|
|
return mxb::WorkerLoad::get_time_ms();
|
|
}
|
|
|
|
private:
|
|
Config m_config;
|
|
std::map<int, ClustrixNode> m_nodes;
|
|
std::vector<std::string> m_health_urls;
|
|
mxb::http::Async m_http;
|
|
uint32_t m_delayed_http_check_id { 0 };
|
|
long m_last_cluster_check { 0 };
|
|
SERVER* m_pHub_server { nullptr };
|
|
MYSQL* m_pHub_con { nullptr };
|
|
};
|