/*
 * Copyright (c) 2016 MariaDB Corporation Ab
 *
 * Use of this software is governed by the Business Source License included
 * in the LICENSE.TXT file and at www.mariadb.com/bsl11.
 *
 * Change Date: 2022-01-01
 *
 * On the date above, in accordance with the Business Source License, use
 * of this software will be governed by version 2 or later of the General
 * Public License.
 */
|
|
|
|
/**
 * @file readconnroute.cc - Read Connection Load Balancing Query Router
 *
 * This is the implementation of a simple query router that balances
 * read connections. It assumes the service is configured with a set
 * of slaves and that the application clients already split read and write
 * queries. It offers a service to balance the client read connections
 * over this set of slave servers. It does this once only, at the time
 * the connection is made. It chooses the server that currently has the least
 * number of connections by keeping a count for each server of how
 * many connections the query router has made to the server.
 *
 * When two servers have the same number of current connections the one with
 * the least number of connections since startup will be used.
 *
 * The router may also have options associated to it that will limit the
 * choice of backend server. Currently two options are supported, the "master"
 * option will cause the router to only connect to servers marked as masters
 * and the "slave" option will limit connections to servers that are marked
 * as slaves. If neither option is specified the router will connect to either
 * masters or slaves.
 */
|
|
|
|
#include "readconnroute.hh"

#include <cstdio>

#include <maxscale/protocol/mysql.hh>
#include <maxscale/modutil.hh>
|
|
|
|
/**
|
|
* The module entry point routine. It is this routine that
|
|
* must populate the structure that is referred to as the
|
|
* "module object", this is a structure with the set of
|
|
* external entry points for this module.
|
|
*
|
|
* @return The module object
|
|
*/
|
|
extern "C" MXS_MODULE* MXS_CREATE_MODULE()
|
|
{
|
|
MXS_NOTICE("Initialise readconnroute router module.");
|
|
|
|
static MXS_MODULE info =
|
|
{
|
|
MXS_MODULE_API_ROUTER,
|
|
MXS_MODULE_GA,
|
|
MXS_ROUTER_VERSION,
|
|
"A connection based router to load balance based on connections",
|
|
"V2.0.0",
|
|
RCAP_TYPE_RUNTIME_CONFIG,
|
|
&RCR::s_object,
|
|
nullptr, /* Process init. */
|
|
nullptr, /* Process finish. */
|
|
nullptr, /* Thread init. */
|
|
nullptr, /* Thread finish. */
|
|
{
|
|
{MXS_END_MODULE_PARAMS}
|
|
}
|
|
};
|
|
|
|
return &info;
|
|
}
|
|
|
|
/*
|
|
* This routine returns the master server from a MariaDB replication tree. The server must be
|
|
* running, not in maintenance and have the master bit set. If multiple masters are found,
|
|
* the one with the highest weight is chosen.
|
|
*
|
|
* @param servers The list of servers
|
|
*
|
|
* @return The Master server
|
|
*/
|
|
SERVER_REF* RCR::get_root_master()
|
|
{
|
|
SERVER_REF* master_host = nullptr;
|
|
for (SERVER_REF* ref = m_pService->dbref; ref; ref = ref->next)
|
|
{
|
|
if (server_ref_is_active(ref) && ref->server->is_master())
|
|
{
|
|
// No master found yet or this one has better weight.
|
|
if (!master_host || ref->server_weight > master_host->server_weight)
|
|
{
|
|
master_host = ref;
|
|
}
|
|
}
|
|
}
|
|
return master_host;
|
|
}
|
|
|
|
/**
 * Parse the `router_options` parameter and publish the server status filter.
 *
 * Each option (separated by commas, spaces or tabs, compared case-insensitively)
 * contributes bits to a status mask and to the value expected under that mask:
 *
 *   master  -> mask MASTER|SLAVE, value MASTER
 *   slave   -> mask MASTER|SLAVE, value SLAVE
 *   running -> mask RUNNING,      value RUNNING
 *   synced  -> mask JOINED,       value JOINED
 *   ndb     -> mask NDB,          value NDB
 *
 * With no options at all, RUNNING is used. The result is stored atomically as
 * one 64-bit word (mask in the low 32 bits, value in the high 32 bits), and
 * only if every option was recognised.
 *
 * @param params Configuration parameters; only "router_options" is read here
 *
 * @return True if all options were recognised, false otherwise (an error is
 *         logged for each unknown option and the stored filter is left untouched)
 */
bool RCR::configure(MXS_CONFIG_PARAMETER* params)
{
    uint64_t required_mask = 0;
    uint64_t required_value = 0;
    bool all_known = true;

    // Accumulates the bits contributed by one option.
    auto require = [&required_mask, &required_value](uint64_t mask, uint64_t value) {
            required_mask |= mask;
            required_value |= value;
        };

    for (const auto& opt : mxs::strtok(params->get_string("router_options"), ", \t"))
    {
        const char* name = opt.c_str();

        if (strcasecmp(name, "master") == 0)
        {
            require(SERVER_MASTER | SERVER_SLAVE, SERVER_MASTER);
        }
        else if (strcasecmp(name, "slave") == 0)
        {
            require(SERVER_MASTER | SERVER_SLAVE, SERVER_SLAVE);
        }
        else if (strcasecmp(name, "running") == 0)
        {
            require(SERVER_RUNNING, SERVER_RUNNING);
        }
        else if (strcasecmp(name, "synced") == 0)
        {
            require(SERVER_JOINED, SERVER_JOINED);
        }
        else if (strcasecmp(name, "ndb") == 0)
        {
            require(SERVER_NDB, SERVER_NDB);
        }
        else
        {
            MXS_ERROR("Unsupported router option \'%s\' for readconnroute. "
                      "Expected router options are [slave|master|synced|ndb|running]",
                      opt.c_str());
            all_known = false;
        }
    }

    if (required_mask == 0 && required_value == 0)
    {
        /** No parameters given, use RUNNING as a valid server */
        require(SERVER_RUNNING, SERVER_RUNNING);
    }

    if (all_known)
    {
        // Publish both halves in a single atomic store so that readers never
        // observe a mask from one configuration with the value of another.
        atomic_store_uint64(&m_bitmask_and_bitvalue, required_mask | (required_value << 32));
    }

    return all_known;
}
|
|
|
|
|
|
/**
 * Construct a router instance for the given service.
 *
 * Only forwards the service to the mxs::Router base; the router options are
 * applied separately by configure().
 *
 * @param service The service this router instance belongs to
 */
RCR::RCR(SERVICE* service)
    : mxs::Router<RCR, RCRSession>(service)
{
}
|
|
|
|
// static
|
|
RCR* RCR::create(SERVICE* service, MXS_CONFIG_PARAMETER* params)
|
|
{
|
|
RCR* inst = new(std::nothrow) RCR(service);
|
|
|
|
if (inst && !inst->configure(params))
|
|
{
|
|
delete inst;
|
|
inst = nullptr;
|
|
}
|
|
|
|
return inst;
|
|
}
|
|
|
|
/**
 * Construct a router session bound to one backend.
 *
 * The constructor only stores its arguments; it does not touch the backend's
 * connection counter.
 *
 * @param inst     Router instance that created the session
 * @param session  The client session; its client DCB is remembered
 * @param backend  Server reference the session is connected to
 * @param dcb      DCB of the backend connection
 * @param bitmask  Server status mask in effect for this session
 * @param bitvalue Server status value in effect for this session
 */
RCRSession::RCRSession(RCR* inst,
                       MXS_SESSION* session,
                       SERVER_REF* backend,
                       DCB* dcb,
                       uint32_t bitmask,
                       uint32_t bitvalue)
    : mxs::RouterSession(session)
    , m_instance(inst)
    , m_backend(backend)
    , m_dcb(dcb)
    , m_client_dcb(session->client_dcb)
    , m_bitmask(bitmask)
    , m_bitvalue(bitvalue)
{
}
|
|
|
|
/**
 * Destroy the router session.
 *
 * Decrements the backend's connection counter, undoing the increment made
 * by RCR::newSession() once the session had been created.
 */
RCRSession::~RCRSession()
{
    mxb::atomic::add(&m_backend->connections, -1, mxb::atomic::RELAXED);
}
|
|
|
|
void RCRSession::close()
|
|
{
|
|
mxb_assert(m_dcb);
|
|
dcb_close(m_dcb);
|
|
}
|
|
|
|
/**
 * Create a new router session and pick the backend it will use.
 *
 * The server is chosen once, here, and is used for the whole session. Among
 * the active, connectable servers whose status matches the configured
 * router_options, the one with the lowest (connections + 1) / weight score is
 * selected; a server with a non-zero weight is always preferred over one with
 * zero weight. With the "master" option only the root master is accepted, and
 * with the "slave" option the root master is skipped unless nothing else is
 * available.
 *
 * @param session The client session the router session is created for
 *
 * @return The new router session, or nullptr if no eligible server was found,
 *         the backend connection could not be opened or allocation failed
 */
RCRSession* RCR::newSession(MXS_SESSION* session)
{
    // configure() stores the mask in the low and the value in the high 32 bits.
    uint64_t mask = atomic_load_uint64(&m_bitmask_and_bitvalue);
    uint32_t bitmask = mask;
    uint32_t bitvalue = mask >> 32;

    /**
     * Find the Master host from available servers
     */
    SERVER_REF* master_host = get_root_master();

    bool connectable_master = master_host ? master_host->server->is_connectable() : false;

    /**
     * Find a backend server to connect to. This is the extent of the
     * load balancing algorithm we need to implement for this simple
     * connection router.
     */
    SERVER_REF* candidate = nullptr;

    /*
     * Loop over all the servers and keep the one with the best score, i.e. the
     * lowest number of connections relative to its weight. Servers that are not
     * active or not connectable are never considered.
     */
    for (SERVER_REF* ref = m_pService->dbref; ref; ref = ref->next)
    {
        if (!server_ref_is_active(ref) || !ref->server->is_connectable())
        {
            continue;
        }

        mxb_assert(ref->server->is_usable());

        /* Check server status bits against bitvalue from router_options */
        if (ref->server->status & bitmask & bitvalue)
        {
            if (master_host && connectable_master)
            {
                if (ref == master_host
                    && (bitvalue & (SERVER_SLAVE | SERVER_MASTER)) == SERVER_SLAVE)
                {
                    /* Skip root master here, as it could also be slave of an external server that
                     * is not in the configuration. Intermediate masters (Relay Servers) are also
                     * slave and will be selected as Slave(s)
                     */
                    continue;
                }

                if (ref == master_host && bitvalue == SERVER_MASTER)
                {
                    /* If option is "master" return only the root Master as there could be
                     * intermediate masters (Relay Servers) and they must not be selected.
                     */
                    candidate = master_host;
                    break;
                }
            }
            else if (bitvalue == SERVER_MASTER)
            {
                /* No connectable master server. If requested router_option is 'master'
                 * candidate will be nullptr.
                 */
                candidate = nullptr;
                break;
            }

            /* If no candidate set, set first running server as our initial candidate server */
            if (!candidate)
            {
                candidate = ref;
            }
            else if (ref->server_weight == 0 || candidate->server_weight == 0)
            {
                if (ref->server_weight)     // anything with a weight is better
                {
                    candidate = ref;
                }
            }
            else if ((ref->connections + 1) / ref->server_weight
                     < (candidate->connections + 1) / candidate->server_weight)
            {
                /* ref has a better score. */
                candidate = ref;
            }
        }
    }

    /* If we haven't found a proper candidate yet but a master server is available, we'll pick that
     * with the assumption that it is "better" than a slave.
     */
    if (!candidate)
    {
        if (master_host && connectable_master)
        {
            candidate = master_host;
            // Even if we had 'router_options=slave' in the configuration file, we
            // will still end up here if there are no slaves, but a sole master. So
            // that the server will be considered valid in connection_is_valid(), we
            // turn on the SERVER_MASTER bit.
            //
            // We must do that so that readconnroute in MaxScale 2.2 will again behave
            // the same way as it did up until 2.1.12.
            if (bitvalue & SERVER_SLAVE)
            {
                bitvalue |= SERVER_MASTER;
            }
        }
        else
        {
            if (!master_host)
            {
                MXS_ERROR("Failed to create new routing session. Couldn't find eligible"
                          " candidate server. Freeing allocated resources.");
            }
            else
            {
                mxb_assert(!connectable_master);
                MXS_ERROR("The only possible candidate server (%s) is being drained "
                          "and thus cannot be used.", master_host->server->address);
            }
            return nullptr;
        }
    }
    else
    {
        mxb_assert(candidate->server->is_connectable());
    }

    /** Open the backend connection */
    DCB* backend_dcb = dcb_connect(candidate->server, session, candidate->server->protocol().c_str());

    if (!backend_dcb)
    {
        /** The failure is reported in dcb_connect() */
        return nullptr;
    }

    RCRSession* client_rses = new(std::nothrow) RCRSession(this, session, candidate, backend_dcb,
                                                           bitmask, bitvalue);

    if (!client_rses)
    {
        // NOTE(review): backend_dcb is not closed on this path. Presumably it is
        // released when the session itself is torn down - confirm.
        return nullptr;
    }

    mxb::atomic::add(&candidate->connections, 1, mxb::atomic::RELAXED);

    // Updated atomically, in the same way as n_queries in routeQuery(); a plain
    // increment is a non-atomic read-modify-write on a shared counter.
    mxb::atomic::add(&m_stats.n_sessions, 1, mxb::atomic::RELAXED);

    MXS_INFO("New session for server %s. Connections : %d",
             candidate->server->name(),
             candidate->connections);

    return client_rses;
}
|
|
|
|
/** Log routing failure due to closed session */
|
|
static void log_closed_session(mxs_mysql_cmd_t mysql_command, SERVER_REF* ref)
|
|
{
|
|
char msg[SERVER::MAX_ADDRESS_LEN + 200] = ""; // Extra space for message
|
|
|
|
if (ref->server->is_down())
|
|
{
|
|
sprintf(msg, "Server '%s' is down.", ref->server->name());
|
|
}
|
|
else if (ref->server->is_in_maint())
|
|
{
|
|
sprintf(msg, "Server '%s' is in maintenance.", ref->server->name());
|
|
}
|
|
else
|
|
{
|
|
sprintf(msg, "Server '%s' no longer qualifies as a target server.", ref->server->name());
|
|
}
|
|
|
|
MXS_ERROR("Failed to route MySQL command %d to backend server. %s", mysql_command, msg);
|
|
}
|
|
|
|
/**
|
|
* Check if the server we're connected to is still valid
|
|
*
|
|
* @param inst Router instance
|
|
* @param router_cli_ses Router session
|
|
*
|
|
* @return True if the backend connection is still valid
|
|
*/
|
|
bool RCRSession::connection_is_valid() const
|
|
{
|
|
bool rval = false;
|
|
|
|
// m_instance->bitvalue and m_bitvalue are different, if we had
|
|
// 'router_options=slave' in the configuration file and there was only
|
|
// the sole master available at session creation time.
|
|
|
|
if (m_backend->server->is_usable() && (m_backend->server->status & m_bitmask & m_bitvalue))
|
|
{
|
|
// Note the use of '==' and not '|'. We must use the former to exclude a
|
|
// 'router_options=slave' that uses the master due to no slave having been
|
|
// available at session creation time. Its bitvalue is (SERVER_MASTER | SERVER_SLAVE).
|
|
if (m_bitvalue == SERVER_MASTER && m_backend->active)
|
|
{
|
|
// If we're using an active master server, verify that it is still a master
|
|
rval = m_backend == m_instance->get_root_master();
|
|
}
|
|
else
|
|
{
|
|
/**
|
|
* Either we don't use master type servers or the server reference
|
|
* is deactivated. We let deactivated connection close gracefully
|
|
* so we simply assume it is OK. This allows a server to be taken
|
|
* out of use in a manner that won't cause errors to the connected
|
|
* clients.
|
|
*/
|
|
rval = true;
|
|
}
|
|
}
|
|
|
|
return rval;
|
|
}
|
|
|
|
/**
 * Route one buffer from the client to the backend of this session.
 *
 * The query and packet counters are bumped first. If the backend is no longer
 * valid, the failure is logged, the buffer is freed and 0 is returned.
 * Otherwise a COM_CHANGE_USER is handed to the backend DCB's auth entry point
 * and everything else is written to the backend as is.
 *
 * @param queue The buffer to route; handed on to the backend or freed here
 *
 * @return The return value of the backend auth/write call, or 0 if the
 *         backend connection is no longer valid
 */
int RCRSession::routeQuery(GWBUF* queue)
{
    int rc = 0;
    MySQLProtocol* client_proto = static_cast<MySQLProtocol*>(m_client_dcb->protocol);
    mxs_mysql_cmd_t cmd = client_proto->current_command;

    mxb::atomic::add(&m_instance->stats().n_queries, 1, mxb::atomic::RELAXED);

    // Due to the streaming nature of readconnroute, this is not accurate
    mxb::atomic::add(&m_backend->server->stats.packets, 1, mxb::atomic::RELAXED);

    DCB* backend_dcb = m_dcb;
    mxb_assert(backend_dcb);

    if (!connection_is_valid())
    {
        log_closed_session(cmd, m_backend);
        gwbuf_free(queue);
        return rc;
    }

    char* sql = nullptr;    // Only extracted for COM_QUERY when info logging is on

    if (cmd == MXS_COM_CHANGE_USER)
    {
        rc = backend_dcb->func.auth(backend_dcb,
                                    nullptr,
                                    backend_dcb->session,
                                    queue);
    }
    else
    {
        if (cmd == MXS_COM_QUERY && mxs_log_is_priority_enabled(LOG_INFO))
        {
            // Must be read before the write below is given the buffer.
            sql = modutil_get_SQL(queue);
        }

        rc = backend_dcb->func.write(backend_dcb, queue);
    }

    MXS_INFO("Routed [%s] to '%s'%s%s",
             STRPACKETTYPE(cmd),
             backend_dcb->server->name(),
             sql ? ": " : ".",
             sql ? sql : "");
    MXS_FREE(sql);

    return rc;
}
|
|
|
|
/**
 * Print router statistics to a DCB.
 *
 * Always prints the session and query counters. If the service has a
 * weighting parameter, a table with the weight (as a percentage) and the
 * current connection count of every server reference follows.
 *
 * @param dcb The DCB the output is written to
 */
void RCR::diagnostics(DCB* dcb)
{
    const char* weightby = serviceGetWeightingParameter(m_pService);

    dcb_printf(dcb, "\tNumber of router sessions: %d\n", m_stats.n_sessions);
    dcb_printf(dcb, "\tCurrent no. of router sessions: %d\n", m_pService->stats.n_current);
    dcb_printf(dcb, "\tNumber of queries forwarded: %d\n", m_stats.n_queries);

    if (!*weightby)
    {
        // No weighting in use, nothing more to report.
        return;
    }

    dcb_printf(dcb,
               "\tConnection distribution based on %s "
               "server parameter.\n",
               weightby);
    dcb_printf(dcb, "\t\tServer Target %% Connections\n");

    SERVER_REF* ref = m_pService->dbref;

    while (ref)
    {
        dcb_printf(dcb,
                   "\t\t%-20s %3.1f%% %d\n",
                   ref->server->name(),
                   ref->server_weight * 100,
                   ref->connections);
        ref = ref->next;
    }
}
|
|
|
|
/**
 * Build the router statistics as a JSON object.
 *
 * The object has the fields "connections", "current_connections" and
 * "queries", plus "weightby" when the service has a weighting parameter.
 *
 * @return A new JSON object
 */
json_t* RCR::diagnostics_json() const
{
    json_t* stats_obj = json_object();

    json_t* total_sessions = json_integer(m_stats.n_sessions);
    json_object_set_new(stats_obj, "connections", total_sessions);

    json_t* current_sessions = json_integer(m_pService->stats.n_current);
    json_object_set_new(stats_obj, "current_connections", current_sessions);

    json_t* total_queries = json_integer(m_stats.n_queries);
    json_object_set_new(stats_obj, "queries", total_queries);

    const char* weightby = serviceGetWeightingParameter(m_pService);

    if (*weightby != '\0')
    {
        json_object_set_new(stats_obj, "weightby", json_string(weightby));
    }

    return stats_obj;
}
|
|
|
|
/**
|
|
* Client Reply routine
|
|
*
|
|
* The routine will reply to client data from backend server
|
|
*
|
|
* @param backend_dcb The backend DCB
|
|
* @param queue The GWBUF with reply data
|
|
*/
|
|
void RCRSession::clientReply(GWBUF* queue, DCB* backend_dcb)
|
|
{
|
|
mxb_assert(backend_dcb->session->client_dcb);
|
|
MXS_SESSION_ROUTE_REPLY(backend_dcb->session, queue);
|
|
}
|
|
|
|
/**
|
|
* Error Handler routine
|
|
*
|
|
* The routine will handle errors that occurred in writes.
|
|
*
|
|
* @param message The error message to reply
|
|
* @param problem_dcb The DCB related to the error
|
|
* @param action The action: ERRACT_NEW_CONNECTION or ERRACT_REPLY_CLIENT
|
|
* @param succp Result of action: true if router can continue
|
|
*/
|
|
void RCRSession::handleError(GWBUF* errbuf, DCB* problem_dcb, mxs_error_action_t action, bool* succp)
|
|
|
|
{
|
|
mxb_assert(problem_dcb->role == DCB::Role::BACKEND);
|
|
mxb_assert(problem_dcb->session->state == SESSION_STATE_STARTED);
|
|
DCB* client_dcb = problem_dcb->session->client_dcb;
|
|
client_dcb->func.write(client_dcb, gwbuf_clone(errbuf));
|
|
|
|
// The DCB will be closed once the session closes, no need to close it here
|
|
*succp = false;
|
|
}
|
|
|
|
uint64_t RCR::getCapabilities()
|
|
{
|
|
return RCAP_TYPE_RUNTIME_CONFIG;
|
|
}
|