457 lines
16 KiB
C
457 lines
16 KiB
C
#pragma once
|
|
/*
|
|
* Copyright (c) 2016 MariaDB Corporation Ab
|
|
*
|
|
* Use of this software is governed by the Business Source License included
|
|
* in the LICENSE.TXT file and at www.mariadb.com/bsl11.
|
|
*
|
|
* Change Date: 2020-01-01
|
|
*
|
|
* On the date above, in accordance with the Business Source License, use
|
|
* of this software will be governed by version 2 or later of the General
|
|
* Public License.
|
|
*/
|
|
|
|
/**
|
|
* @file include/maxscale/monitor.h - The public monitor interface
|
|
*/
|
|
|
|
#include <maxscale/cdefs.h>
|
|
|
|
#include <openssl/sha.h>
|
|
|
|
#include <maxscale/config.h>
|
|
#include <maxscale/dcb.h>
|
|
#include <maxscale/server.h>
|
|
#include <maxscale/jansson.h>
|
|
#include <maxscale/protocol/mysql.h>
|
|
|
|
MXS_BEGIN_DECLS
|
|
|
|
struct mxs_monitor;
|
|
typedef struct mxs_monitor MXS_MONITOR;
|
|
|
|
/**
|
|
* An opaque type from which types specific for a particular
|
|
* monitor can be derived.
|
|
*/
|
|
typedef struct mxs_monitor_instance
|
|
{
|
|
} MXS_MONITOR_INSTANCE;
|
|
|
|
/**
|
|
* @verbatim
|
|
* The "module object" structure for a backend monitor module
|
|
*
|
|
* Monitor modules monitor the backend databases that MaxScale connects to.
|
|
* The information provided by a monitor is used in routing decisions.
|
|
*
|
|
* The entry points are:
|
|
* startMonitor Called by main to start the monitor
|
|
* stopMonitor Called by main to shut down and destroy a monitor
|
|
* diagnostics Called for diagnostic output
|
|
*
|
|
* startMonitor is called to start the monitoring process, it is called on the
|
|
* MaxScale main thread and is responsible for creating a thread for the monitor
|
|
* itself to run on. This should use the entry points defined in the thread.h
|
|
* header file rather than make direct calls to the operating system threading
|
|
* libraries. The return from startMonitor is a pointer that will be passed to
|
|
* all other monitor API calls.
|
|
*
|
|
* @endverbatim
|
|
*
|
|
* @see load_module
|
|
*/
|
|
typedef struct mxs_monitor_api
|
|
{
|
|
/**
|
|
* @brief Create the monitor.
|
|
*
|
|
* This entry point is called once when MaxScale is started, for
|
|
* creating the monitor.
|
|
*
|
|
* If the function fails, MaxScale will not start. That is, it
|
|
* should fail only for fatal reasons such as not being able to
|
|
* create vital resources.
|
|
*
|
|
* @param monitor The monitor object.
|
|
*
|
|
* @return Pointer to the monitor specific data. Will be stored
|
|
* in @c monitor->handle.
|
|
*/
|
|
MXS_MONITOR_INSTANCE *(*createInstance)(MXS_MONITOR *monitor);
|
|
|
|
/**
|
|
* @brief Destroy the monitor.
|
|
*
|
|
* This entry point is called once when MaxScale is shutting down, iff
|
|
* the earlier call to @c initMonitor returned on object. The monitor should
|
|
* perform all needed cleanup.
|
|
*
|
|
* @param monitor The monitor object.
|
|
*/
|
|
void (*destroyInstance)(MXS_MONITOR_INSTANCE *monitor);
|
|
|
|
/**
|
|
* @brief Start the monitor
|
|
*
|
|
* This entry point is called when the monitor is started. If the monitor
|
|
* requires polling of the servers, it should create a separate monitoring
|
|
* thread.
|
|
*
|
|
* @param monitor The monitor object
|
|
* @param params Parameters for this monitor
|
|
*
|
|
* @return True, if the monitor could be started, false otherwise.
|
|
*/
|
|
bool (*startMonitor)(MXS_MONITOR_INSTANCE *monitor,
|
|
const MXS_CONFIG_PARAMETER *params);
|
|
|
|
/**
|
|
* @brief Stop the monitor
|
|
*
|
|
* This entry point is called when the monitor is stopped. If the monitor
|
|
* uses a polling thread, the thread should be stopped.
|
|
*
|
|
* @param monitor The monitor object
|
|
*/
|
|
void (*stopMonitor)(MXS_MONITOR_INSTANCE *monitor);
|
|
|
|
/**
|
|
* @brief Write diagnostic information to a DCB.
|
|
*
|
|
* @param monitor The monitor object.
|
|
* @param dcb The dcb to write to.
|
|
*/
|
|
void (*diagnostics)(const MXS_MONITOR_INSTANCE* monitor, DCB* dcb);
|
|
|
|
/**
|
|
* @brief Return diagnostic information about the monitor
|
|
*
|
|
* @param monitor The monitor object.
|
|
*
|
|
* @return A JSON object representing the state of the monitor
|
|
*
|
|
* @see jansson.h
|
|
*/
|
|
json_t* (*diagnostics_json)(const MXS_MONITOR_INSTANCE *monitor);
|
|
} MXS_MONITOR_API;
|
|
|
|
/**
|
|
* The monitor API version number. Any change to the monitor module API
|
|
* must change these versions using the rules defined in modinfo.h
|
|
*/
|
|
#define MXS_MONITOR_VERSION {4, 0, 0}
|
|
|
|
/**
|
|
* Specifies capabilities specific for monitor.
|
|
*
|
|
* @see enum routing_capability
|
|
*
|
|
* @note The values of the capabilities here *must* be between 0x0001 0000 0000 0000
|
|
* and 0x0080 0000 0000 0000, that is, bits 48 to 55.
|
|
*/
|
|
typedef enum monitor_capability
|
|
{
|
|
MCAP_TYPE_NONE = 0x0 // TODO: remove once monitor capabilities are defined
|
|
} monitor_capability_t;
|
|
|
|
/** Monitor's poll frequency */
|
|
#define MXS_MON_BASE_INTERVAL_MS 100
|
|
|
|
#define MXS_MONITOR_RUNNING 1
|
|
#define MXS_MONITOR_STOPPING 2
|
|
#define MXS_MONITOR_STOPPED 3
|
|
|
|
#define MXS_MONITOR_DEFAULT_ID 1UL // unsigned long value
|
|
|
|
#define MAX_MONITOR_USER_LEN 512
|
|
#define MAX_MONITOR_PASSWORD_LEN 512
|
|
|
|
/**
|
|
* Monitor state bit mask values
|
|
*/
|
|
typedef enum
|
|
{
|
|
MONITOR_STATE_ALLOC = 0x00,
|
|
MONITOR_STATE_RUNNING = 0x01,
|
|
MONITOR_STATE_STOPPING = 0x02,
|
|
MONITOR_STATE_STOPPED = 0x04,
|
|
MONITOR_STATE_FREED = 0x08
|
|
} monitor_state_t;
|
|
|
|
/* Return type of mon_ping_or_connect_to_db(). */
|
|
typedef enum
|
|
{
|
|
MONITOR_CONN_EXISTING_OK, /* Existing connection was ok and server replied to ping. */
|
|
MONITOR_CONN_NEWCONN_OK, /* No existing connection or no ping reply. New connection created
|
|
* successfully. */
|
|
MONITOR_CONN_REFUSED, /* No existing connection or no ping reply. Server refused new connection. */
|
|
MONITOR_CONN_TIMEOUT /* No existing connection or no ping reply. Timeout on new connection. */
|
|
} mxs_connect_result_t;
|
|
|
|
/** Monitor events */
|
|
typedef enum
|
|
{
|
|
UNDEFINED_EVENT = 0,
|
|
MASTER_DOWN_EVENT = (1 << 0), /**< master_down */
|
|
MASTER_UP_EVENT = (1 << 1), /**< master_up */
|
|
SLAVE_DOWN_EVENT = (1 << 2), /**< slave_down */
|
|
SLAVE_UP_EVENT = (1 << 3), /**< slave_up */
|
|
SERVER_DOWN_EVENT = (1 << 4), /**< server_down */
|
|
SERVER_UP_EVENT = (1 << 5), /**< server_up */
|
|
SYNCED_DOWN_EVENT = (1 << 6), /**< synced_down */
|
|
SYNCED_UP_EVENT = (1 << 7), /**< synced_up */
|
|
DONOR_DOWN_EVENT = (1 << 8), /**< donor_down */
|
|
DONOR_UP_EVENT = (1 << 9), /**< donor_up */
|
|
NDB_DOWN_EVENT = (1 << 10), /**< ndb_down */
|
|
NDB_UP_EVENT = (1 << 11), /**< ndb_up */
|
|
LOST_MASTER_EVENT = (1 << 12), /**< lost_master */
|
|
LOST_SLAVE_EVENT = (1 << 13), /**< lost_slave */
|
|
LOST_SYNCED_EVENT = (1 << 14), /**< lost_synced */
|
|
LOST_DONOR_EVENT = (1 << 15), /**< lost_donor */
|
|
LOST_NDB_EVENT = (1 << 16), /**< lost_ndb */
|
|
NEW_MASTER_EVENT = (1 << 17), /**< new_master */
|
|
NEW_SLAVE_EVENT = (1 << 18), /**< new_slave */
|
|
NEW_SYNCED_EVENT = (1 << 19), /**< new_synced */
|
|
NEW_DONOR_EVENT = (1 << 20), /**< new_donor */
|
|
NEW_NDB_EVENT = (1 << 21), /**< new_ndb */
|
|
} mxs_monitor_event_t;
|
|
|
|
/**
|
|
* The linked list of servers that are being monitored by the monitor module.
|
|
*/
|
|
typedef struct monitored_server
|
|
{
|
|
SERVER *server; /**< The server being monitored */
|
|
MYSQL *con; /**< The MySQL connection */
|
|
bool log_version_err;
|
|
int mon_err_count;
|
|
uint64_t mon_prev_status; /**< Status before starting the current monitor loop */
|
|
uint64_t pending_status; /**< Status during current monitor loop */
|
|
bool new_event; /**< Whether an action was taken on the last event */
|
|
int64_t disk_space_checked; /**< When was the disk space checked the last time */
|
|
struct monitored_server *next; /**< The next server in the list */
|
|
} MXS_MONITORED_SERVER;
|
|
|
|
/**
|
|
* Representation of the running monitor.
|
|
*/
|
|
struct mxs_monitor
|
|
{
|
|
char *name; /**< The name of the monitor module */
|
|
char user[MAX_MONITOR_USER_LEN]; /*< Monitor username */
|
|
char password[MAX_MONITOR_PASSWORD_LEN]; /*< Monitor password */
|
|
SPINLOCK lock;
|
|
MXS_CONFIG_PARAMETER* parameters; /*< configuration parameters */
|
|
MXS_MONITORED_SERVER* monitored_servers; /*< List of servers the monitor monitors */
|
|
monitor_state_t state; /**< The state of the monitor */
|
|
int connect_timeout; /**< Connect timeout in seconds for mysql_real_connect */
|
|
int connect_attempts; /**< How many times a connection is attempted */
|
|
int read_timeout; /**< Timeout in seconds to read from the server.
|
|
* There are retries and the total effective timeout
|
|
* value is three times the option value.
|
|
*/
|
|
int write_timeout; /**< Timeout in seconds for each attempt to write to the server.
|
|
* There are retries and the total effective timeout value is
|
|
* two times the option value.
|
|
*/
|
|
MXS_MONITOR_API *api; /**< The monitor api */
|
|
char *module_name; /**< Name of the monitor module */
|
|
MXS_MONITOR_INSTANCE *instance; /**< Instance returned from startMonitor */
|
|
size_t interval; /**< The monitor interval */
|
|
int check_maintenance_flag; /**< Set when admin requests a maintenance status change. */
|
|
bool active; /**< True if monitor is active */
|
|
time_t journal_max_age; /**< Maximum age of journal file */
|
|
uint32_t script_timeout; /**< Timeout in seconds for the monitor scripts */
|
|
uint8_t journal_hash[SHA_DIGEST_LENGTH]; /**< SHA1 hash of the latest written journal */
|
|
MxsDiskSpaceThreshold* disk_space_threshold; /**< Disk space thresholds */
|
|
int64_t disk_space_check_interval; /**< How often should a disk space check be made at most. */
|
|
uint64_t ticks; /**< Number of performed monitoring intervals */
|
|
struct mxs_monitor *next; /**< Next monitor in the linked list */
|
|
};
|
|
|
|
static const MXS_ENUM_VALUE mxs_monitor_event_enum_values[] =
|
|
{
|
|
{"master_down", MASTER_DOWN_EVENT},
|
|
{"master_up", MASTER_UP_EVENT},
|
|
{"slave_down", SLAVE_DOWN_EVENT},
|
|
{"slave_up", SLAVE_UP_EVENT},
|
|
{"server_down", SERVER_DOWN_EVENT},
|
|
{"server_up", SERVER_UP_EVENT},
|
|
{"synced_down", SYNCED_DOWN_EVENT},
|
|
{"synced_up", SYNCED_UP_EVENT},
|
|
{"donor_down", DONOR_DOWN_EVENT},
|
|
{"donor_up", DONOR_UP_EVENT},
|
|
{"ndb_down", NDB_DOWN_EVENT},
|
|
{"ndb_up", NDB_UP_EVENT},
|
|
{"lost_master", LOST_MASTER_EVENT},
|
|
{"lost_slave", LOST_SLAVE_EVENT},
|
|
{"lost_synced", LOST_SYNCED_EVENT},
|
|
{"lost_donor", LOST_DONOR_EVENT},
|
|
{"lost_ndb", LOST_NDB_EVENT},
|
|
{"new_master", NEW_MASTER_EVENT},
|
|
{"new_slave", NEW_SLAVE_EVENT},
|
|
{"new_synced", NEW_SYNCED_EVENT},
|
|
{"new_donor", NEW_DONOR_EVENT},
|
|
{"new_ndb", NEW_NDB_EVENT},
|
|
{NULL}
|
|
};
|
|
|
|
/** Default value for the `events` parameter */
|
|
static const char MXS_MONITOR_EVENT_DEFAULT_VALUE[] = "master_down,master_up,slave_down,"
|
|
"slave_up,server_down,server_up,synced_down,synced_up,donor_down,donor_up,"
|
|
"ndb_down,ndb_up,lost_master,lost_slave,lost_synced,lost_donor,lost_ndb,"
|
|
"new_master,new_slave,new_synced,new_donor,new_ndb";
|
|
|
|
/**
|
|
* Monitor configuration parameters names
|
|
*/
|
|
extern const char CN_BACKEND_CONNECT_ATTEMPTS[];
|
|
extern const char CN_BACKEND_CONNECT_TIMEOUT[];
|
|
extern const char CN_BACKEND_READ_TIMEOUT[];
|
|
extern const char CN_BACKEND_WRITE_TIMEOUT[];
|
|
extern const char CN_DISK_SPACE_CHECK_INTERVAL[];
|
|
extern const char CN_EVENTS[];
|
|
extern const char CN_JOURNAL_MAX_AGE[];
|
|
extern const char CN_MONITOR_INTERVAL[];
|
|
extern const char CN_SCRIPT[];
|
|
extern const char CN_SCRIPT_TIMEOUT[];
|
|
|
|
bool check_monitor_permissions(MXS_MONITOR* monitor, const char* query);
|
|
|
|
void monitor_clear_pending_status(MXS_MONITORED_SERVER *ptr, uint64_t bit);
|
|
void monitor_set_pending_status(MXS_MONITORED_SERVER *ptr, uint64_t bit);
|
|
void monitor_check_maintenance_requests(MXS_MONITOR *monitor);
|
|
|
|
bool mon_status_changed(MXS_MONITORED_SERVER* mon_srv);
|
|
bool mon_print_fail_status(MXS_MONITORED_SERVER* mon_srv);
|
|
|
|
mxs_connect_result_t mon_ping_or_connect_to_db(MXS_MONITOR* mon, MXS_MONITORED_SERVER *database);
|
|
bool mon_connection_is_ok(mxs_connect_result_t connect_result);
|
|
void mon_log_connect_error(MXS_MONITORED_SERVER* database, mxs_connect_result_t rval);
|
|
const char* mon_get_event_name(mxs_monitor_event_t event);
|
|
|
|
/**
|
|
* Alter monitor parameters
|
|
*
|
|
* The monitor parameters should not be altered while the monitor is
|
|
* running. To alter a parameter from outside a monitor module, stop the monitor,
|
|
* do the alteration and then restart the monitor. The monitor "owns" the parameters
|
|
* as long as it is running so if the monitor needs to change its own parameters,
|
|
* it can do it without stopping itself.
|
|
*
|
|
* @param monitor Monitor whose parameter is altered
|
|
* @param key Parameter name to alter
|
|
* @param value New value for the parameter
|
|
*/
|
|
void mon_alter_parameter(MXS_MONITOR* monitor, const char* key, const char* value);
|
|
|
|
/**
|
|
* @brief Handle state change events
|
|
*
|
|
* This function should be called by all monitors at the end of each monitoring
|
|
* cycle. This will log state changes and execute any scripts that should be executed.
|
|
*
|
|
* @param monitor Monitor object
|
|
* @param script Script to execute or NULL for no script
|
|
* @param events Enabled events
|
|
*/
|
|
void mon_process_state_changes(MXS_MONITOR *monitor, const char *script, uint64_t events);
|
|
|
|
/**
|
|
* @brief Hangup connections to failed servers
|
|
*
|
|
* Injects hangup events for DCB that are connected to servers that are down.
|
|
*
|
|
* @param monitor Monitor object
|
|
*/
|
|
void mon_hangup_failed_servers(MXS_MONITOR *monitor);
|
|
|
|
/**
|
|
* @brief Report query errors
|
|
*
|
|
* @param db Database where the query failed
|
|
*/
|
|
void mon_report_query_error(MXS_MONITORED_SERVER* db);
|
|
|
|
/**
|
|
* @brief Convert monitor to JSON
|
|
*
|
|
* @param monitor Monitor to convert
|
|
* @param host Hostname of this server
|
|
*
|
|
* @return JSON representation of the monitor
|
|
*/
|
|
json_t* monitor_to_json(const MXS_MONITOR* monitor, const char* host);
|
|
|
|
/**
|
|
* @brief Convert all monitors to JSON
|
|
*
|
|
* @param host Hostname of this server
|
|
*
|
|
* @return JSON array containing all monitors
|
|
*/
|
|
json_t* monitor_list_to_json(const char* host);
|
|
|
|
/**
|
|
* @brief Get links to monitors that relate to a server
|
|
*
|
|
* @param server Server to inspect
|
|
* @param host Hostname of this server
|
|
*
|
|
* @return Array of monitor links or NULL if no relations exist
|
|
*/
|
|
json_t* monitor_relations_to_server(const SERVER* server, const char* host);
|
|
|
|
/**
|
|
* @brief Store a journal of server states
|
|
*
|
|
* @param monitor Monitor to journal
|
|
* @param master The current master server or NULL if no master exists
|
|
*/
|
|
void store_server_journal(MXS_MONITOR *monitor, MXS_MONITORED_SERVER *master);
|
|
|
|
/**
|
|
* @brief Load a journal of server states
|
|
*
|
|
* @param monitor Monitor where journal is loaded
|
|
* @param master Set to point to the current master
|
|
*/
|
|
void load_server_journal(MXS_MONITOR *monitor, MXS_MONITORED_SERVER **master);
|
|
|
|
/**
|
|
* Find the monitored server representing the server.
|
|
*
|
|
* @param mon Cluster monitor
|
|
* @param search_server Server to search for
|
|
* @return Found monitored server or NULL if not found
|
|
*/
|
|
MXS_MONITORED_SERVER* mon_get_monitored_server(const MXS_MONITOR* mon, SERVER* search_server);
|
|
|
|
/**
|
|
* Get an array of monitored servers. If a server defined in the config setting is not monitored by
|
|
* the given monitor, that server is ignored and not inserted into the output array.
|
|
*
|
|
* @param params Config parameters
|
|
* @param key Setting name
|
|
* @param mon Monitor which should monitor the servers
|
|
* @param monitored_servers_out Where to save output array. The caller should free the array, but not the
|
|
* elements. The output must contain NULL before calling this function.
|
|
* @return Output array size.
|
|
*/
|
|
int mon_config_get_servers(const MXS_CONFIG_PARAMETER* params, const char* key, const MXS_MONITOR* mon,
|
|
MXS_MONITORED_SERVER*** monitored_array_out);
|
|
|
|
/**
|
|
* @brief Set the disk space threshold of a monitor
|
|
*
|
|
* @param server The monitor.
|
|
* @param disk_space_threshold The disk space threshold as specified in the config file.
|
|
*
|
|
* @return True, if the provided string is valid and the threshold could be set.
|
|
*/
|
|
bool monitor_set_disk_space_threshold(MXS_MONITOR *monitor, const char *disk_space_threshold);
|
|
|
|
MXS_END_DECLS
|