457 lines
		
	
	
		
			16 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			457 lines
		
	
	
		
			16 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| #pragma once
 | |
/*
 * Copyright (c) 2016 MariaDB Corporation Ab
 *
 * Use of this software is governed by the Business Source License included
 * in the LICENSE.TXT file and at www.mariadb.com/bsl11.
 *
 * Change Date: 2020-01-01
 *
 * On the date above, in accordance with the Business Source License, use
 * of this software will be governed by version 2 or later of the General
 * Public License.
 */
 | |
| 
 | |
/**
 * @file include/maxscale/monitor.h - The public monitor interface
 */
 | |
| 
 | |
| #include <maxscale/cdefs.h>
 | |
| 
 | |
| #include <openssl/sha.h>
 | |
| 
 | |
| #include <maxscale/config.h>
 | |
| #include <maxscale/dcb.h>
 | |
| #include <maxscale/server.h>
 | |
| #include <maxscale/jansson.h>
 | |
| #include <maxscale/protocol/mysql.h>
 | |
| 
 | |
| MXS_BEGIN_DECLS
 | |
| 
 | |
/* Forward declaration; struct mxs_monitor is defined further down in this header. */
struct mxs_monitor;
typedef struct mxs_monitor MXS_MONITOR;
 | |
| 
 | |
/**
 * An opaque type from which types specific for a particular
 * monitor can be derived.
 *
 * @note The struct has no members. In C an empty struct is a compiler
 *       extension (GCC and Clang accept it); standard C requires at least
 *       one member. NOTE(review): adding a member would change the size of
 *       this type, so check every derived type before doing so.
 */
typedef struct mxs_monitor_instance
{
} MXS_MONITOR_INSTANCE;
 | |
| 
 | |
| /**
 | |
|  * @verbatim
 | |
|  * The "module object" structure for a backend monitor module
 | |
|  *
 | |
|  * Monitor modules monitor the backend databases that MaxScale connects to.
 | |
|  * The information provided by a monitor is used in routing decisions.
 | |
|  *
 | |
|  * The entry points are:
 | |
|  *      startMonitor    Called by main to start the monitor
 | |
|  *      stopMonitor     Called by main to shut down and destroy a monitor
 | |
|  *      diagnostics     Called for diagnostic output
 | |
|  *
 | |
|  * startMonitor is called to start the monitoring process, it is called on the
 | |
|  * MaxScale main thread and is responsible for creating a thread for the monitor
 | |
|  * itself to run on. This should use the entry points defined in the thread.h
 | |
|  * header file rather than make direct calls to the operating system threading
 | |
|  * libraries. The return from startMonitor is a pointer that will be passed to
 | |
|  * all other monitor API calls.
 | |
|  *
 | |
|  * @endverbatim
 | |
|  *
 | |
|  * @see load_module
 | |
|  */
 | |
| typedef struct mxs_monitor_api
 | |
| {
 | |
|     /**
 | |
|      * @brief Create the monitor.
 | |
|      *
 | |
|      * This entry point is called once when MaxScale is started, for
 | |
|      * creating the monitor.
 | |
|      *
 | |
|      * If the function fails, MaxScale will not start. That is, it
 | |
|      * should fail only for fatal reasons such as not being able to
 | |
|      * create vital resources.
 | |
|      *
 | |
|      * @param monitor  The monitor object.
 | |
|      *
 | |
|      * @return Pointer to the monitor specific data. Will be stored
 | |
|      *         in @c monitor->handle.
 | |
|      */
 | |
|     MXS_MONITOR_INSTANCE *(*createInstance)(MXS_MONITOR *monitor);
 | |
| 
 | |
|     /**
 | |
|      * @brief Destroy the monitor.
 | |
|      *
 | |
|      * This entry point is called once when MaxScale is shutting down, iff
 | |
|      * the earlier call to @c initMonitor returned on object. The monitor should
 | |
|      * perform all needed cleanup.
 | |
|      *
 | |
|      * @param monitor  The monitor object.
 | |
|      */
 | |
|     void (*destroyInstance)(MXS_MONITOR_INSTANCE *monitor);
 | |
| 
 | |
|     /**
 | |
|      * @brief Start the monitor
 | |
|      *
 | |
|      * This entry point is called when the monitor is started. If the monitor
 | |
|      * requires polling of the servers, it should create a separate monitoring
 | |
|      * thread.
 | |
|      *
 | |
|      * @param monitor The monitor object
 | |
|      * @param params  Parameters for this monitor
 | |
|      *
 | |
|      * @return True, if the monitor could be started, false otherwise.
 | |
|      */
 | |
|     bool (*startMonitor)(MXS_MONITOR_INSTANCE *monitor,
 | |
|                          const MXS_CONFIG_PARAMETER *params);
 | |
| 
 | |
|     /**
 | |
|      * @brief Stop the monitor
 | |
|      *
 | |
|      * This entry point is called when the monitor is stopped. If the monitor
 | |
|      * uses a polling thread, the thread should be stopped.
 | |
|      *
 | |
|      * @param monitor The monitor object
 | |
|      */
 | |
|     void (*stopMonitor)(MXS_MONITOR_INSTANCE *monitor);
 | |
| 
 | |
|     /**
 | |
|      * @brief Write diagnostic information to a DCB.
 | |
|      *
 | |
|      * @param monitor  The monitor object.
 | |
|      * @param dcb      The dcb to write to.
 | |
|      */
 | |
|     void (*diagnostics)(const MXS_MONITOR_INSTANCE* monitor, DCB* dcb);
 | |
| 
 | |
|     /**
 | |
|      * @brief Return diagnostic information about the monitor
 | |
|      *
 | |
|      * @param monitor  The monitor object.
 | |
|      *
 | |
|      * @return A JSON object representing the state of the monitor
 | |
|      *
 | |
|      * @see jansson.h
 | |
|      */
 | |
|     json_t* (*diagnostics_json)(const MXS_MONITOR_INSTANCE *monitor);
 | |
| } MXS_MONITOR_API;
 | |
| 
 | |
/**
 * The monitor API version number. Any change to the monitor module API
 * must change these versions using the rules defined in modinfo.h.
 *
 * Expands to a brace-enclosed initializer with three integer values.
 */
#define MXS_MONITOR_VERSION {4, 0, 0}
 | |
| 
 | |
/**
 * Specifies capabilities specific for monitor.
 *
 * @see enum routing_capability
 *
 * @note The values of the capabilities here *must* be between 0x0001 0000 0000 0000
 *       and 0x0080 0000 0000 0000, that is, bits 48 to 55.
 */
typedef enum monitor_capability
{
    MCAP_TYPE_NONE = 0x0 // TODO: remove once monitor capabilities are defined
} monitor_capability_t;
 | |
| 
 | |
/** Monitor's base polling interval, in milliseconds */
#define MXS_MON_BASE_INTERVAL_MS 100

/*
 * Monitor run states.
 * NOTE(review): MXS_MONITOR_STOPPED (3) does not equal MONITOR_STATE_STOPPED
 * (0x04) from monitor_state_t; confirm which set callers are expected to use.
 */
#define MXS_MONITOR_RUNNING 1
#define MXS_MONITOR_STOPPING 2
#define MXS_MONITOR_STOPPED 3

#define MXS_MONITOR_DEFAULT_ID 1UL // unsigned long value

/** Sizes of the user and password buffers in struct mxs_monitor */
#define MAX_MONITOR_USER_LEN     512
#define MAX_MONITOR_PASSWORD_LEN 512
 | |
| 
 | |
/**
 * Monitor state bit mask values
 */
typedef enum
{
    MONITOR_STATE_ALLOC     = 0x00,
    MONITOR_STATE_RUNNING   = 0x01,
    MONITOR_STATE_STOPPING  = 0x02,
    MONITOR_STATE_STOPPED   = 0x04,
    MONITOR_STATE_FREED     = 0x08
} monitor_state_t;
 | |
| 
 | |
/* Return type of mon_ping_or_connect_to_db(). */
typedef enum
{
    /* Existing connection was ok and server replied to ping. */
    MONITOR_CONN_EXISTING_OK,
    /* No existing connection or no ping reply. New connection created successfully. */
    MONITOR_CONN_NEWCONN_OK,
    /* No existing connection or no ping reply. Server refused new connection. */
    MONITOR_CONN_REFUSED,
    /* No existing connection or no ping reply. Timeout on new connection. */
    MONITOR_CONN_TIMEOUT
} mxs_connect_result_t;
 | |
| 
 | |
/**
 * Monitor events
 *
 * Each event occupies its own bit so that several events can be combined
 * into one mask. The trailing comment on each enumerator is the event's
 * textual name as listed in mxs_monitor_event_enum_values.
 */
typedef enum
{
    UNDEFINED_EVENT   = 0,
    MASTER_DOWN_EVENT = (1 << 0),  /**< master_down */
    MASTER_UP_EVENT   = (1 << 1),  /**< master_up */
    SLAVE_DOWN_EVENT  = (1 << 2),  /**< slave_down */
    SLAVE_UP_EVENT    = (1 << 3),  /**< slave_up */
    SERVER_DOWN_EVENT = (1 << 4),  /**< server_down */
    SERVER_UP_EVENT   = (1 << 5),  /**< server_up */
    SYNCED_DOWN_EVENT = (1 << 6),  /**< synced_down */
    SYNCED_UP_EVENT   = (1 << 7),  /**< synced_up */
    DONOR_DOWN_EVENT  = (1 << 8),  /**< donor_down */
    DONOR_UP_EVENT    = (1 << 9),  /**< donor_up */
    NDB_DOWN_EVENT    = (1 << 10), /**< ndb_down */
    NDB_UP_EVENT      = (1 << 11), /**< ndb_up */
    LOST_MASTER_EVENT = (1 << 12), /**< lost_master */
    LOST_SLAVE_EVENT  = (1 << 13), /**< lost_slave */
    LOST_SYNCED_EVENT = (1 << 14), /**< lost_synced */
    LOST_DONOR_EVENT  = (1 << 15), /**< lost_donor */
    LOST_NDB_EVENT    = (1 << 16), /**< lost_ndb */
    NEW_MASTER_EVENT  = (1 << 17), /**< new_master */
    NEW_SLAVE_EVENT   = (1 << 18), /**< new_slave */
    NEW_SYNCED_EVENT  = (1 << 19), /**< new_synced */
    NEW_DONOR_EVENT   = (1 << 20), /**< new_donor */
    NEW_NDB_EVENT     = (1 << 21), /**< new_ndb */
} mxs_monitor_event_t;
 | |
| 
 | |
| /**
 | |
|  * The linked list of servers that are being monitored by the monitor module.
 | |
|  */
 | |
| typedef struct monitored_server
 | |
| {
 | |
|     SERVER *server;                 /**< The server being monitored */
 | |
|     MYSQL *con;                     /**< The MySQL connection */
 | |
|     bool log_version_err;
 | |
|     int mon_err_count;
 | |
|     uint64_t mon_prev_status;       /**< Status before starting the current monitor loop */
 | |
|     uint64_t pending_status;        /**< Status during current monitor loop */
 | |
|     bool new_event;                 /**< Whether an action was taken on the last event */
 | |
|     int64_t disk_space_checked;     /**< When was the disk space checked the last time */
 | |
|     struct monitored_server *next;  /**< The next server in the list */
 | |
| } MXS_MONITORED_SERVER;
 | |
| 
 | |
| /**
 | |
|  * Representation of the running monitor.
 | |
|  */
 | |
| struct mxs_monitor
 | |
| {
 | |
|     char *name;                   /**< The name of the monitor module */
 | |
|     char user[MAX_MONITOR_USER_LEN]; /*< Monitor username */
 | |
|     char password[MAX_MONITOR_PASSWORD_LEN]; /*< Monitor password */
 | |
|     SPINLOCK lock;
 | |
|     MXS_CONFIG_PARAMETER* parameters; /*< configuration parameters */
 | |
|     MXS_MONITORED_SERVER* monitored_servers; /*< List of servers the monitor monitors */
 | |
|     monitor_state_t state;        /**< The state of the monitor */
 | |
|     int connect_timeout;          /**< Connect timeout in seconds for mysql_real_connect */
 | |
|     int connect_attempts;      /**< How many times a connection is attempted */
 | |
|     int read_timeout;             /**< Timeout in seconds to read from the server.
 | |
|                                    * There are retries and the total effective timeout
 | |
|                                    * value is three times the option value.
 | |
|                                    */
 | |
|     int write_timeout;            /**< Timeout in seconds for each attempt to write to the server.
 | |
|                                    * There are retries and the total effective timeout value is
 | |
|                                    * two times the option value.
 | |
|                                    */
 | |
|     MXS_MONITOR_API *api;         /**< The monitor api */
 | |
|     char *module_name;            /**< Name of the monitor module */
 | |
|     MXS_MONITOR_INSTANCE *instance; /**< Instance returned from startMonitor */
 | |
|     size_t interval;              /**< The monitor interval */
 | |
|     int check_maintenance_flag;   /**< Set when admin requests a maintenance status change. */
 | |
|     bool active; /**< True if monitor is active */
 | |
|     time_t journal_max_age; /**< Maximum age of journal file */
 | |
|     uint32_t script_timeout; /**< Timeout in seconds for the monitor scripts */
 | |
|     uint8_t journal_hash[SHA_DIGEST_LENGTH]; /**< SHA1 hash of the latest written journal */
 | |
|     MxsDiskSpaceThreshold* disk_space_threshold; /**< Disk space thresholds */
 | |
|     int64_t disk_space_check_interval; /**< How often should a disk space check be made at most. */
 | |
|     uint64_t ticks; /**< Number of performed monitoring intervals */
 | |
|     struct mxs_monitor *next;     /**< Next monitor in the linked list */
 | |
| };
 | |
| 
 | |
| static const MXS_ENUM_VALUE mxs_monitor_event_enum_values[] =
 | |
| {
 | |
|     {"master_down", MASTER_DOWN_EVENT},
 | |
|     {"master_up", MASTER_UP_EVENT},
 | |
|     {"slave_down", SLAVE_DOWN_EVENT},
 | |
|     {"slave_up", SLAVE_UP_EVENT},
 | |
|     {"server_down", SERVER_DOWN_EVENT},
 | |
|     {"server_up", SERVER_UP_EVENT},
 | |
|     {"synced_down", SYNCED_DOWN_EVENT},
 | |
|     {"synced_up", SYNCED_UP_EVENT},
 | |
|     {"donor_down", DONOR_DOWN_EVENT},
 | |
|     {"donor_up", DONOR_UP_EVENT},
 | |
|     {"ndb_down", NDB_DOWN_EVENT},
 | |
|     {"ndb_up", NDB_UP_EVENT},
 | |
|     {"lost_master", LOST_MASTER_EVENT},
 | |
|     {"lost_slave", LOST_SLAVE_EVENT},
 | |
|     {"lost_synced", LOST_SYNCED_EVENT},
 | |
|     {"lost_donor", LOST_DONOR_EVENT},
 | |
|     {"lost_ndb", LOST_NDB_EVENT},
 | |
|     {"new_master", NEW_MASTER_EVENT},
 | |
|     {"new_slave", NEW_SLAVE_EVENT},
 | |
|     {"new_synced", NEW_SYNCED_EVENT},
 | |
|     {"new_donor", NEW_DONOR_EVENT},
 | |
|     {"new_ndb", NEW_NDB_EVENT},
 | |
|     {NULL}
 | |
| };
 | |
| 
 | |
/**
 * Default value for the `events` parameter: a comma-separated list of every
 * event name, i.e. all events are enabled.
 */
static const char MXS_MONITOR_EVENT_DEFAULT_VALUE[] =
    "master_down,master_up,slave_down,slave_up,"
    "server_down,server_up,synced_down,synced_up,"
    "donor_down,donor_up,ndb_down,ndb_up,"
    "lost_master,lost_slave,lost_synced,lost_donor,lost_ndb,"
    "new_master,new_slave,new_synced,new_donor,new_ndb";
 | |
| 
 | |
/**
 * Monitor configuration parameters names
 *
 * Only declared here; the definitions live in another translation unit.
 */
extern const char CN_BACKEND_CONNECT_ATTEMPTS[];
extern const char CN_BACKEND_CONNECT_TIMEOUT[];
extern const char CN_BACKEND_READ_TIMEOUT[];
extern const char CN_BACKEND_WRITE_TIMEOUT[];
extern const char CN_DISK_SPACE_CHECK_INTERVAL[];
extern const char CN_EVENTS[];
extern const char CN_JOURNAL_MAX_AGE[];
extern const char CN_MONITOR_INTERVAL[];
extern const char CN_SCRIPT[];
extern const char CN_SCRIPT_TIMEOUT[];
 | |
| 
 | |
| bool check_monitor_permissions(MXS_MONITOR* monitor, const char* query);
 | |
| 
 | |
| void monitor_clear_pending_status(MXS_MONITORED_SERVER *ptr, uint64_t bit);
 | |
| void monitor_set_pending_status(MXS_MONITORED_SERVER *ptr, uint64_t bit);
 | |
| void monitor_check_maintenance_requests(MXS_MONITOR *monitor);
 | |
| 
 | |
| bool mon_status_changed(MXS_MONITORED_SERVER* mon_srv);
 | |
| bool mon_print_fail_status(MXS_MONITORED_SERVER* mon_srv);
 | |
| 
 | |
| mxs_connect_result_t mon_ping_or_connect_to_db(MXS_MONITOR* mon, MXS_MONITORED_SERVER *database);
 | |
| bool mon_connection_is_ok(mxs_connect_result_t connect_result);
 | |
| void mon_log_connect_error(MXS_MONITORED_SERVER* database, mxs_connect_result_t rval);
 | |
| const char* mon_get_event_name(mxs_monitor_event_t event);
 | |
| 
 | |
| /**
 | |
|  * Alter monitor parameters
 | |
|  *
 | |
|  * The monitor parameters should not be altered while the monitor is
 | |
|  * running. To alter a parameter from outside a monitor module, stop the monitor,
 | |
|  * do the alteration and then restart the monitor. The monitor "owns" the parameters
 | |
|  * as long as it is running so if the monitor needs to change its own parameters,
 | |
|  * it can do it without stopping itself.
 | |
|  *
 | |
|  * @param monitor Monitor whose parameter is altered
 | |
|  * @param key     Parameter name to alter
 | |
|  * @param value   New value for the parameter
 | |
|  */
 | |
| void mon_alter_parameter(MXS_MONITOR* monitor, const char* key, const char* value);
 | |
| 
 | |
| /**
 | |
|  * @brief Handle state change events
 | |
|  *
 | |
|  * This function should be called by all monitors at the end of each monitoring
 | |
|  * cycle. This will log state changes and execute any scripts that should be executed.
 | |
|  *
 | |
|  * @param monitor Monitor object
 | |
|  * @param script Script to execute or NULL for no script
 | |
|  * @param events Enabled events
 | |
|  */
 | |
| void mon_process_state_changes(MXS_MONITOR *monitor, const char *script, uint64_t events);
 | |
| 
 | |
| /**
 | |
|  * @brief Hangup connections to failed servers
 | |
|  *
 | |
|  * Injects hangup events for DCB that are connected to servers that are down.
 | |
|  *
 | |
|  * @param monitor Monitor object
 | |
|  */
 | |
| void mon_hangup_failed_servers(MXS_MONITOR *monitor);
 | |
| 
 | |
| /**
 | |
|  * @brief Report query errors
 | |
|  *
 | |
|  * @param db Database where the query failed
 | |
|  */
 | |
| void mon_report_query_error(MXS_MONITORED_SERVER* db);
 | |
| 
 | |
| /**
 | |
|  * @brief Convert monitor to JSON
 | |
|  *
 | |
|  * @param monitor Monitor to convert
 | |
|  * @param host    Hostname of this server
 | |
|  *
 | |
|  * @return JSON representation of the monitor
 | |
|  */
 | |
| json_t* monitor_to_json(const MXS_MONITOR* monitor, const char* host);
 | |
| 
 | |
| /**
 | |
|  * @brief Convert all monitors to JSON
 | |
|  *
 | |
|  * @param host    Hostname of this server
 | |
|  *
 | |
|  * @return JSON array containing all monitors
 | |
|  */
 | |
| json_t* monitor_list_to_json(const char* host);
 | |
| 
 | |
| /**
 | |
|  * @brief Get links to monitors that relate to a server
 | |
|  *
 | |
|  * @param server Server to inspect
 | |
|  * @param host   Hostname of this server
 | |
|  *
 | |
|  * @return Array of monitor links or NULL if no relations exist
 | |
|  */
 | |
| json_t* monitor_relations_to_server(const SERVER* server, const char* host);
 | |
| 
 | |
| /**
 | |
|  * @brief Store a journal of server states
 | |
|  *
 | |
|  * @param monitor Monitor to journal
 | |
|  * @param master  The current master server or NULL if no master exists
 | |
|  */
 | |
| void store_server_journal(MXS_MONITOR *monitor, MXS_MONITORED_SERVER *master);
 | |
| 
 | |
| /**
 | |
|  * @brief Load a journal of server states
 | |
|  *
 | |
|  * @param monitor Monitor where journal is loaded
 | |
|  * @param master  Set to point to the current master
 | |
|  */
 | |
| void load_server_journal(MXS_MONITOR *monitor, MXS_MONITORED_SERVER **master);
 | |
| 
 | |
| /**
 | |
|  * Find the monitored server representing the server.
 | |
|  *
 | |
|  * @param mon Cluster monitor
 | |
|  * @param search_server Server to search for
 | |
|  * @return Found monitored server or NULL if not found
 | |
|  */
 | |
| MXS_MONITORED_SERVER* mon_get_monitored_server(const MXS_MONITOR* mon, SERVER* search_server);
 | |
| 
 | |
| /**
 | |
|  * Get an array of monitored servers. If a server defined in the config setting is not monitored by
 | |
|  * the given monitor, that server is ignored and not inserted into the output array.
 | |
|  *
 | |
|  * @param params Config parameters
 | |
|  * @param key Setting name
 | |
|  * @param mon Monitor which should monitor the servers
 | |
|  * @param monitored_servers_out Where to save output array. The caller should free the array, but not the
 | |
|  * elements. The output must contain NULL before calling this function.
 | |
|  * @return Output array size.
 | |
|  */
 | |
| int mon_config_get_servers(const MXS_CONFIG_PARAMETER* params, const char* key, const MXS_MONITOR* mon,
 | |
|                            MXS_MONITORED_SERVER*** monitored_array_out);
 | |
| 
 | |
| /**
 | |
|  * @brief Set the disk space threshold of a monitor
 | |
|  *
 | |
|  * @param server                The monitor.
 | |
|  * @param disk_space_threshold  The disk space threshold as specified in the config file.
 | |
|  *
 | |
|  * @return True, if the provided string is valid and the threshold could be set.
 | |
|  */
 | |
| bool monitor_set_disk_space_threshold(MXS_MONITOR *monitor, const char *disk_space_threshold);
 | |
| 
 | |
| MXS_END_DECLS
 | 
