The test checks that failover works even when the master of the monitored cluster is a slave to an external masters. The test also verifies that the servers do not get unexpected status labels.
		
			
				
	
	
		
			197 lines
		
	
	
		
			6.1 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			197 lines
		
	
	
		
			6.1 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
#include "fail_switch_rejoin_common.cpp"
 | 
						|
#include <sstream>
 | 
						|
#include <iostream>
 | 
						|
 | 
						|
using std::stringstream;
 | 
						|
using std::cout;
 | 
						|
using std::endl;
 | 
						|
 | 
						|
void replicate_from(TestConnections& test, int server_ind, int target_ind)
 | 
						|
{
 | 
						|
    test.repl->replicate_from(server_ind, target_ind);
 | 
						|
}
 | 
						|
 | 
						|
void reset_replication(TestConnections& test)
 | 
						|
{
 | 
						|
    int master_id = get_master_server_id(test);
 | 
						|
    cout << "Reseting..." << endl;
 | 
						|
    test.repl->start_node(0, (char*)"");
 | 
						|
    sleep(5);
 | 
						|
    test.repl->connect();
 | 
						|
    get_output(test);
 | 
						|
    // First set the old master to replicate from current master.
 | 
						|
    if (test.global_result == 0)
 | 
						|
    {
 | 
						|
        int ind = master_id - 1;
 | 
						|
        replicate_from(test, 0, ind);
 | 
						|
        sleep(3);
 | 
						|
        get_output(test);
 | 
						|
        int ec;
 | 
						|
        stringstream switchover;
 | 
						|
        switchover << "maxadmin call command mysqlmon switchover MySQL-Monitor server1 server" << master_id;
 | 
						|
        test.maxscales->ssh_node_output(0, switchover.str().c_str() , true, &ec);
 | 
						|
        sleep(3);
 | 
						|
        master_id = get_master_server_id(test);
 | 
						|
        cout << "Master server id is now back to " << master_id << endl;
 | 
						|
        test.assert(master_id == 1, "Switchover back to server1 failed");
 | 
						|
    }
 | 
						|
    get_output(test);
 | 
						|
    StringSet node_states;
 | 
						|
    for (int i = 2; i < 4; i++)
 | 
						|
    {
 | 
						|
        stringstream servername;
 | 
						|
        servername << "server" << i;
 | 
						|
        node_states = test.get_server_status(servername.str().c_str());
 | 
						|
        bool states_ok = (node_states.find("Slave") != node_states.end());
 | 
						|
        test.assert(states_ok, "Server %d is not replicating.", i);
 | 
						|
    }
 | 
						|
}
 | 
						|
 | 
						|
int prepare_test_1(TestConnections& test)
 | 
						|
{
 | 
						|
    cout << LINE << endl;
 | 
						|
    cout << "Part 1: Stopping master and waiting for failover. Check that another server is promoted." <<
 | 
						|
        endl;
 | 
						|
    cout << LINE << endl;
 | 
						|
    int node0_id = test.repl->get_server_id(0); // Read master id now before shutdown.
 | 
						|
    test.repl->stop_node(0);
 | 
						|
    return node0_id;
 | 
						|
}
 | 
						|
 | 
						|
void check_test_1(TestConnections& test, int node0_id)
 | 
						|
{
 | 
						|
    get_output(test);
 | 
						|
    int master_id = get_master_server_id(test);
 | 
						|
    cout << "Master server id is " << master_id << endl;
 | 
						|
    test.assert(master_id > 0 && master_id != node0_id, "Master did not change or no master detected.");
 | 
						|
    if (test.global_result == 0)
 | 
						|
    {
 | 
						|
        check(test);
 | 
						|
    }
 | 
						|
    // Reset state
 | 
						|
    reset_replication(test);
 | 
						|
}
 | 
						|
 | 
						|
void prepare_test_2(TestConnections& test)
 | 
						|
{
 | 
						|
    cout << LINE << endl;
 | 
						|
    cout << "Part 2: Disable replication on server 2 and kill master, check that server 3 or 4 is promoted."
 | 
						|
        << endl;
 | 
						|
    cout << LINE << endl;
 | 
						|
    test.repl->connect();
 | 
						|
    check(test);
 | 
						|
    sleep(1);
 | 
						|
    print_gtids(test);
 | 
						|
    test.try_query(test.repl->nodes[1], "STOP SLAVE;");
 | 
						|
    test.try_query(test.repl->nodes[1], "RESET SLAVE ALL;");
 | 
						|
    sleep(1);
 | 
						|
    get_output(test);
 | 
						|
    if (test.global_result == 0)
 | 
						|
    {
 | 
						|
        cout << "Stopping master." << endl;
 | 
						|
        test.repl->stop_node(0);
 | 
						|
    }
 | 
						|
}
 | 
						|
 | 
						|
void check_test_2(TestConnections& test)
 | 
						|
{
 | 
						|
    get_output(test);
 | 
						|
    int master_id = get_master_server_id(test);
 | 
						|
    cout << "Master server id is " << master_id << endl;
 | 
						|
    bool success = (master_id > 0 &&
 | 
						|
                    (master_id == test.repl->get_server_id(2) || master_id == test.repl->get_server_id(3)));
 | 
						|
    test.assert(success, WRONG_SLAVE);
 | 
						|
    if (test.global_result == 0)
 | 
						|
    {
 | 
						|
        check(test);
 | 
						|
    }
 | 
						|
 | 
						|
    // Reset state
 | 
						|
    replicate_from(test, 1, master_id - 1);
 | 
						|
    sleep(3);
 | 
						|
    get_output(test);
 | 
						|
    StringSet node_states = test.get_server_status("server2");
 | 
						|
    test.assert(node_states.find("Slave") != node_states.end(), "Server 2 is not replicating.");
 | 
						|
    if (test.global_result == 0)
 | 
						|
    {
 | 
						|
        reset_replication(test);
 | 
						|
    }
 | 
						|
}
 | 
						|
 | 
						|
void prepare_test_3(TestConnections& test)
 | 
						|
{
 | 
						|
    cout << LINE << "\n";
 | 
						|
    cout << "Part 3: Disable log_bin on server 2, making it invalid for promotion. Enable log-slave-updates "
 | 
						|
        " on servers 2 and 4. Disable log-slave-updates on server 3. Check that server 4 is promoted on"
 | 
						|
        " master failure." << "\n" << LINE << endl;
 | 
						|
    get_output(test);
 | 
						|
    test.maxscales->stop_maxscale(0);
 | 
						|
    test.repl->stop_node(1);
 | 
						|
    test.repl->stop_node(2);
 | 
						|
    test.repl->stop_node(3);
 | 
						|
    test.repl->stash_server_settings(1);
 | 
						|
    test.repl->stash_server_settings(2);
 | 
						|
    test.repl->stash_server_settings(3);
 | 
						|
 | 
						|
    test.repl->disable_server_setting(1, "log-bin");
 | 
						|
    test.repl->disable_server_setting(1, "log_bin");
 | 
						|
    test.repl->disable_server_setting(2, "log-slave-updates");
 | 
						|
    test.repl->disable_server_setting(2, "log_slave_updates");
 | 
						|
    const char* log_slave = "log-slave-updates=1";
 | 
						|
    test.repl->add_server_setting(1, log_slave);
 | 
						|
    test.repl->add_server_setting(3, log_slave);
 | 
						|
 | 
						|
    test.repl->start_node(1, (char *) "");
 | 
						|
    test.repl->start_node(2, (char *) "");
 | 
						|
    test.repl->start_node(3, (char *) "");
 | 
						|
    test.maxscales->start_maxscale(0);
 | 
						|
    sleep(2);
 | 
						|
 | 
						|
    test.repl->connect();
 | 
						|
    test.tprintf("Settings changed.");
 | 
						|
    get_output(test);
 | 
						|
    print_gtids(test);
 | 
						|
    check(test);
 | 
						|
 | 
						|
    if (test.global_result == 0)
 | 
						|
    {
 | 
						|
        cout << "Stopping master." << endl;
 | 
						|
        test.repl->stop_node(0);
 | 
						|
    }
 | 
						|
}
 | 
						|
 | 
						|
void check_test_3(TestConnections& test)
 | 
						|
{
 | 
						|
    check(test);
 | 
						|
    get_output(test);
 | 
						|
    int master_id = get_master_server_id(test);
 | 
						|
 | 
						|
    // Because servers have been restarted, redo connections.
 | 
						|
    test.repl->connect();
 | 
						|
    cout << "Master server id is " << master_id << endl;
 | 
						|
    test.assert(master_id > 0 && master_id == test.repl->get_server_id(3), WRONG_SLAVE);
 | 
						|
    print_gtids(test);
 | 
						|
 | 
						|
    reset_replication(test);
 | 
						|
    get_output(test);
 | 
						|
 | 
						|
    // Restore server 2 and 4 settings. Because server 1 is now the master, shutting it down causes
 | 
						|
    // another failover. Prevent this by stopping maxscale.
 | 
						|
    test.tprintf("Restoring server settings.");
 | 
						|
    test.maxscales->stop_maxscale(0);
 | 
						|
    test.repl->stop_node(1);
 | 
						|
    test.repl->stop_node(2);
 | 
						|
    test.repl->stop_node(3);
 | 
						|
    sleep(4);
 | 
						|
 | 
						|
    test.repl->restore_server_settings(1);
 | 
						|
    test.repl->restore_server_settings(2);
 | 
						|
    test.repl->restore_server_settings(3);
 | 
						|
 | 
						|
    test.repl->start_node(1, (char *) "");
 | 
						|
    test.repl->start_node(2, (char *) "");
 | 
						|
    test.repl->start_node(3, (char *) "");
 | 
						|
    sleep(2);
 | 
						|
    test.maxscales->start_maxscale(0);
 | 
						|
}
 |