#!/usr/bin/env python # -*- coding: utf-8 -*- ####====XXXX======######==== I am a splitter ====######======XXXX====#### #filename:__init__.py ##!/usr/bin/env python ## -*- coding: utf-8 -*- ####====XXXX======######==== I am a splitter ====######======XXXX====#### #filename:actions.py ##!/usr/bin/env python ## -*- coding: utf-8 -*- # #import time #import re #import json #import traceback #import sys #import mysql.connector #from mysql.connector import errorcode #from my_error import MyError #import logging # #class SqlItem: # action_sql = None # rollback_sql = None # def __init__(self, action_sql, rollback_sql): # self.action_sql = action_sql # self.rollback_sql = rollback_sql # #g_succ_sql_list = [] #g_commit_sql_list = [] # #def refresh_commit_sql_list(): # global g_succ_sql_list # global g_commit_sql_list # if len(g_commit_sql_list) < len(g_succ_sql_list): # for i in range(len(g_commit_sql_list), len(g_succ_sql_list)): # g_commit_sql_list.append(g_succ_sql_list[i]) # #def get_succ_sql_list_str(): # global g_succ_sql_list # ret_str = '' # for i in range(0, len(g_succ_sql_list)): # if i > 0: # ret_str += '\n' # ret_str += g_succ_sql_list[i].action_sql + ';' # return ret_str # #def get_commit_sql_list_str(): # global g_commit_sql_list # ret_str = '' # for i in range(0, len(g_commit_sql_list)): # if i > 0: # ret_str += '\n' # ret_str += g_commit_sql_list[i].action_sql + ';' # return ret_str # #def get_rollback_sql_file_lines_str(): # global g_commit_sql_list # ret_str = '' # g_commit_sql_list_len = len(g_commit_sql_list) # for i in range(0, g_commit_sql_list_len): # if i > 0: # ret_str += '\n' # idx = g_commit_sql_list_len - 1 - i # ret_str += '/*\n' + g_commit_sql_list[idx].action_sql + ';\n*/\n' # ret_str += g_commit_sql_list[idx].rollback_sql + ';' # return ret_str # #def dump_rollback_sql_to_file(rollback_sql_filename): # logging.info('===================== begin to dump rollback sql file ============================') # rollback_sql_file = open(rollback_sql_filename, 'w') # rollback_sql_file.write('# 此文件是回滚用的sql。\n') # rollback_sql_file.write('# 注释的sql是已经成功commit的sql,它的下一条没被注释的sql则是对应的回滚sql。回滚的sql的排序跟commit的sql的排序刚好相反。\n') # rollback_sql_file.write('# 跑升级脚本失败的时候可以参考本文件来进行回滚。\n') # rollback_sql_file.write('\n') # rollback_sql_file_lines_str = get_rollback_sql_file_lines_str() # rollback_sql_file.write(rollback_sql_file_lines_str) # rollback_sql_file.close() # logging.info('=========== succeed to dump rollback sql file to: ' + rollback_sql_filename + '===============') # #def check_is_ddl_sql(sql): # word_list = sql.split() # if len(word_list) < 1: # raise MyError('sql is empty, sql="{0}"'.format(sql)) # key_word = word_list[0].lower() # if 'create' != key_word and 'alter' != key_word: # raise MyError('sql must be ddl, key_word="{0}", sql="{1}"'.format(key_word, sql)) # #def check_is_query_sql(sql): # word_list = sql.split() # if len(word_list) < 1: # raise MyError('sql is empty, sql="{0}"'.format(sql)) # key_word = word_list[0].lower() # if 'select' != key_word and 'show' != key_word and 'desc' != key_word: # raise MyError('sql must be query, key_word="{0}", sql="{1}"'.format(key_word, sql)) # #def check_is_update_sql(sql): # word_list = sql.split() # if len(word_list) < 1: # raise MyError('sql is empty, sql="{0}"'.format(sql)) # key_word = word_list[0].lower() # if 'insert' != key_word and 'update' != key_word and 'replace' != key_word and 'set' != key_word and 'delete' != key_word: # # 还有类似这种:select @current_ts := now() # if not (len(word_list) >= 3 and 'select' == word_list[0].lower()\ # and word_list[1].lower().startswith('@') and ':=' == word_list[2].lower()): # raise MyError('sql must be update, key_word="{0}", sql="{1}"'.format(key_word, sql)) # #def set_parameter(cur, parameter, value): # sql = """alter system set {0} = '{1}'""".format(parameter, value) # logging.info(sql) # cur.execute(sql) # wait_parameter_sync(cur, parameter, value) # #def get_ori_enable_ddl(cur): # ori_value_str = fetch_ori_enable_ddl(cur) # wait_parameter_sync(cur, 'enable_ddl', ori_value_str) # ori_value = (ori_value_str == 'True') # return ori_value # #def fetch_ori_enable_ddl(cur): # ori_value = 'True' # sql = """select value from oceanbase.__all_sys_parameter where name = 'enable_ddl'""" # # logging.info(sql) # cur.execute(sql) # result = cur.fetchall() # # if len(result) == 0: # # means default value, is True # ori_value = 'True' # elif len(result) != 1 or len(result[0]) != 1: # logging.exception('result cnt not match') # raise e # elif result[0][0].lower() in ["1", "true", "on", "yes", 't']: # ori_value = 'True' # elif result[0][0].lower() in ["0", "false", "off", "no", 'f']: # ori_value = 'False' # else: # logging.exception("""result value is invalid, result:{0}""".format(result[0][0])) # raise e # return ori_value # #def wait_parameter_sync(cur, key, value): # sql = """select count(*) as cnt from oceanbase.__all_virtual_sys_parameter_stat # where name = '{0}' and value != '{1}'""".format(key, value) # times = 10 # while times > 0: # logging.info(sql) # cur.execute(sql) # result = cur.fetchall() # if len(result) != 1 or len(result[0]) != 1: # logging.exception('result cnt not match') # raise e # elif result[0][0] == 0: # logging.info("""{0} is sync, value is {1}""".format(key, value)) # break # else: # logging.info("""{0} is not sync, value should be {1}""".format(key, value)) # # times -= 1 # if times == 0: # logging.exception("""check {0}:{1} sync timeout""".format(key, value)) # raise e # time.sleep(5) # #class Cursor: # __cursor = None # def __init__(self, cursor): # self.__cursor = cursor # def exec_sql(self, sql, print_when_succ = True): # try: # self.__cursor.execute(sql) # rowcount = self.__cursor.rowcount # if True == print_when_succ: # logging.info('succeed to execute sql: %s, rowcount = %d', sql, rowcount) # return rowcount # except mysql.connector.Error, e: # logging.exception('mysql connector error, fail to execute sql: %s', sql) # raise e # except Exception, e: # logging.exception('normal error, fail to execute sql: %s', sql) # raise e # def exec_query(self, sql, print_when_succ = True): # try: # self.__cursor.execute(sql) # results = self.__cursor.fetchall() # rowcount = self.__cursor.rowcount # if True == print_when_succ: # logging.info('succeed to execute query: %s, rowcount = %d', sql, rowcount) # return (self.__cursor.description, results) # except mysql.connector.Error, e: # logging.exception('mysql connector error, fail to execute sql: %s', sql) # raise e # except Exception, e: # logging.exception('normal error, fail to execute sql: %s', sql) # raise e # #class DDLCursor: # _cursor = None # def __init__(self, cursor): # self._cursor = Cursor(cursor) # def exec_ddl(self, sql, print_when_succ = True): # try: # # 这里检查是不是ddl,不是ddl就抛错 # check_is_ddl_sql(sql) # return self._cursor.exec_sql(sql, print_when_succ) # except Exception, e: # logging.exception('fail to execute ddl: %s', sql) # raise e # #class QueryCursor: # _cursor = None # def __init__(self, cursor): # self._cursor = Cursor(cursor) # def exec_query(self, sql, print_when_succ = True): # try: # # 这里检查是不是query,不是query就抛错 # check_is_query_sql(sql) # return self._cursor.exec_query(sql, print_when_succ) # except Exception, e: # logging.exception('fail to execute dml query: %s', sql) # raise e # #class DMLCursor(QueryCursor): # def exec_update(self, sql, print_when_succ = True): # try: # # 这里检查是不是update,不是update就抛错 # check_is_update_sql(sql) # return self._cursor.exec_sql(sql, print_when_succ) # except Exception, e: # logging.exception('fail to execute dml update: %s', sql) # raise e # #class BaseDDLAction(): # __ddl_cursor = None # _query_cursor = None # def __init__(self, cursor): # self.__ddl_cursor = DDLCursor(cursor) # self._query_cursor = QueryCursor(cursor) # def do_action(self): # global g_succ_sql_list # action_sql = self.get_action_ddl() # rollback_sql = self.get_rollback_sql() # self.__ddl_cursor.exec_ddl(action_sql) # g_succ_sql_list.append(SqlItem(action_sql, rollback_sql)) # # ddl马上就提交了,因此刷新g_commit_sql_list # refresh_commit_sql_list() # #class BaseDMLAction(): # __dml_cursor = None # _query_cursor = None # def __init__(self, cursor): # self.__dml_cursor = DMLCursor(cursor) # self._query_cursor = QueryCursor(cursor) # def do_action(self): # global g_succ_sql_list # action_sql = self.get_action_dml() # rollback_sql = self.get_rollback_sql() # self.__dml_cursor.exec_update(action_sql) # g_succ_sql_list.append(SqlItem(action_sql, rollback_sql)) # #class BaseEachTenantDMLAction(): # __dml_cursor = None # _query_cursor = None # _tenant_id_list = None # _cursor = None # def __init__(self, cursor, tenant_id_list): # self.__dml_cursor = DMLCursor(cursor) # self._query_cursor = QueryCursor(cursor) # self._tenant_id_list = tenant_id_list # self._cursor = Cursor(cursor) # def get_tenant_id_list(self): # return self._tenant_id_list # def do_each_tenant_action(self, tenant_id): # global g_succ_sql_list # action_sql = self.get_each_tenant_action_dml(tenant_id) # rollback_sql = self.get_each_tenant_rollback_sql(tenant_id) # self.__dml_cursor.exec_update(action_sql) # g_succ_sql_list.append(SqlItem(action_sql, rollback_sql)) # def change_tenant(self, tenant_id): # self._cursor.exec_sql("alter system change tenant tenant_id = {0}".format(tenant_id)) # (desc, results) = self._query_cursor.exec_query("select effective_tenant_id()") # if (1 != len(results) or 1 != len(results[0])): # raise MyError("results cnt not match") # elif (tenant_id != results[0][0]): # raise MyError("change tenant failed, effective_tenant_id:{0}, tenant_id:{1}" # .format(results[0][0], tenant_id)) # #class BaseEachTenantDDLAction(): # __dml_cursor = None # _query_cursor = None # _tenant_id_list = None # _all_table_name = "__all_table" # def __init__(self, cursor, tenant_id_list): # self.__ddl_cursor = DDLCursor(cursor) # self._query_cursor = QueryCursor(cursor) # self._tenant_id_list = tenant_id_list # def get_tenant_id_list(self): # return self._tenant_id_list # def get_all_table_name(self): # return self._all_table_name # def set_all_table_name(self, table_name): # self._all_table_name = table_name # def do_each_tenant_action(self, tenant_id): # global g_succ_sql_list # action_sql = self.get_each_tenant_action_ddl(tenant_id) # rollback_sql = self.get_each_tenant_rollback_sql(tenant_id) # self.__ddl_cursor.exec_ddl(action_sql) # g_succ_sql_list.append(SqlItem(action_sql, rollback_sql)) # # ddl马上就提交了,因此刷新g_commit_sql_list # refresh_commit_sql_list() # #def actions_cls_compare(x, y): # diff = x.get_seq_num() - y.get_seq_num() # if 0 == diff: # raise MyError('seq num is equal') # elif diff < 0: # return -1 # else: # return 1 # #def reflect_action_cls_list(action_module, action_name_prefix): # action_cls_list = [] # cls_from_actions = dir(action_module) # for cls in cls_from_actions: # if cls.startswith(action_name_prefix): # action_cls = getattr(action_module, cls) # action_cls_list.append(action_cls) # action_cls_list.sort(actions_cls_compare) # return action_cls_list # #def fetch_observer_version(query_cur): # (desc, results) = query_cur.exec_query("""select distinct value from __all_virtual_sys_parameter_stat where name='min_observer_version'""") # if len(results) != 1: # raise MyError('query results count is not 1') # else: # logging.info('get observer version success, version = {0}'.format(results[0][0])) # return results[0][0] # #def fetch_tenant_ids(query_cur): # try: # tenant_id_list = [] # (desc, results) = query_cur.exec_query("""select distinct tenant_id from oceanbase.__all_tenant order by tenant_id desc""") # for r in results: # tenant_id_list.append(r[0]) # return tenant_id_list # except Exception, e: # logging.exception('fail to fetch distinct tenant ids') # raise e # ####====XXXX======######==== I am a splitter ====######======XXXX====#### #filename:config.py ##!/usr/bin/env python ## -*- coding: utf-8 -*- # #pre_upgrade_log_filename = 'upgrade_pre.log' #pre_upgrade_sql_filename = 'upgrade_sql_pre.txt' #pre_upgrade_rollback_sql_filename = 'rollback_sql_pre.txt' # #post_upgrade_log_filename = 'upgrade_post.log' #post_upgrade_sql_filename = 'upgrade_sql_post.txt' #post_upgrade_rollback_sql_filename = 'rollback_sql_post.txt' # ####====XXXX======######==== I am a splitter ====######======XXXX====#### #filename:do_upgrade_post.py ##!/usr/bin/env python ## -*- coding: utf-8 -*- # #from my_error import MyError #import sys #import mysql.connector #from mysql.connector import errorcode #import logging #import json #import config #import opts #import run_modules #import actions #import special_upgrade_action_post # ## 由于用了/*+read_consistency(WEAK) */来查询,因此升级期间不能允许创建或删除租户 # #class UpgradeParams: # log_filename = config.post_upgrade_log_filename # sql_dump_filename = config.post_upgrade_sql_filename # rollback_sql_filename = config.post_upgrade_rollback_sql_filename # #def config_logging_module(log_filenamme): # logging.basicConfig(level=logging.INFO,\ # format='[%(asctime)s] %(levelname)s %(filename)s:%(lineno)d %(message)s',\ # datefmt='%Y-%m-%d %H:%M:%S',\ # filename=log_filenamme,\ # filemode='w') # # 定义日志打印格式 # formatter = logging.Formatter('[%(asctime)s] %(levelname)s %(filename)s:%(lineno)d %(message)s', '%Y-%m-%d %H:%M:%S') # ####################################### # # 定义一个Handler打印INFO及以上级别的日志到sys.stdout # stdout_handler = logging.StreamHandler(sys.stdout) # stdout_handler.setLevel(logging.INFO) # # 设置日志打印格式 # stdout_handler.setFormatter(formatter) # # 将定义好的stdout_handler日志handler添加到root logger # logging.getLogger('').addHandler(stdout_handler) # # #def dump_sql_to_file(dump_filename, tenant_id_list): # normal_ddls_str = normal_ddl_actions_post.get_normal_ddl_actions_sqls_str() # normal_dmls_str = normal_dml_actions_post.get_normal_dml_actions_sqls_str() # each_tenant_dmls_str = each_tenant_dml_actions_post.get_each_tenant_dml_actions_sqls_str(tenant_id_list) # dump_file = open(dump_filename, 'w') # dump_file.write('# 以下是upgrade_post.py脚本中的步骤\n') # dump_file.write('# 仅供upgrade_post.py脚本运行失败需要人肉的时候参考\n') # dump_file.write('\n\n') # dump_file.write('# normal ddl\n') # dump_file.write(normal_ddls_str + '\n') # dump_file.write('\n\n') # dump_file.write('# normal dml\n') # dump_file.write(normal_dmls_str + '\n') # dump_file.write('\n\n') # dump_file.write('# each tenant dml\n') # dump_file.write(each_tenant_dmls_str + '\n') # dump_file.write('\n\n') # dump_file.write('# do special upgrade actions\n') # dump_file.write('# please run ./upgrade_post.py -h [host] -P [port] -u [user] -p [password] -m special_action\n') # dump_file.write('\n\n') # dump_file.close() # #def check_before_upgrade(query_cur, upgrade_params): # check_server_version(query_cur) # return # ## 混部阶段执行POST脚本,会导致租户级系统表创建可能多数派处于旧binary而被GC, ## 需要规避OCP升级流程异常导致的混部阶段执行POST脚本的问题 #def check_server_version(query_cur): # sql = """select distinct(substring_index(build_version, '_', 1)) from __all_server"""; # (desc, results) = query_cur.exec_query(sql); # if len(results) != 1: # raise MyError("servers build_version not match") # else: # logging.info("check server version success") # #def print_stats(): # logging.info('==================================================================================') # logging.info('============================== STATISTICS BEGIN ==================================') # logging.info('==================================================================================') # logging.info('succeed run sql(except sql of special actions): \n\n%s\n', actions.get_succ_sql_list_str()) # logging.info('commited sql(except sql of special actions): \n\n%s\n', actions.get_commit_sql_list_str()) # logging.info('==================================================================================') # logging.info('=============================== STATISTICS END ===================================') # logging.info('==================================================================================') # #def do_upgrade(my_host, my_port, my_user, my_passwd, my_module_set, upgrade_params): # try: # conn = mysql.connector.connect(user = my_user, # password = my_passwd, # host = my_host, # port = my_port, # database = 'oceanbase', # raise_on_warnings = True) # cur = conn.cursor(buffered=True) # try: # query_cur = actions.QueryCursor(cur) # # 开始升级前的检查 # check_before_upgrade(query_cur, upgrade_params) # # 获取租户id列表 # tenant_id_list = actions.fetch_tenant_ids(query_cur) # if len(tenant_id_list) <= 0: # logging.error('distinct tenant id count is <= 0, tenant_id_count: %d', len(tenant_id_list)) # raise MyError('no tenant id') # logging.info('there has %s distinct tenant ids: [%s]', len(tenant_id_list), ','.join(str(tenant_id) for tenant_id in tenant_id_list)) # conn.commit() # if run_modules.MODULE_SPECIAL_ACTION in my_module_set: # logging.info('================begin to run special action===============') # conn.autocommit = True # special_upgrade_action_post.do_special_upgrade(conn, cur, tenant_id_list, my_user, my_passwd) # conn.autocommit = False # actions.refresh_commit_sql_list() # logging.info('================succeed to commit special action===============') # except Exception, e: # logging.exception('run error') # raise e # finally: # # 打印统计信息 # print_stats() # # 将回滚sql写到文件中 # actions.dump_rollback_sql_to_file(upgrade_params.rollback_sql_filename) # cur.close() # conn.close() # except mysql.connector.Error, e: # logging.exception('connection error') # raise e # except Exception, e: # logging.exception('normal error') # raise e # #def do_upgrade_by_argv(argv): # upgrade_params = UpgradeParams() # opts.change_opt_defult_value('log-file', upgrade_params.log_filename) # opts.parse_options(argv) # if not opts.has_no_local_opts(): # opts.deal_with_local_opts() # else: # opts.check_db_client_opts() # log_filename = opts.get_opt_log_file() # upgrade_params.log_filename = log_filename # # 日志配置放在这里是为了前面的操作不要覆盖掉日志文件 # config_logging_module(upgrade_params.log_filename) # try: # host = opts.get_opt_host() # port = int(opts.get_opt_port()) # user = opts.get_opt_user() # password = opts.get_opt_password() # cmd_module_str = opts.get_opt_module() # module_set = set([]) # all_module_set = run_modules.get_all_module_set() # cmd_module_list = cmd_module_str.split(',') # for cmd_module in cmd_module_list: # if run_modules.ALL_MODULE == cmd_module: # module_set = module_set | all_module_set # elif cmd_module in all_module_set: # module_set.add(cmd_module) # else: # raise MyError('invalid module: {0}'.format(cmd_module)) # logging.info('parameters from cmd: host=\"%s\", port=%s, user=\"%s\", password=\"%s\", module=\"%s\", log-file=\"%s\"',\ # host, port, user, password, module_set, log_filename) # do_upgrade(host, port, user, password, module_set, upgrade_params) # except mysql.connector.Error, e: # logging.exception('mysql connctor error') # logging.exception('run error, maybe you can reference ' + upgrade_params.rollback_sql_filename + ' to rollback it') # raise e # except Exception, e: # logging.exception('normal error') # logging.exception('run error, maybe you can reference ' + upgrade_params.rollback_sql_filename + ' to rollback it') # raise e # # # ####====XXXX======######==== I am a splitter ====######======XXXX====#### #filename:do_upgrade_pre.py ##!/usr/bin/env python ## -*- coding: utf-8 -*- # #from my_error import MyError #import sys #import mysql.connector #from mysql.connector import errorcode #import logging # #import config #import opts #import run_modules #import actions #import special_upgrade_action_pre # ## 由于用了/*+read_consistency(WEAK) */来查询,因此升级期间不能允许创建或删除租户 # #class UpgradeParams: # log_filename = config.pre_upgrade_log_filename # sql_dump_filename = config.pre_upgrade_sql_filename # rollback_sql_filename = config.pre_upgrade_rollback_sql_filename # #def config_logging_module(log_filenamme): # logging.basicConfig(level=logging.INFO,\ # format='[%(asctime)s] %(levelname)s %(filename)s:%(lineno)d %(message)s',\ # datefmt='%Y-%m-%d %H:%M:%S',\ # filename=log_filenamme,\ # filemode='w') # # 定义日志打印格式 # formatter = logging.Formatter('[%(asctime)s] %(levelname)s %(filename)s:%(lineno)d %(message)s', '%Y-%m-%d %H:%M:%S') # ####################################### # # 定义一个Handler打印INFO及以上级别的日志到sys.stdout # stdout_handler = logging.StreamHandler(sys.stdout) # stdout_handler.setLevel(logging.INFO) # # 设置日志打印格式 # stdout_handler.setFormatter(formatter) # # 将定义好的stdout_handler日志handler添加到root logger # logging.getLogger('').addHandler(stdout_handler) # #def dump_sql_to_file(cur, query_cur, dump_filename, tenant_id_list, update_sys_var_list, add_sys_var_list): # normal_ddls_str = normal_ddl_actions_pre.get_normal_ddl_actions_sqls_str(query_cur) # normal_dmls_str = normal_dml_actions_pre.get_normal_dml_actions_sqls_str() # each_tenant_dmls_str = each_tenant_dml_actions_pre.get_each_tenant_dml_actions_sqls_str(tenant_id_list) # dump_file = open(dump_filename, 'w') # dump_file.write('# 以下是upgrade_pre.py脚本中的步骤\n') # dump_file.write('# 仅供upgrade_pre.py脚本运行失败需要人肉的时候参考\n') # dump_file.write('\n\n') # dump_file.write('# normal ddl\n') # dump_file.write(normal_ddls_str + '\n') # dump_file.write('\n\n') # dump_file.write('# normal dml\n') # dump_file.write(normal_dmls_str + '\n') # dump_file.write('\n\n') # dump_file.write('# each tenant dml\n') # dump_file.write(each_tenant_dmls_str + '\n') # dump_file.write('\n\n') # dump_file.write('# upgrade sys vars\n') # dump_file.write(sys_vars_upgrade_dmls_str + '\n') # dump_file.write('\n\n') # dump_file.write('# do special upgrade actions\n') # dump_file.write('# please run ./upgrade_pre.py -h [host] -P [port] -u [user] -p [password] -m special_action\n') # dump_file.write('\n\n') # dump_file.close() # #def check_before_upgrade(query_cur, upgrade_params): # return # #def print_stats(): # logging.info('==================================================================================') # logging.info('============================== STATISTICS BEGIN ==================================') # logging.info('==================================================================================') # logging.info('succeed run sql(except sql of special actions): \n\n%s\n', actions.get_succ_sql_list_str()) # logging.info('commited sql(except sql of special actions): \n\n%s\n', actions.get_commit_sql_list_str()) # logging.info('==================================================================================') # logging.info('=============================== STATISTICS END ===================================') # logging.info('==================================================================================') # #def do_upgrade(my_host, my_port, my_user, my_passwd, my_module_set, upgrade_params): # try: # conn = mysql.connector.connect(user = my_user, # password = my_passwd, # host = my_host, # port = my_port, # database = 'oceanbase', # raise_on_warnings = True) # cur = conn.cursor(buffered=True) # try: # query_cur = actions.QueryCursor(cur) # # 开始升级前的检查 # check_before_upgrade(query_cur, upgrade_params) # # get min_observer_version # version = actions.fetch_observer_version(query_cur) # # 获取租户id列表 # tenant_id_list = actions.fetch_tenant_ids(query_cur) # if len(tenant_id_list) <= 0: # logging.error('distinct tenant id count is <= 0, tenant_id_count: %d', len(tenant_id_list)) # raise MyError('no tenant id') # logging.info('there has %s distinct tenant ids: [%s]', len(tenant_id_list), ','.join(str(tenant_id) for tenant_id in tenant_id_list)) # # if run_modules.MODULE_SPECIAL_ACTION in my_module_set: # logging.info('================begin to run special action===============') # conn.autocommit = True # special_upgrade_action_pre.do_special_upgrade(conn, cur, tenant_id_list, my_user, my_passwd) # conn.autocommit = False # actions.refresh_commit_sql_list() # logging.info('================succeed to commit special action===============') # except Exception, e: # logging.exception('run error') # raise e # finally: # # 打印统计信息 # print_stats() # # 将回滚sql写到文件中 # actions.dump_rollback_sql_to_file(upgrade_params.rollback_sql_filename) # cur.close() # conn.close() # except mysql.connector.Error, e: # logging.exception('connection error') # raise e # except Exception, e: # logging.exception('normal error') # raise e # #def do_upgrade_by_argv(argv): # upgrade_params = UpgradeParams() # opts.change_opt_defult_value('log-file', upgrade_params.log_filename) # opts.parse_options(argv) # if not opts.has_no_local_opts(): # opts.deal_with_local_opts() # else: # opts.check_db_client_opts() # log_filename = opts.get_opt_log_file() # upgrade_params.log_filename = log_filename # # 日志配置放在这里是为了前面的操作不要覆盖掉日志文件 # config_logging_module(upgrade_params.log_filename) # try: # host = opts.get_opt_host() # port = int(opts.get_opt_port()) # user = opts.get_opt_user() # password = opts.get_opt_password() # cmd_module_str = opts.get_opt_module() # module_set = set([]) # all_module_set = run_modules.get_all_module_set() # cmd_module_list = cmd_module_str.split(',') # for cmd_module in cmd_module_list: # if run_modules.ALL_MODULE == cmd_module: # module_set = module_set | all_module_set # elif cmd_module in all_module_set: # module_set.add(cmd_module) # else: # raise MyError('invalid module: {0}'.format(cmd_module)) # logging.info('parameters from cmd: host=\"%s\", port=%s, user=\"%s\", password=\"%s\", module=\"%s\", log-file=\"%s\"',\ # host, port, user, password, module_set, log_filename) # do_upgrade(host, port, user, password, module_set, upgrade_params) # except mysql.connector.Error, e: # logging.exception('mysql connctor error') # logging.exception('run error, maybe you can reference ' + upgrade_params.rollback_sql_filename + ' to rollback it') # raise e # except Exception, e: # logging.exception('normal error') # logging.exception('run error, maybe you can reference ' + upgrade_params.rollback_sql_filename + ' to rollback it') # raise e # # # ####====XXXX======######==== I am a splitter ====######======XXXX====#### #filename:my_error.py ##!/usr/bin/env python ## -*- coding: utf-8 -*- # #class MyError(Exception): # def __init__(self, value): # self.value = value # def __str__(self): # return repr(self.value) ####====XXXX======######==== I am a splitter ====######======XXXX====#### #filename:my_utils.py ##!/usr/bin/env python ## -*- coding: utf-8 -*- # #import mysql.connector #from mysql.connector import errorcode #from my_error import MyError #from actions import QueryCursor #import logging # #def results_to_str(desc, results): # ret_str = '' # max_width_list = [] # for col_desc in desc: # max_width_list.append(len(str(col_desc[0]))) # col_count = len(max_width_list) # for result in results: # if col_count != len(result): # raise MyError('column count is not equal, desc column count: {0}, data column count: {1}'.format(col_count, len(result))) # for i in range(0, col_count): # result_col_width = len(str(result[i])) # if max_width_list[i] < result_col_width: # max_width_list[i] = result_col_width # # 打印列名 # for i in range(0, col_count): # if i > 0: # ret_str += ' ' # 空四格 # ret_str += str(desc[i][0]) # # 补足空白 # for j in range(0, max_width_list[i] - len(str(desc[i][0]))): # ret_str += ' ' # # 打印数据 # for result in results: # ret_str += '\n' # 先换行 # for i in range(0, col_count): # if i > 0: # ret_str += ' ' # 空四格 # ret_str += str(result[i]) # # 补足空白 # for j in range(0, max_width_list[i] - len(str(result[i]))): # ret_str += ' ' # return ret_str # #def query_and_dump_results(query_cur, sql): # (desc, results) = query_cur.exec_query(sql) # result_str = results_to_str(desc, results) # logging.info('dump query results, sql: %s, results:\n%s', sql, result_str) # ####====XXXX======######==== I am a splitter ====######======XXXX====#### #filename:opts.py ##!/usr/bin/env python ## -*- coding: utf-8 -*- # #from my_error import MyError #import sys #import os #import getopt # #help_str = \ #""" #Help: #""" +\ #sys.argv[0] + """ [OPTIONS]""" +\ #'\n\n' +\ #'-I, --help Display this help and exit.\n' +\ #'-V, --version Output version information and exit.\n' +\ #'-h, --host=name Connect to host.\n' +\ #'-P, --port=name Port number to use for connection.\n' +\ #'-u, --user=name User for login.\n' +\ #'-p, --password=name Password to use when connecting to server. If password is\n' +\ #' not given it\'s empty string "".\n' +\ #'-m, --module=name Modules to run. Modules should be a string combined by some of\n' +\ #' the following strings: ddl, normal_dml, each_tenant_dml,\n' +\ #' system_variable_dml, special_action, all. "all" represents\n' +\ #' that all modules should be run. They are splitted by ",".\n' +\ #' For example: -m all, or --module=ddl,normal_dml,special_action\n' +\ #'-l, --log-file=name Log file path. If log file path is not given it\'s ' + os.path.splitext(sys.argv[0])[0] + '.log\n' +\ #'\n\n' +\ #'Maybe you want to run cmd like that:\n' +\ #sys.argv[0] + ' -h 127.0.0.1 -P 3306 -u admin -p admin\n' # #version_str = """version 1.0.0""" # #class Option: # __g_short_name_set = set([]) # __g_long_name_set = set([]) # __short_name = None # __long_name = None # __is_with_param = None # __is_local_opt = None # __has_value = None # __value = None # def __init__(self, short_name, long_name, is_with_param, is_local_opt, default_value = None): # if short_name in Option.__g_short_name_set: # raise MyError('duplicate option short name: {0}'.format(short_name)) # elif long_name in Option.__g_long_name_set: # raise MyError('duplicate option long name: {0}'.format(long_name)) # Option.__g_short_name_set.add(short_name) # Option.__g_long_name_set.add(long_name) # self.__short_name = short_name # self.__long_name = long_name # self.__is_with_param = is_with_param # self.__is_local_opt = is_local_opt # self.__has_value = False # if None != default_value: # self.set_value(default_value) # def is_with_param(self): # return self.__is_with_param # def get_short_name(self): # return self.__short_name # def get_long_name(self): # return self.__long_name # def has_value(self): # return self.__has_value # def get_value(self): # return self.__value # def set_value(self, value): # self.__value = value # self.__has_value = True # def is_local_opt(self): # return self.__is_local_opt # def is_valid(self): # return None != self.__short_name and None != self.__long_name and True == self.__has_value and None != self.__value # #g_opts =\ #[\ #Option('I', 'help', False, True),\ #Option('V', 'version', False, True),\ #Option('h', 'host', True, False),\ #Option('P', 'port', True, False),\ #Option('u', 'user', True, False),\ #Option('p', 'password', True, False, ''),\ ## 要跑哪个模块,默认全跑 #Option('m', 'module', True, False, 'all'),\ ## 日志文件路径,不同脚本的main函数中中会改成不同的默认值 #Option('l', 'log-file', True, False) #]\ # #def change_opt_defult_value(opt_long_name, opt_default_val): # global g_opts # for opt in g_opts: # if opt.get_long_name() == opt_long_name: # opt.set_value(opt_default_val) # return # #def has_no_local_opts(): # global g_opts # no_local_opts = True # for opt in g_opts: # if opt.is_local_opt() and opt.has_value(): # no_local_opts = False # return no_local_opts # #def check_db_client_opts(): # global g_opts # for opt in g_opts: # if not opt.is_local_opt() and not opt.has_value(): # raise MyError('option "-{0}" has not been specified, maybe you should run "{1} --help" for help'\ # .format(opt.get_short_name(), sys.argv[0])) # #def parse_option(opt_name, opt_val): # global g_opts # for opt in g_opts: # if opt_name in (('-' + opt.get_short_name()), ('--' + opt.get_long_name())): # opt.set_value(opt_val) # #def parse_options(argv): # global g_opts # short_opt_str = '' # long_opt_list = [] # for opt in g_opts: # if opt.is_with_param(): # short_opt_str += opt.get_short_name() + ':' # else: # short_opt_str += opt.get_short_name() # for opt in g_opts: # if opt.is_with_param(): # long_opt_list.append(opt.get_long_name() + '=') # else: # long_opt_list.append(opt.get_long_name()) # (opts, args) = getopt.getopt(argv, short_opt_str, long_opt_list) # for (opt_name, opt_val) in opts: # parse_option(opt_name, opt_val) # if has_no_local_opts(): # check_db_client_opts() # #def deal_with_local_opt(opt): # if 'help' == opt.get_long_name(): # global help_str # print help_str # elif 'version' == opt.get_long_name(): # global version_str # print version_str # #def deal_with_local_opts(): # global g_opts # if has_no_local_opts(): # raise MyError('no local options, can not deal with local options') # else: # for opt in g_opts: # if opt.is_local_opt() and opt.has_value(): # deal_with_local_opt(opt) # # 只处理一个 # return # #def get_opt_host(): # global g_opts # for opt in g_opts: # if 'host' == opt.get_long_name(): # return opt.get_value() # #def get_opt_port(): # global g_opts # for opt in g_opts: # if 'port' == opt.get_long_name(): # return opt.get_value() # #def get_opt_user(): # global g_opts # for opt in g_opts: # if 'user' == opt.get_long_name(): # return opt.get_value() # #def get_opt_password(): # global g_opts # for opt in g_opts: # if 'password' == opt.get_long_name(): # return opt.get_value() # #def get_opt_module(): # global g_opts # for opt in g_opts: # if 'module' == opt.get_long_name(): # return opt.get_value() # #def get_opt_log_file(): # global g_opts # for opt in g_opts: # if 'log-file' == opt.get_long_name(): # return opt.get_value() # ##parse_options(sys.argv[1:]) # ####====XXXX======######==== I am a splitter ====######======XXXX====#### #filename:reset_upgrade_scripts.py ##!/usr/bin/env python ## -*- coding: utf-8 -*- # #import os # #def clear_action_codes(action_filename_list, action_begin_line, \ # action_end_line, is_special_upgrade_code): # char_enter = '\n' # for action_filename in action_filename_list: # new_action_file_lines = [] # action_file = open(action_filename, 'r') # action_file_lines = action_file.readlines() # is_action_codes = False # for action_file_line in action_file_lines: # if is_action_codes and action_file_line == (action_end_line + char_enter): # is_action_codes = False # if not is_action_codes: # new_action_file_lines.append(action_file_line) # if not is_action_codes and action_file_line == (action_begin_line + char_enter): # is_action_codes = True # action_file.close() # new_action_file = open(action_filename, 'w') # for new_action_file_line in new_action_file_lines: # if is_special_upgrade_code: # if new_action_file_line == (action_end_line + char_enter): # new_action_file.write(' return\n') # new_action_file.write(new_action_file_line) # new_action_file.close() # #def regenerate_upgrade_script(): # print('\n=========run gen_upgrade_scripts.py, begin=========\n') # info = os.popen('./gen_upgrade_scripts.py;') # print(info.read()) # print('\n=========run gen_upgrade_scripts.py, end=========\n') # #if __name__ == '__main__': # action_begin_line = '####========******####======== actions begin ========####******========####' # action_end_line = '####========******####========= actions end =========####******========####' # action_filename_list = \ # [\ # 'normal_ddl_actions_pre.py',\ # 'normal_ddl_actions_post.py',\ # 'normal_dml_actions_pre.py',\ # 'normal_dml_actions_post.py',\ # 'each_tenant_dml_actions_pre.py',\ # 'each_tenant_dml_actions_post.py',\ # 'each_tenant_ddl_actions_post.py'\ # ] # special_upgrade_filename_list = \ # [\ # 'special_upgrade_action_pre.py',\ # 'special_upgrade_action_post.py' # ] # clear_action_codes(action_filename_list, action_begin_line, action_end_line, False) # clear_action_codes(special_upgrade_filename_list, action_begin_line, action_end_line, True) # regenerate_upgrade_script() # # ####====XXXX======######==== I am a splitter ====######======XXXX====#### #filename:run_modules.py ##!/usr/bin/env python ## -*- coding: utf-8 -*- # #ALL_MODULE = 'all' # #MODULE_DDL = 'ddl' #MODULE_NORMAL_DML = 'normal_dml' #MODULE_EACH_TENANT_DML = 'each_tenant_dml' #MODULE_EACH_TENANT_DDL = 'each_tenant_ddl' #MODULE_SYSTEM_VARIABLE_DML = 'system_variable_dml' #MODULE_SPECIAL_ACTION = 'special_action' # #def get_all_module_set(): # import run_modules # module_set = set([]) # attrs_from_run_module = dir(run_modules) # for attr in attrs_from_run_module: # if attr.startswith('MODULE_'): # module = getattr(run_modules, attr) # module_set.add(module) # return module_set # ####====XXXX======######==== I am a splitter ====######======XXXX====#### #filename:special_upgrade_action_post.py ##!/usr/bin/env python ## -*- coding: utf-8 -*- # #import logging #import time #from actions import Cursor #from actions import DMLCursor #from actions import QueryCursor #import mysql.connector #from mysql.connector import errorcode #import actions # #def do_special_upgrade(conn, cur, tenant_id_list, user, pwd): # # special upgrade action ##升级语句对应的action要写在下面的actions begin和actions end这两行之间, ##因为基准版本更新的时候会调用reset_upgrade_scripts.py来清空actions begin和actions end ##这两行之间的这些代码,如果不写在这两行之间的话会导致清空不掉相应的代码。 # upgrade_system_package(conn, cur) #####========******####======== actions begin ========####******========#### # return #####========******####========= actions end =========####******========#### # #def query(cur, sql): # cur.execute(sql) # results = cur.fetchall() # return results # #def get_tenant_names(cur): # return [_[0] for _ in query(cur, 'select tenant_name from oceanbase.__all_tenant')] # #def run_create_inner_schema_job(conn, cur): # try: # ###### enable ddl # ori_enable_ddl = actions.get_ori_enable_ddl(cur) # if ori_enable_ddl == 0: # actions.set_parameter(cur, 'enable_ddl', 'True') # # # check record in rs_job # count_sql = """select count(*) from oceanbase.__all_rootservice_job # where job_type = 'CREATE_INNER_SCHEMA';""" # result = query(cur, count_sql) # job_count = 0 # if (1 != len(result)) : # logging.warn("unexpected sql output") # raise e # else : # job_count = result[0][0] # # run job # sql = "alter system run job 'CREATE_INNER_SCHEMA';" # logging.info(sql) # cur.execute(sql) # # # wait job finish # times = 180 # ## 先检查job count变化 # count_check = False # while times > 0: # result = query(cur, count_sql) # if (1 != len(result)): # logging.warn("unexpected sql output") # raise e # elif (result[0][0] > job_count): # count_check = True # logging.info('create_inner_schema job detected') # break # time.sleep(10) # times -= 1 # if times == 0: # raise MyError('check create_inner_schema job failed!') # # ## 继续检查job status状态 # status_sql = """select job_status from oceanbase.__all_rootservice_job # where job_type = 'CREATE_INNER_SCHEMA' order by job_id desc limit 1;""" # status_check = False # while times > 0 and count_check == True: # result = query(cur, status_sql) # if (0 == len(result)): # logging.warn("unexpected sql output") # raise e # elif (1 != len(result) or 1 != len(result[0])): # logging.warn("result len not match") # raise e # elif result[0][0] == "FAILED": # logging.warn("run create_inner_schema job faild") # raise e # elif result[0][0] == "INPROGRESS": # logging.info('create_inner_schema job is still running') # elif result[0][0] == "SUCCESS": # status_check = True # break; # else: # logging.warn("invalid result: {0}" % (result[0][0])) # raise e # time.sleep(10) # times -= 1 # if times == 0: # raise MyError('check create_inner_schema job failed!') # # if (status_check == True and count_check == True): # logging.info('check create_inner_schema job success') # else: # logging.warn("run create_inner_schema job faild") # raise e # # # disable ddl # if ori_enable_ddl == 0: # actions.set_parameter(cur, 'enable_ddl', 'False') # except Exception, e: # logging.warn("run create_inner_schema job failed") # raise e # logging.info("run create_inner_schema job success") # #def disable_major_freeze(conn, cur): # try: # actions.set_parameter(cur, "enable_major_freeze", 'False') # except Exception, e: # logging.warn("disable enable_major_freeze failed") # raise e # logging.info("disable enable_major_freeze finish") # #def get_max_used_job_id(cur): # try: # max_job_id = 0 # sql = "select job_id from oceanbase.__all_rootservice_job order by job_id desc limit 1" # results = query(cur, sql) # # if (len(results) == 0): # max_job_id = 0 # elif (len(results) != 1 or len(results[0]) != 1): # logging.warn("row cnt not match") # raise e # else: # max_job_id = results[0][0] # # logging.info("get max_used_job_id:{0}".format(max_job_id)) # # return max_job_id # except Exception, e: # logging.warn("failed to get max_used_job_id") # raise e # #def check_can_run_upgrade_job(cur, version): # try: # sql = """select job_status from oceanbase.__all_rootservice_job # where job_type = 'UPGRADE_POST_ACTION' and extra_info = '{0}' # order by job_id desc limit 1""".format(version) # results = query(cur, sql) # # bret = True # if (len(results) == 0): # bret = True # logging.info("upgrade job not created yet, should run upgrade job") # elif (len(results) != 1 or len(results[0]) != 1): # logging.warn("row cnt not match") # raise e # elif ("INPROGRESS" == results[0][0]): # logging.warn("upgrade job still running, should wait") # raise e # elif ("SUCCESS" == results[0][0]): # bret = False # logging.info("execute upgrade job successfully, skip run upgrade job") # elif ("FAILED" == results[0][0]): # bret = True # logging.info("execute upgrade job failed, should run again") # else: # logging.warn("invalid job status: {0}".format(results[0][0])) # raise e # # return bret # except Exception, e: # logging.warn("failed to check if upgrade job can run") # raise e # # #def check_upgrade_job_result(cur, version, max_used_job_id): # try: # times = 0 # while (times <= 180): # sql = """select job_status from oceanbase.__all_rootservice_job # where job_type = 'RUN_UPGRADE_POST_JOB' and extra_info = '{0}' # and job_id > {1} order by job_id desc limit 1""".format(version, max_used_job_id) # results = query(cur, sql) # # if (len(results) == 0): # logging.info("upgrade job not created yet") # elif (len(results) != 1 or len(results[0]) != 1): # logging.warn("row cnt not match") # raise e # elif ("INPROGRESS" == results[0][0]): # logging.info("upgrade job is still running") # elif ("SUCCESS" == results[0][0]): # logging.info("execute upgrade job successfully") # break; # elif ("FAILED" == results[0][0]): # logging.warn("execute upgrade job failed") # raise e # else: # logging.warn("invalid job status: {0}".format(results[0][0])) # raise e # # times = times + 1 # time.sleep(10) # except Exception, e: # logging.warn("failed to check upgrade job result") # raise e # # #def run_upgrade_job(conn, cur, version): # try: # logging.info("start to run upgrade job, version:{0}".format(version)) # # pre check # if (check_can_run_upgrade_job(cur, version) == True): # conn.autocommit = True # # disable enable_ddl # ori_enable_ddl = actions.get_ori_enable_ddl(cur) # if ori_enable_ddl == 1: # actions.set_parameter(cur, 'enable_ddl', 'False') # # get max_used_job_id # max_used_job_id = get_max_used_job_id(cur) # # run upgrade job # sql = """alter system run upgrade job '{0}'""".format(version) # logging.info(sql) # cur.execute(sql) # # check upgrade job result # check_upgrade_job_result(cur, version, max_used_job_id) # # reset enable_ddl # if ori_enable_ddl == 1: # actions.set_parameter(cur, 'enable_ddl', 'True') # except Exception, e: # logging.warn("run upgrade job failed, version:{0}".format(version)) # raise e # logging.info("run upgrade job success, version:{0}".format(version)) # # #def upgrade_system_package(conn, cur): # try: # ori_enable_ddl = actions.get_ori_enable_ddl(cur) # if ori_enable_ddl == 0: # actions.set_parameter(cur, 'enable_ddl', 'True') # # sql = "set ob_query_timeout = 300000000;" # logging.info(sql) # cur.execute(sql) # # sql = """ # CREATE OR REPLACE PACKAGE __DBMS_UPGRADE # PROCEDURE UPGRADE(package_name VARCHAR(1024)); # PROCEDURE UPGRADE_ALL(); # END; # """ # logging.info(sql) # cur.execute(sql) # # sql = """ # CREATE OR REPLACE PACKAGE BODY __DBMS_UPGRADE # PROCEDURE UPGRADE(package_name VARCHAR(1024)); # PRAGMA INTERFACE(c, UPGRADE_SINGLE); # PROCEDURE UPGRADE_ALL(); # PRAGMA INTERFACE(c, UPGRADE_ALL); # END; # """ # logging.info(sql) # cur.execute(sql) # # sql = """ # CALL __DBMS_UPGRADE.UPGRADE_ALL(); # """ # logging.info(sql) # cur.execute(sql) # # ###### alter session compatibility mode # sql = "set ob_compatibility_mode='oracle';" # logging.info(sql) # cur.execute(sql) # # sql = "set ob_query_timeout = 300000000;" # logging.info(sql) # cur.execute(sql) # # sql = """ # CREATE OR REPLACE PACKAGE "__DBMS_UPGRADE" IS # PROCEDURE UPGRADE(package_name VARCHAR2); # PROCEDURE UPGRADE_ALL; # END; # """ # logging.info(sql) # cur.execute(sql) # # sql = """ # CREATE OR REPLACE PACKAGE BODY "__DBMS_UPGRADE" IS # PROCEDURE UPGRADE(package_name VARCHAR2); # PRAGMA INTERFACE(c, UPGRADE_SINGLE); # PROCEDURE UPGRADE_ALL; # PRAGMA INTERFACE(c, UPGRADE_ALL); # END; # """ # logging.info(sql) # cur.execute(sql) # # ########## update system package ########## # sql = """ # CALL "__DBMS_UPGRADE".UPGRADE_ALL(); # """ # logging.info(sql) # cur.execute(sql) # # ###### alter session compatibility mode # sql = "set ob_compatibility_mode='mysql';" # logging.info(sql) # cur.execute(sql) # time.sleep(10) # # if ori_enable_ddl == 0: # actions.set_parameter(cur, 'enable_ddl', 'False') # # logging.info("upgrade package finished!") # except Exception, e: # logging.warn("upgrade package failed!") # raise e # ####====XXXX======######==== I am a splitter ====######======XXXX====#### #filename:special_upgrade_action_pre.py ##!/usr/bin/env python ## -*- coding: utf-8 -*- # #from my_error import MyError #import time #import mysql.connector #from mysql.connector import errorcode #import logging #import re #import string #from random import Random #from actions import DMLCursor #from actions import QueryCursor #import binascii #import my_utils #import actions #import sys # ##def modify_schema_history(conn, cur, tenant_ids): ## try: ## conn.autocommit = True ## ## # disable ddl ## ori_enable_ddl = actions.get_ori_enable_ddl(cur) ## if ori_enable_ddl == 1: ## actions.set_parameter(cur, 'enable_ddl', 'False') ## log('tenant_ids: {0}'.format(tenant_ids)) ## for tenant_id in tenant_ids: ## sql = """alter system change tenant tenant_id = {0}""".format(tenant_id) ## log(sql) ## cur.execute(sql) # ## #####implement##### ## ## # 还原默认 tenant ## sys_tenant_id = 1 ## sql = """alter system change tenant tenant_id = {0}""".format(sys_tenant_id) ## log(sql) ## cur.execute(sql) ## ## # enable ddl ## if ori_enable_ddl == 1: ## actions.set_parameter(cur, 'enable_ddl', 'True') ## except Exception, e: ## logging.warn("exec modify trigger failed") ## raise e ## logging.info('exec modify trigger finish') # ## 主库需要执行的升级动作 #def do_special_upgrade(conn, cur, tenant_id_list, user, passwd): # # special upgrade action ##升级语句对应的action要写在下面的actions begin和actions end这两行之间, ##因为基准版本更新的时候会调用reset_upgrade_scripts.py来清空actions begin和actions end ##这两行之间的这些代码,如果不写在这两行之间的话会导致清空不掉相应的代码。 ## 主库升级流程没加滚动升级步骤,或混部阶段DDL测试有相关case覆盖前,混部开始禁DDL # actions.set_parameter(cur, 'enable_ddl', 'False') #####========******####======== actions begin ========####******========#### # return #####========******####========= actions end =========####******========#### # #def query(cur, sql): # log(sql) # cur.execute(sql) # results = cur.fetchall() # return results # #def log(msg): # logging.info(msg) # #def get_oracle_tenant_ids(cur): # return [_[0] for _ in query(cur, 'select tenant_id from oceanbase.__all_tenant where compatibility_mode = 1')] # #def get_tenant_ids(cur): # return [_[0] for _ in query(cur, 'select tenant_id from oceanbase.__all_tenant')] # ####====XXXX======######==== I am a splitter ====######======XXXX====#### #filename:upgrade_checker.py ##!/usr/bin/env python ## -*- coding: utf-8 -*- # #import sys #import os #import mysql.connector #from mysql.connector import errorcode #import logging #import getopt #import time # #class UpgradeParams: # log_filename = 'upgrade_checker.log' # old_version = '4.0.0.0' ##### --------------start : my_error.py -------------- #class MyError(Exception): # def __init__(self, value): # self.value = value # def __str__(self): # return repr(self.value) ##### --------------start : actions.py------------ #class Cursor: # __cursor = None # def __init__(self, cursor): # self.__cursor = cursor # def exec_sql(self, sql, print_when_succ = True): # try: # self.__cursor.execute(sql) # rowcount = self.__cursor.rowcount # if True == print_when_succ: # logging.info('succeed to execute sql: %s, rowcount = %d', sql, rowcount) # return rowcount # except mysql.connector.Error, e: # logging.exception('mysql connector error, fail to execute sql: %s', sql) # raise e # except Exception, e: # logging.exception('normal error, fail to execute sql: %s', sql) # raise e # def exec_query(self, sql, print_when_succ = True): # try: # self.__cursor.execute(sql) # results = self.__cursor.fetchall() # rowcount = self.__cursor.rowcount # if True == print_when_succ: # logging.info('succeed to execute query: %s, rowcount = %d', sql, rowcount) # return (self.__cursor.description, results) # except mysql.connector.Error, e: # logging.exception('mysql connector error, fail to execute sql: %s', sql) # raise e # except Exception, e: # logging.exception('normal error, fail to execute sql: %s', sql) # raise e # #def set_parameter(cur, parameter, value): # sql = """alter system set {0} = '{1}'""".format(parameter, value) # logging.info(sql) # cur.execute(sql) # wait_parameter_sync(cur, parameter, value) # #def wait_parameter_sync(cur, key, value): # sql = """select count(*) as cnt from oceanbase.__all_virtual_sys_parameter_stat # where name = '{0}' and value != '{1}'""".format(key, value) # times = 10 # while times > 0: # logging.info(sql) # cur.execute(sql) # result = cur.fetchall() # if len(result) != 1 or len(result[0]) != 1: # logging.exception('result cnt not match') # raise e # elif result[0][0] == 0: # logging.info("""{0} is sync, value is {1}""".format(key, value)) # break # else: # logging.info("""{0} is not sync, value should be {1}""".format(key, value)) # # times -= 1 # if times == 0: # logging.exception("""check {0}:{1} sync timeout""".format(key, value)) # raise e # time.sleep(5) # ##### --------------start : opt.py -------------- #help_str = \ #""" #Help: #""" +\ #sys.argv[0] + """ [OPTIONS]""" +\ #'\n\n' +\ #'-I, --help Display this help and exit.\n' +\ #'-V, --version Output version information and exit.\n' +\ #'-h, --host=name Connect to host.\n' +\ #'-P, --port=name Port number to use for connection.\n' +\ #'-u, --user=name User for login.\n' +\ #'-p, --password=name Password to use when connecting to server. If password is\n' +\ #' not given it\'s empty string "".\n' +\ #'-m, --module=name Modules to run. Modules should be a string combined by some of\n' +\ #' the following strings: ddl, normal_dml, each_tenant_dml,\n' +\ #' system_variable_dml, special_action, all. "all" represents\n' +\ #' that all modules should be run. They are splitted by ",".\n' +\ #' For example: -m all, or --module=ddl,normal_dml,special_action\n' +\ #'-l, --log-file=name Log file path. If log file path is not given it\'s ' + os.path.splitext(sys.argv[0])[0] + '.log\n' +\ #'\n\n' +\ #'Maybe you want to run cmd like that:\n' +\ #sys.argv[0] + ' -h 127.0.0.1 -P 3306 -u admin -p admin\n' # #version_str = """version 1.0.0""" # #class Option: # __g_short_name_set = set([]) # __g_long_name_set = set([]) # __short_name = None # __long_name = None # __is_with_param = None # __is_local_opt = None # __has_value = None # __value = None # def __init__(self, short_name, long_name, is_with_param, is_local_opt, default_value = None): # if short_name in Option.__g_short_name_set: # raise MyError('duplicate option short name: {0}'.format(short_name)) # elif long_name in Option.__g_long_name_set: # raise MyError('duplicate option long name: {0}'.format(long_name)) # Option.__g_short_name_set.add(short_name) # Option.__g_long_name_set.add(long_name) # self.__short_name = short_name # self.__long_name = long_name # self.__is_with_param = is_with_param # self.__is_local_opt = is_local_opt # self.__has_value = False # if None != default_value: # self.set_value(default_value) # def is_with_param(self): # return self.__is_with_param # def get_short_name(self): # return self.__short_name # def get_long_name(self): # return self.__long_name # def has_value(self): # return self.__has_value # def get_value(self): # return self.__value # def set_value(self, value): # self.__value = value # self.__has_value = True # def is_local_opt(self): # return self.__is_local_opt # def is_valid(self): # return None != self.__short_name and None != self.__long_name and True == self.__has_value and None != self.__value # #g_opts =\ #[\ #Option('I', 'help', False, True),\ #Option('V', 'version', False, True),\ #Option('h', 'host', True, False),\ #Option('P', 'port', True, False),\ #Option('u', 'user', True, False),\ #Option('p', 'password', True, False, ''),\ ## 要跑哪个模块,默认全跑 #Option('m', 'module', True, False, 'all'),\ ## 日志文件路径,不同脚本的main函数中中会改成不同的默认值 #Option('l', 'log-file', True, False) #]\ # #def change_opt_defult_value(opt_long_name, opt_default_val): # global g_opts # for opt in g_opts: # if opt.get_long_name() == opt_long_name: # opt.set_value(opt_default_val) # return # #def has_no_local_opts(): # global g_opts # no_local_opts = True # for opt in g_opts: # if opt.is_local_opt() and opt.has_value(): # no_local_opts = False # return no_local_opts # #def check_db_client_opts(): # global g_opts # for opt in g_opts: # if not opt.is_local_opt() and not opt.has_value(): # raise MyError('option "-{0}" has not been specified, maybe you should run "{1} --help" for help'\ # .format(opt.get_short_name(), sys.argv[0])) # #def parse_option(opt_name, opt_val): # global g_opts # for opt in g_opts: # if opt_name in (('-' + opt.get_short_name()), ('--' + opt.get_long_name())): # opt.set_value(opt_val) # #def parse_options(argv): # global g_opts # short_opt_str = '' # long_opt_list = [] # for opt in g_opts: # if opt.is_with_param(): # short_opt_str += opt.get_short_name() + ':' # else: # short_opt_str += opt.get_short_name() # for opt in g_opts: # if opt.is_with_param(): # long_opt_list.append(opt.get_long_name() + '=') # else: # long_opt_list.append(opt.get_long_name()) # (opts, args) = getopt.getopt(argv, short_opt_str, long_opt_list) # for (opt_name, opt_val) in opts: # parse_option(opt_name, opt_val) # if has_no_local_opts(): # check_db_client_opts() # #def deal_with_local_opt(opt): # if 'help' == opt.get_long_name(): # global help_str # print help_str # elif 'version' == opt.get_long_name(): # global version_str # print version_str # #def deal_with_local_opts(): # global g_opts # if has_no_local_opts(): # raise MyError('no local options, can not deal with local options') # else: # for opt in g_opts: # if opt.is_local_opt() and opt.has_value(): # deal_with_local_opt(opt) # # 只处理一个 # return # #def get_opt_host(): # global g_opts # for opt in g_opts: # if 'host' == opt.get_long_name(): # return opt.get_value() # #def get_opt_port(): # global g_opts # for opt in g_opts: # if 'port' == opt.get_long_name(): # return opt.get_value() # #def get_opt_user(): # global g_opts # for opt in g_opts: # if 'user' == opt.get_long_name(): # return opt.get_value() # #def get_opt_password(): # global g_opts # for opt in g_opts: # if 'password' == opt.get_long_name(): # return opt.get_value() # #def get_opt_module(): # global g_opts # for opt in g_opts: # if 'module' == opt.get_long_name(): # return opt.get_value() # #def get_opt_log_file(): # global g_opts # for opt in g_opts: # if 'log-file' == opt.get_long_name(): # return opt.get_value() ##### ---------------end---------------------- # ##### --------------start : do_upgrade_pre.py-------------- #def config_logging_module(log_filenamme): # logging.basicConfig(level=logging.INFO,\ # format='[%(asctime)s] %(levelname)s %(filename)s:%(lineno)d %(message)s',\ # datefmt='%Y-%m-%d %H:%M:%S',\ # filename=log_filenamme,\ # filemode='w') # # 定义日志打印格式 # formatter = logging.Formatter('[%(asctime)s] %(levelname)s %(filename)s:%(lineno)d %(message)s', '%Y-%m-%d %H:%M:%S') # ####################################### # # 定义一个Handler打印INFO及以上级别的日志到sys.stdout # stdout_handler = logging.StreamHandler(sys.stdout) # stdout_handler.setLevel(logging.INFO) # # 设置日志打印格式 # stdout_handler.setFormatter(formatter) # # 将定义好的stdout_handler日志handler添加到root logger # logging.getLogger('').addHandler(stdout_handler) ##### ---------------end---------------------- # # #fail_list=[] # ##### START #### ## 1. 检查前置版本 #def check_observer_version(query_cur, upgrade_params): # (desc, results) = query_cur.exec_query("""select distinct value from GV$OB_PARAMETERS where name='min_observer_version'""") # if len(results) != 1: # fail_list.append('query results count is not 1') # elif cmp(results[0][0], upgrade_params.old_version) < 0 : # fail_list.append('old observer version is expected equal or higher then: {0}, actual version:{1}'.format(upgrade_params.old_version, results[0][0])) # logging.info('check observer version success, version = {0}'.format(results[0][0])) # ## 2. 检查paxos副本是否同步, paxos副本是否缺失 #def check_paxos_replica(query_cur): # # 2.1 检查paxos副本是否同步 # (desc, results) = query_cur.exec_query("""select count(1) as unsync_cnt from GV$OB_LOG_STAT where in_sync = 'NO'""") # if results[0][0] > 0 : # fail_list.append('{0} replicas unsync, please check'.format(results[0][0])) # # 2.2 检查paxos副本是否有缺失 TODO # logging.info('check paxos replica success') # ## 3. 检查是否有做balance, locality变更 #def check_rebalance_task(query_cur): # # 3.1 检查是否有做locality变更 # (desc, results) = query_cur.exec_query("""select count(1) as cnt from DBA_OB_TENANT_JOBS where job_status='INPROGRESS' and result_code is null""") # if results[0][0] > 0 : # fail_list.append('{0} locality tasks is doing, please check'.format(results[0][0])) # # 3.2 检查是否有做balance # (desc, results) = query_cur.exec_query("""select count(1) as rebalance_task_cnt from CDB_OB_LS_REPLICA_TASKS""") # if results[0][0] > 0 : # fail_list.append('{0} rebalance tasks is doing, please check'.format(results[0][0])) # logging.info('check rebalance task success') # ## 4. 检查集群状态 #def check_cluster_status(query_cur): # # 4.1 检查是否非合并状态 # (desc, results) = query_cur.exec_query("""select count(1) from CDB_OB_MAJOR_COMPACTION where STATUS != 'IDLE'""") # if results[0][0] > 0 : # fail_list.append('{0} tenant is merging, please check'.format(results[0][0])) # logging.info('check cluster status success') # ## 5. 检查是否有异常租户(creating,延迟删除,恢复中) #def check_tenant_status(query_cur): # (desc, results) = query_cur.exec_query("""select count(*) as count from DBA_OB_TENANTS where status != 'NORMAL'""") # if len(results) != 1 or len(results[0]) != 1: # fail_list.append('results len not match') # elif 0 != results[0][0]: # fail_list.append('has abnormal tenant, should stop') # else: # logging.info('check tenant status success') # ## 6. 检查无恢复任务 #def check_restore_job_exist(query_cur): # (desc, results) = query_cur.exec_query("""select count(1) from CDB_OB_RESTORE_PROGRESS""") # if len(results) != 1 or len(results[0]) != 1: # fail_list.append('failed to restore job cnt') # elif results[0][0] != 0: # fail_list.append("""still has restore job, upgrade is not allowed temporarily""") # logging.info('check restore job success') # # #def check_is_primary_zone_distributed(primary_zone_str): # semicolon_pos = len(primary_zone_str) # for i in range(len(primary_zone_str)): # if primary_zone_str[i] == ';': # semicolon_pos = i # break # comma_pos = len(primary_zone_str) # for j in range(len(primary_zone_str)): # if primary_zone_str[j] == ',': # comma_pos = j # break # if comma_pos < semicolon_pos: # return True # else: # return False # ## 7. 升级前需要primary zone只有一个 #def check_tenant_primary_zone(query_cur): # (desc, results) = query_cur.exec_query("""select tenant_name,primary_zone from DBA_OB_TENANTS where tenant_id != 1"""); # for item in results: # if cmp(item[1], "RANDOM") == 0: # fail_list.append('{0} tenant primary zone random before update not allowed'.format(item[0])) # elif check_is_primary_zone_distributed(item[1]): # fail_list.append('{0} tenant primary zone distributed before update not allowed'.format(item[0])) # logging.info('check tenant primary zone success') # ## 8. 修改永久下线的时间,避免升级过程中缺副本 #def modify_server_permanent_offline_time(cur): # set_parameter(cur, 'server_permanent_offline_time', '72h') # ## last check of do_check, make sure no function execute after check_fail_list #def check_fail_list(): # if len(fail_list) != 0 : # error_msg ="upgrade checker failed with " + str(len(fail_list)) + " reasons: " + ", ".join(['['+x+"] " for x in fail_list]) # raise MyError(error_msg) # ## 开始升级前的检查 #def do_check(my_host, my_port, my_user, my_passwd, upgrade_params): # try: # conn = mysql.connector.connect(user = my_user, # password = my_passwd, # host = my_host, # port = my_port, # database = 'oceanbase', # raise_on_warnings = True) # conn.autocommit = True # cur = conn.cursor(buffered=True) # try: # query_cur = Cursor(cur) # check_observer_version(query_cur, upgrade_params) # check_paxos_replica(query_cur) # check_rebalance_task(query_cur) # check_cluster_status(query_cur) # check_tenant_status(query_cur) # check_restore_job_exist(query_cur) # check_tenant_primary_zone(query_cur) # # all check func should execute before check_fail_list # check_fail_list() # #modify_server_permanent_offline_time(cur) # except Exception, e: # logging.exception('run error') # raise e # finally: # cur.close() # conn.close() # except mysql.connector.Error, e: # logging.exception('connection error') # raise e # except Exception, e: # logging.exception('normal error') # raise e # #if __name__ == '__main__': # upgrade_params = UpgradeParams() # change_opt_defult_value('log-file', upgrade_params.log_filename) # parse_options(sys.argv[1:]) # if not has_no_local_opts(): # deal_with_local_opts() # else: # check_db_client_opts() # log_filename = get_opt_log_file() # upgrade_params.log_filename = log_filename # # 日志配置放在这里是为了前面的操作不要覆盖掉日志文件 # config_logging_module(upgrade_params.log_filename) # try: # host = get_opt_host() # port = int(get_opt_port()) # user = get_opt_user() # password = get_opt_password() # logging.info('parameters from cmd: host=\"%s\", port=%s, user=\"%s\", password=\"%s\", log-file=\"%s\"',\ # host, port, user, password, log_filename) # do_check(host, port, user, password, upgrade_params) # except mysql.connector.Error, e: # logging.exception('mysql connctor error') # raise e # except Exception, e: # logging.exception('normal error') # raise e ####====XXXX======######==== I am a splitter ====######======XXXX====#### #filename:upgrade_cluster_health_checker.py ##!/usr/bin/env python ## -*- coding: utf-8 -*- # #import sys #import os #import time #import mysql.connector #from mysql.connector import errorcode #import logging #import getopt # #class UpgradeParams: # log_filename = 'upgrade_cluster_health_checker.log' # ##### --------------start : my_error.py -------------- #class MyError(Exception): # def __init__(self, value): # self.value = value # def __str__(self): # return repr(self.value) # ##### --------------start : actions.py 只允许执行查询语句-------------- #class QueryCursor: # __cursor = None # def __init__(self, cursor): # self.__cursor = cursor # def exec_sql(self, sql, print_when_succ = True): # try: # self.__cursor.execute(sql) # rowcount = self.__cursor.rowcount # if True == print_when_succ: # logging.info('succeed to execute sql: %s, rowcount = %d', sql, rowcount) # return rowcount # except mysql.connector.Error, e: # logging.exception('mysql connector error, fail to execute sql: %s', sql) # raise e # except Exception, e: # logging.exception('normal error, fail to execute sql: %s', sql) # raise e # def exec_query(self, sql, print_when_succ = True): # try: # self.__cursor.execute(sql) # results = self.__cursor.fetchall() # rowcount = self.__cursor.rowcount # if True == print_when_succ: # logging.info('succeed to execute query: %s, rowcount = %d', sql, rowcount) # return (self.__cursor.description, results) # except mysql.connector.Error, e: # logging.exception('mysql connector error, fail to execute sql: %s', sql) # raise e # except Exception, e: # logging.exception('normal error, fail to execute sql: %s', sql) # raise e ##### ---------------end---------------------- # ##### --------------start : opt.py -------------- #help_str = \ #""" #Help: #""" +\ #sys.argv[0] + """ [OPTIONS]""" +\ #'\n\n' +\ #'-I, --help Display this help and exit.\n' +\ #'-V, --version Output version information and exit.\n' +\ #'-h, --host=name Connect to host.\n' +\ #'-P, --port=name Port number to use for connection.\n' +\ #'-u, --user=name User for login.\n' +\ #'-p, --password=name Password to use when connecting to server. If password is\n' +\ #' not given it\'s empty string "".\n' +\ #'-m, --module=name Modules to run. Modules should be a string combined by some of\n' +\ #' the following strings: ddl, normal_dml, each_tenant_dml,\n' +\ #' system_variable_dml, special_action, all. "all" represents\n' +\ #' that all modules should be run. They are splitted by ",".\n' +\ #' For example: -m all, or --module=ddl,normal_dml,special_action\n' +\ #'-l, --log-file=name Log file path. If log file path is not given it\'s ' + os.path.splitext(sys.argv[0])[0] + '.log\n' +\ #'-t, --timeout=name check timeout, default: 600(s).\n' + \ #'\n\n' +\ #'Maybe you want to run cmd like that:\n' +\ #sys.argv[0] + ' -h 127.0.0.1 -P 3306 -u admin -p admin\n' # #version_str = """version 1.0.0""" # #class Option: # __g_short_name_set = set([]) # __g_long_name_set = set([]) # __short_name = None # __long_name = None # __is_with_param = None # __is_local_opt = None # __has_value = None # __value = None # def __init__(self, short_name, long_name, is_with_param, is_local_opt, default_value = None): # if short_name in Option.__g_short_name_set: # raise MyError('duplicate option short name: {0}'.format(short_name)) # elif long_name in Option.__g_long_name_set: # raise MyError('duplicate option long name: {0}'.format(long_name)) # Option.__g_short_name_set.add(short_name) # Option.__g_long_name_set.add(long_name) # self.__short_name = short_name # self.__long_name = long_name # self.__is_with_param = is_with_param # self.__is_local_opt = is_local_opt # self.__has_value = False # if None != default_value: # self.set_value(default_value) # def is_with_param(self): # return self.__is_with_param # def get_short_name(self): # return self.__short_name # def get_long_name(self): # return self.__long_name # def has_value(self): # return self.__has_value # def get_value(self): # return self.__value # def set_value(self, value): # self.__value = value # self.__has_value = True # def is_local_opt(self): # return self.__is_local_opt # def is_valid(self): # return None != self.__short_name and None != self.__long_name and True == self.__has_value and None != self.__value # #g_opts =\ #[\ #Option('I', 'help', False, True),\ #Option('V', 'version', False, True),\ #Option('h', 'host', True, False),\ #Option('P', 'port', True, False),\ #Option('u', 'user', True, False),\ #Option('p', 'password', True, False, ''),\ ## 要跑哪个模块,默认全跑 #Option('m', 'module', True, False, 'all'),\ ## 日志文件路径,不同脚本的main函数中中会改成不同的默认值 #Option('l', 'log-file', True, False),\ ## 一些检查的超时时间,默认是600s #Option('t', 'timeout', True, False, '600') #]\ # #def change_opt_defult_value(opt_long_name, opt_default_val): # global g_opts # for opt in g_opts: # if opt.get_long_name() == opt_long_name: # opt.set_value(opt_default_val) # return # #def has_no_local_opts(): # global g_opts # no_local_opts = True # for opt in g_opts: # if opt.is_local_opt() and opt.has_value(): # no_local_opts = False # return no_local_opts # #def check_db_client_opts(): # global g_opts # for opt in g_opts: # if not opt.is_local_opt() and not opt.has_value(): # raise MyError('option "-{0}" has not been specified, maybe you should run "{1} --help" for help'\ # .format(opt.get_short_name(), sys.argv[0])) # #def parse_option(opt_name, opt_val): # global g_opts # for opt in g_opts: # if opt_name in (('-' + opt.get_short_name()), ('--' + opt.get_long_name())): # opt.set_value(opt_val) # #def parse_options(argv): # global g_opts # short_opt_str = '' # long_opt_list = [] # for opt in g_opts: # if opt.is_with_param(): # short_opt_str += opt.get_short_name() + ':' # else: # short_opt_str += opt.get_short_name() # for opt in g_opts: # if opt.is_with_param(): # long_opt_list.append(opt.get_long_name() + '=') # else: # long_opt_list.append(opt.get_long_name()) # (opts, args) = getopt.getopt(argv, short_opt_str, long_opt_list) # for (opt_name, opt_val) in opts: # parse_option(opt_name, opt_val) # if has_no_local_opts(): # check_db_client_opts() # #def deal_with_local_opt(opt): # if 'help' == opt.get_long_name(): # global help_str # print help_str # elif 'version' == opt.get_long_name(): # global version_str # print version_str # #def deal_with_local_opts(): # global g_opts # if has_no_local_opts(): # raise MyError('no local options, can not deal with local options') # else: # for opt in g_opts: # if opt.is_local_opt() and opt.has_value(): # deal_with_local_opt(opt) # # 只处理一个 # return # #def get_opt_host(): # global g_opts # for opt in g_opts: # if 'host' == opt.get_long_name(): # return opt.get_value() # #def get_opt_port(): # global g_opts # for opt in g_opts: # if 'port' == opt.get_long_name(): # return opt.get_value() # #def get_opt_user(): # global g_opts # for opt in g_opts: # if 'user' == opt.get_long_name(): # return opt.get_value() # #def get_opt_password(): # global g_opts # for opt in g_opts: # if 'password' == opt.get_long_name(): # return opt.get_value() # #def get_opt_module(): # global g_opts # for opt in g_opts: # if 'module' == opt.get_long_name(): # return opt.get_value() # #def get_opt_log_file(): # global g_opts # for opt in g_opts: # if 'log-file' == opt.get_long_name(): # return opt.get_value() # #def get_opt_timeout(): # global g_opts # for opt in g_opts: # if 'timeout' == opt.get_long_name(): # return opt.get_value() ##### ---------------end---------------------- # ##### --------------start : do_upgrade_pre.py-------------- #def config_logging_module(log_filenamme): # logging.basicConfig(level=logging.INFO,\ # format='[%(asctime)s] %(levelname)s %(filename)s:%(lineno)d %(message)s',\ # datefmt='%Y-%m-%d %H:%M:%S',\ # filename=log_filenamme,\ # filemode='w') # # 定义日志打印格式 # formatter = logging.Formatter('[%(asctime)s] %(levelname)s %(filename)s:%(lineno)d %(message)s', '%Y-%m-%d %H:%M:%S') # ####################################### # # 定义一个Handler打印INFO及以上级别的日志到sys.stdout # stdout_handler = logging.StreamHandler(sys.stdout) # stdout_handler.setLevel(logging.INFO) # # 设置日志打印格式 # stdout_handler.setFormatter(formatter) # # 将定义好的stdout_handler日志handler添加到root logger # logging.getLogger('').addHandler(stdout_handler) ##### ---------------end---------------------- # ##### START #### ## 1. 检查paxos副本是否同步, paxos副本是否缺失 #def check_paxos_replica(query_cur): # # 2.1 检查paxos副本是否同步 # (desc, results) = query_cur.exec_query("""select count(1) as unsync_cnt from GV$OB_LOG_STAT where in_sync = 'NO'""") # if results[0][0] > 0 : # raise MyError('{0} replicas unsync, please check'.format(results[0][0])) # # 2.2 检查paxos副本是否有缺失 TODO # logging.info('check paxos replica success') # ## 2. 检查observer是否可服务 #def check_observer_status(query_cur): # # 3.1 检查是否有做locality变更 # (desc, results) = query_cur.exec_query("""select count(*) from oceanbase.__all_server where start_service_time is null or status='INACTIVE'""") # if results[0][0] > 0 : # raise MyError('{0} observer not service, please check'.format(results[0][0])) # logging.info('check observer status success') # ## 3. 检查schema是否刷新成功 #def check_schema_status(query_cur): # # 4.1 检查是否非合并状态 # (desc, results) = query_cur.exec_query("""select count(*) from __all_server a left join __all_virtual_server_schema_info b on a.svr_ip = b.svr_ip and a.svr_port = b.svr_port where b.svr_ip is null""") # if results[0][0] > 0 : # raise MyError('refresh schema failed, please check') # (desc, results) = query_cur.exec_query("""select count(*) from __all_virtual_server_schema_info a join __all_virtual_server_schema_info b on a.tenant_id = b.tenant_id where a.refreshed_schema_version != b.refreshed_schema_version or a.refreshed_schema_version <= 1""") # if results[0][0] > 0 : # raise MyError('refresh schema failed, please check') # logging.info('check schema status success') # ## 开始健康检查 #def do_check(my_host, my_port, my_user, my_passwd, upgrade_params, timeout): # try: # conn = mysql.connector.connect(user = my_user, # password = my_passwd, # host = my_host, # port = my_port, # database = 'oceanbase', # raise_on_warnings = True) # conn.autocommit = True # cur = conn.cursor(buffered=True) # try: # query_cur = QueryCursor(cur) # check_paxos_replica(query_cur) # check_observer_status(query_cur) # check_schema_status(query_cur) # except Exception, e: # logging.exception('run error') # raise e # finally: # cur.close() # conn.close() # except mysql.connector.Error, e: # logging.exception('connection error') # raise e # except Exception, e: # logging.exception('normal error') # raise e # #if __name__ == '__main__': # upgrade_params = UpgradeParams() # change_opt_defult_value('log-file', upgrade_params.log_filename) # parse_options(sys.argv[1:]) # if not has_no_local_opts(): # deal_with_local_opts() # else: # check_db_client_opts() # log_filename = get_opt_log_file() # upgrade_params.log_filename = log_filename # # 日志配置放在这里是为了前面的操作不要覆盖掉日志文件 # config_logging_module(upgrade_params.log_filename) # try: # host = get_opt_host() # port = int(get_opt_port()) # user = get_opt_user() # password = get_opt_password() # timeout = int(get_opt_timeout()) # logging.info('parameters from cmd: host=\"%s\", port=%s, user=\"%s\", password=\"%s\", log-file=\"%s\", timeout=%s', \ # host, port, user, password, log_filename, timeout) # do_check(host, port, user, password, upgrade_params, timeout) # except mysql.connector.Error, e: # logging.exception('mysql connctor error') # raise e # except Exception, e: # logging.exception('normal error') # raise e # ####====XXXX======######==== I am a splitter ====######======XXXX====#### #filename:upgrade_post_checker.py ##!/usr/bin/env python ## -*- coding: utf-8 -*- # #import sys #import os #import time #import mysql.connector #from mysql.connector import errorcode #import logging #import getopt #import time # #class UpgradeParams: # log_filename = 'upgrade_post_checker.log' # new_version = '4.0.0.0' ##### --------------start : my_error.py -------------- #class MyError(Exception): # def __init__(self, value): # self.value = value # def __str__(self): # return repr(self.value) ##### --------------start : actions.py------------ #class Cursor: # __cursor = None # def __init__(self, cursor): # self.__cursor = cursor # def exec_sql(self, sql, print_when_succ = True): # try: # self.__cursor.execute(sql) # rowcount = self.__cursor.rowcount # if True == print_when_succ: # logging.info('succeed to execute sql: %s, rowcount = %d', sql, rowcount) # return rowcount # except mysql.connector.Error, e: # logging.exception('mysql connector error, fail to execute sql: %s', sql) # raise e # except Exception, e: # logging.exception('normal error, fail to execute sql: %s', sql) # raise e # def exec_query(self, sql, print_when_succ = True): # try: # self.__cursor.execute(sql) # results = self.__cursor.fetchall() # rowcount = self.__cursor.rowcount # if True == print_when_succ: # logging.info('succeed to execute query: %s, rowcount = %d', sql, rowcount) # return (self.__cursor.description, results) # except mysql.connector.Error, e: # logging.exception('mysql connector error, fail to execute sql: %s', sql) # raise e # except Exception, e: # logging.exception('normal error, fail to execute sql: %s', sql) # raise e # #def set_parameter(cur, parameter, value): # sql = """alter system set {0} = '{1}'""".format(parameter, value) # logging.info(sql) # cur.execute(sql) # wait_parameter_sync(cur, parameter, value) # #def wait_parameter_sync(cur, key, value): # sql = """select count(*) as cnt from oceanbase.__all_virtual_sys_parameter_stat # where name = '{0}' and value != '{1}'""".format(key, value) # times = 10 # while times > 0: # logging.info(sql) # cur.execute(sql) # result = cur.fetchall() # if len(result) != 1 or len(result[0]) != 1: # logging.exception('result cnt not match') # raise e # elif result[0][0] == 0: # logging.info("""{0} is sync, value is {1}""".format(key, value)) # break # else: # logging.info("""{0} is not sync, value should be {1}""".format(key, value)) # # times -= 1 # if times == 0: # logging.exception("""check {0}:{1} sync timeout""".format(key, value)) # raise e # time.sleep(5) # ##### --------------start : opt.py -------------- #help_str = \ #""" #Help: #""" +\ #sys.argv[0] + """ [OPTIONS]""" +\ #'\n\n' +\ #'-I, --help Display this help and exit.\n' +\ #'-V, --version Output version information and exit.\n' +\ #'-h, --host=name Connect to host.\n' +\ #'-P, --port=name Port number to use for connection.\n' +\ #'-u, --user=name User for login.\n' +\ #'-p, --password=name Password to use when connecting to server. If password is\n' +\ #' not given it\'s empty string "".\n' +\ #'-m, --module=name Modules to run. Modules should be a string combined by some of\n' +\ #' the following strings: ddl, normal_dml, each_tenant_dml,\n' +\ #' system_variable_dml, special_action, all. "all" represents\n' +\ #' that all modules should be run. They are splitted by ",".\n' +\ #' For example: -m all, or --module=ddl,normal_dml,special_action\n' +\ #'-l, --log-file=name Log file path. If log file path is not given it\'s ' + os.path.splitext(sys.argv[0])[0] + '.log\n' +\ #'\n\n' +\ #'Maybe you want to run cmd like that:\n' +\ #sys.argv[0] + ' -h 127.0.0.1 -P 3306 -u admin -p admin\n' # #version_str = """version 1.0.0""" # #class Option: # __g_short_name_set = set([]) # __g_long_name_set = set([]) # __short_name = None # __long_name = None # __is_with_param = None # __is_local_opt = None # __has_value = None # __value = None # def __init__(self, short_name, long_name, is_with_param, is_local_opt, default_value = None): # if short_name in Option.__g_short_name_set: # raise MyError('duplicate option short name: {0}'.format(short_name)) # elif long_name in Option.__g_long_name_set: # raise MyError('duplicate option long name: {0}'.format(long_name)) # Option.__g_short_name_set.add(short_name) # Option.__g_long_name_set.add(long_name) # self.__short_name = short_name # self.__long_name = long_name # self.__is_with_param = is_with_param # self.__is_local_opt = is_local_opt # self.__has_value = False # if None != default_value: # self.set_value(default_value) # def is_with_param(self): # return self.__is_with_param # def get_short_name(self): # return self.__short_name # def get_long_name(self): # return self.__long_name # def has_value(self): # return self.__has_value # def get_value(self): # return self.__value # def set_value(self, value): # self.__value = value # self.__has_value = True # def is_local_opt(self): # return self.__is_local_opt # def is_valid(self): # return None != self.__short_name and None != self.__long_name and True == self.__has_value and None != self.__value # #g_opts =\ #[\ #Option('I', 'help', False, True),\ #Option('V', 'version', False, True),\ #Option('h', 'host', True, False),\ #Option('P', 'port', True, False),\ #Option('u', 'user', True, False),\ #Option('p', 'password', True, False, ''),\ ## 要跑哪个模块,默认全跑 #Option('m', 'module', True, False, 'all'),\ ## 日志文件路径,不同脚本的main函数中中会改成不同的默认值 #Option('l', 'log-file', True, False) #]\ # #def change_opt_defult_value(opt_long_name, opt_default_val): # global g_opts # for opt in g_opts: # if opt.get_long_name() == opt_long_name: # opt.set_value(opt_default_val) # return # #def has_no_local_opts(): # global g_opts # no_local_opts = True # for opt in g_opts: # if opt.is_local_opt() and opt.has_value(): # no_local_opts = False # return no_local_opts # #def check_db_client_opts(): # global g_opts # for opt in g_opts: # if not opt.is_local_opt() and not opt.has_value(): # raise MyError('option "-{0}" has not been specified, maybe you should run "{1} --help" for help'\ # .format(opt.get_short_name(), sys.argv[0])) # #def parse_option(opt_name, opt_val): # global g_opts # for opt in g_opts: # if opt_name in (('-' + opt.get_short_name()), ('--' + opt.get_long_name())): # opt.set_value(opt_val) # #def parse_options(argv): # global g_opts # short_opt_str = '' # long_opt_list = [] # for opt in g_opts: # if opt.is_with_param(): # short_opt_str += opt.get_short_name() + ':' # else: # short_opt_str += opt.get_short_name() # for opt in g_opts: # if opt.is_with_param(): # long_opt_list.append(opt.get_long_name() + '=') # else: # long_opt_list.append(opt.get_long_name()) # (opts, args) = getopt.getopt(argv, short_opt_str, long_opt_list) # for (opt_name, opt_val) in opts: # parse_option(opt_name, opt_val) # if has_no_local_opts(): # check_db_client_opts() # #def deal_with_local_opt(opt): # if 'help' == opt.get_long_name(): # global help_str # print help_str # elif 'version' == opt.get_long_name(): # global version_str # print version_str # #def deal_with_local_opts(): # global g_opts # if has_no_local_opts(): # raise MyError('no local options, can not deal with local options') # else: # for opt in g_opts: # if opt.is_local_opt() and opt.has_value(): # deal_with_local_opt(opt) # # 只处理一个 # return # #def get_opt_host(): # global g_opts # for opt in g_opts: # if 'host' == opt.get_long_name(): # return opt.get_value() # #def get_opt_port(): # global g_opts # for opt in g_opts: # if 'port' == opt.get_long_name(): # return opt.get_value() # #def get_opt_user(): # global g_opts # for opt in g_opts: # if 'user' == opt.get_long_name(): # return opt.get_value() # #def get_opt_password(): # global g_opts # for opt in g_opts: # if 'password' == opt.get_long_name(): # return opt.get_value() # #def get_opt_module(): # global g_opts # for opt in g_opts: # if 'module' == opt.get_long_name(): # return opt.get_value() # #def get_opt_log_file(): # global g_opts # for opt in g_opts: # if 'log-file' == opt.get_long_name(): # return opt.get_value() ##### ---------------end---------------------- # #def config_logging_module(log_filenamme): # logging.basicConfig(level=logging.INFO,\ # format='[%(asctime)s] %(levelname)s %(filename)s:%(lineno)d %(message)s',\ # datefmt='%Y-%m-%d %H:%M:%S',\ # filename=log_filenamme,\ # filemode='w') # # 定义日志打印格式 # formatter = logging.Formatter('[%(asctime)s] %(levelname)s %(filename)s:%(lineno)d %(message)s', '%Y-%m-%d %H:%M:%S') # ####################################### # # 定义一个Handler打印INFO及以上级别的日志到sys.stdout # stdout_handler = logging.StreamHandler(sys.stdout) # stdout_handler.setLevel(logging.INFO) # # 设置日志打印格式 # stdout_handler.setFormatter(formatter) # # 将定义好的stdout_handler日志handler添加到root logger # logging.getLogger('').addHandler(stdout_handler) # ##### STAR ## 1 检查版本号 #def check_cluster_version(query_cur): # # 一方面配置项生效是个异步生效任务,另一方面是2.2.0之后新增租户级配置项刷新,和系统级配置项刷新复用同一个timer,这里暂且等一下。 # times = 30 # sql="select distinct value = '{0}' from oceanbase.GV$OB_PARAMETERS where name='min_observer_version'".format(upgrade_params.new_version) # while times > 0 : # (desc, results) = query_cur.exec_query(sql) # if len(results) == 1 and results[0][0] == 1: # break; # time.sleep(1) # times -=1 # if times == 0: # logging.warn("check cluster version timeout!") # raise e # else: # logging.info("check_cluster_version success") # ## 2 检查内部表自检是否成功 #def check_root_inspection(query_cur): # sql = "select count(*) from oceanbase.__all_virtual_upgrade_inspection where info != 'succeed'" # times = 180 # while times > 0 : # (desc, results) = query_cur.exec_query(sql) # if results[0][0] == 0: # break # time.sleep(10) # times -= 1 # if times == 0: # logging.warn('check root inspection failed!') # raise e # logging.info('check root inspection success') # ## 4 开ddl #def enable_ddl(cur): # set_parameter(cur, 'enable_ddl', 'True') # ## 5 打开rebalance #def enable_rebalance(cur): # set_parameter(cur, 'enable_rebalance', 'True') # ## 6 打开rereplication #def enable_rereplication(cur): # set_parameter(cur, 'enable_rereplication', 'True') # ## 7 打开major freeze #def enable_major_freeze(cur): # set_parameter(cur, 'enable_major_freeze', 'True') # #def fetch_tenant_ids(query_cur): # try: # tenant_id_list = [] # (desc, results) = query_cur.exec_query("""select distinct tenant_id from oceanbase.__all_tenant order by tenant_id desc""") # for r in results: # tenant_id_list.append(r[0]) # return tenant_id_list # except Exception, e: # logging.exception('fail to fetch distinct tenant ids') # raise e # ## 开始升级后的检查 #def do_check(my_host, my_port, my_user, my_passwd, upgrade_params): # try: # conn = mysql.connector.connect(user = my_user, # password = my_passwd, # host = my_host, # port = my_port, # database = 'oceanbase', # raise_on_warnings = True) # conn.autocommit = True # cur = conn.cursor(buffered=True) # try: # query_cur = Cursor(cur) # try: # check_cluster_version(query_cur) # check_root_inspection(query_cur) # enable_ddl(cur) # enable_rebalance(cur) # enable_rereplication(cur) # enable_major_freeze(cur) # except Exception, e: # logging.exception('run error') # raise e # except Exception, e: # logging.exception('run error') # raise e # finally: # cur.close() # conn.close() # except mysql.connector.Error, e: # logging.exception('connection error') # raise e # except Exception, e: # logging.exception('normal error') # raise e # #if __name__ == '__main__': # upgrade_params = UpgradeParams() # change_opt_defult_value('log-file', upgrade_params.log_filename) # parse_options(sys.argv[1:]) # if not has_no_local_opts(): # deal_with_local_opts() # else: # check_db_client_opts() # log_filename = get_opt_log_file() # upgrade_params.log_filename = log_filename # # 日志配置放在这里是为了前面的操作不要覆盖掉日志文件 # config_logging_module(upgrade_params.log_filename) # try: # host = get_opt_host() # port = int(get_opt_port()) # user = get_opt_user() # password = get_opt_password() # logging.info('parameters from cmd: host=\"%s\", port=%s, user=\"%s\", password=\"%s\", log-file=\"%s\"',\ # host, port, user, password, log_filename) # do_check(host, port, user, password, upgrade_params) # except mysql.connector.Error, e: # logging.exception('mysql connctor error') # raise e # except Exception, e: # logging.exception('normal error') # raise e # ####====XXXX======######==== I am a splitter ====######======XXXX====#### #sub file module end import os import sys import datetime from random import Random class SplitError(Exception): def __init__(self, value): self.value = value def __str__(self): return repr(self.value) def random_str(rand_str_len = 8): str = '' chars = 'AaBbCcDdEeFfGgHhIiJjKkLlMmNnOoPpQqRrSsTtUuVvWwXxYyZz0123456789' length = len(chars) - 1 random = Random() for i in range(rand_str_len): str += chars[random.randint(0, length)] return str def split_py_files(sub_files_dir): char_enter = '\n' file_splitter_line = '####====XXXX======######==== I am a splitter ====######======XXXX====####' sub_filename_line_prefix = '#filename:' sub_file_module_end_line = '#sub file module end' os.makedirs(sub_files_dir) print('succeed to create run dir: ' + sub_files_dir + char_enter) cur_file = open(sys.argv[0], 'r') cur_file_lines = cur_file.readlines() cur_file_lines_count = len(cur_file_lines) sub_file_lines = [] sub_filename = '' begin_read_sub_py_file = False is_first_splitter_line = True i = 0 while i < cur_file_lines_count: if (file_splitter_line + char_enter) != cur_file_lines[i]: if begin_read_sub_py_file: sub_file_lines.append(cur_file_lines[i]) else: if is_first_splitter_line: is_first_splitter_line = False else: #读完一个子文件了,写到磁盘中 sub_file = open(sub_files_dir + '/' + sub_filename, 'w') for sub_file_line in sub_file_lines: sub_file.write(sub_file_line[1:]) sub_file.close() #清空sub_file_lines sub_file_lines = [] #再读取下一行的文件名或者结束标记 i += 1 if i >= cur_file_lines_count: raise SplitError('invalid line index:' + str(i) + ', lines_count:' + str(cur_file_lines_count)) elif (sub_file_module_end_line + char_enter) == cur_file_lines[i]: print 'succeed to split all sub py files' break else: mark_idx = cur_file_lines[i].find(sub_filename_line_prefix) if 0 != mark_idx: raise SplitError('invalid sub file name line, mark_idx = ' + str(mark_idx) + ', line = ' + cur_file_lines[i]) else: sub_filename = cur_file_lines[i][len(sub_filename_line_prefix):-1] begin_read_sub_py_file = True i += 1 cur_file.close() if __name__ == '__main__': cur_filename = sys.argv[0][sys.argv[0].rfind(os.sep)+1:] (cur_file_short_name,cur_file_ext_name1) = os.path.splitext(sys.argv[0]) (cur_file_real_name,cur_file_ext_name2) = os.path.splitext(cur_filename) sub_files_dir_suffix = '_extract_files_' + datetime.datetime.now().strftime('%Y_%m_%d_%H_%M_%S_%f') + '_' + random_str() sub_files_dir = cur_file_short_name + sub_files_dir_suffix sub_files_short_dir = cur_file_real_name + sub_files_dir_suffix split_py_files(sub_files_dir) exec('from ' + sub_files_short_dir + '.do_upgrade_post import do_upgrade_by_argv') do_upgrade_by_argv(sys.argv[1:])