Skip to content

Commit

Permalink
feat: tendbHa定点回档增加slave延迟检查 TencentBlueKing#9096
Browse files Browse the repository at this point in the history
  • Loading branch information
zfrendo authored and zhangzhw8 committed Jan 17, 2025
1 parent 758b475 commit d5f6e26
Show file tree
Hide file tree
Showing 2 changed files with 93 additions and 0 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -41,6 +41,7 @@
TendbGetBackupInfoFailedException,
)
from backend.flow.plugins.components.collections.mysql.exec_actuator_script import ExecuteDBActuatorScriptComponent
from backend.flow.plugins.components.collections.mysql.mysql_check_slave_delay import MySQLCheckSlaveDelayComponent
from backend.flow.plugins.components.collections.mysql.mysql_crond_control import MysqlCrondMonitorControlComponent
from backend.flow.plugins.components.collections.mysql.mysql_rds_execute import MySQLExecuteRdsComponent
from backend.flow.plugins.components.collections.mysql.trans_flies import TransFileComponent
Expand Down Expand Up @@ -371,6 +372,24 @@ def rollback_to_cluster_flow(self):
act_component_code=ExecuteDBActuatorScriptComponent.code,
kwargs=asdict(exec_act_kwargs),
)

if rollback_storage.instance_role in (
InstanceRole.BACKEND_REPEATER.value,
InstanceRole.BACKEND_SLAVE.value,
):
rollback_pipeline.add_act(
act_name=_("检查主从延迟 {}").format(rollback_storage.ip_port),
act_component_code=MySQLCheckSlaveDelayComponent.code,
kwargs=asdict(
ExecuteRdsKwargs(
bk_cloud_id=cluster_class.bk_cloud_id,
instance_ip=rollback_storage.machine.ip,
instance_port=rollback_storage.port,
sqls=["show slave status"],
)
),
)

# 屏蔽监控,停止从库备份
rollback_pipeline.add_act(
act_name=_("屏蔽监控 {}").format(rollback_storage.ip_port),
Expand All @@ -383,6 +402,7 @@ def rollback_to_cluster_flow(self):
)
),
)

if self.data["all_database_rollback"]:
rollback_pipeline.add_act(
act_name=_("从库stop slave {}").format(rollback_storage.ip_port),
Expand Down
Original file line number Diff line number Diff line change
@@ -0,0 +1,73 @@
# -*- coding: utf-8 -*-
"""
TencentBlueKing is pleased to support the open source community by making 蓝鲸智云-DB管理系统(BlueKing-BK-DBM) available.
Copyright (C) 2017-2023 THL A29 Limited, a Tencent company. All rights reserved.
Licensed under the MIT License (the "License"); you may not use this file except in compliance with the License.
You may obtain a copy of the License at https://opensource.org/licenses/MIT
Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on
an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the
specific language governing permissions and limitations under the License.
"""
import logging

from django.utils.translation import ugettext as _
from pipeline.component_framework.component import Component

from backend.components import DRSApi
from backend.constants import IP_PORT_DIVIDER
from backend.flow.plugins.components.collections.common.base_service import BaseService

logger = logging.getLogger("flow")


class MySQLCheckSlaveDelayService(BaseService):
    """
    Run ``show slave status`` against one instance and check replication health.

    The check passes only when both ``Slave_IO_Running`` and ``Slave_SQL_Running``
    are ``Yes`` and ``Seconds_Behind_Master`` does not exceed 300 seconds.
    """

    def _execute(self, data, parent_data) -> bool:
        """
        Query the instance through DRS and evaluate its replication status.

        The ``kwargs`` input must provide ``instance_ip``, ``instance_port`` and
        ``bk_cloud_id``.

        Returns:
            True when the replication threads are running and the delay is within
            the limit; False when the query reports an error, yields no usable
            row, or the replication state does not meet the conditions.
        """
        kwargs = data.get_one_of_inputs("kwargs")
        self.log_info(_("传入参数:{}").format(kwargs))
        # Operator-facing note: explains why the delay is checked before the
        # rollback and that the node may be skipped once the databases to be
        # rolled back have been cleaned up.
        self.log_info(
            _(
                "检查从库是否延迟,为保证定点回档前清理回档的库会同步到所有从节点。如果检查不通过,您可以检查目标集群延迟情况,根据自己实际需求来跳过此节点。"
                "只要确保回档的库已清理,跳过该节点不影响后续流程。"
            )
        )

        address = "{}{}{}".format(kwargs["instance_ip"], IP_PORT_DIVIDER, kwargs["instance_port"])
        res = DRSApi.rpc(
            {
                "addresses": [address],
                "cmds": ["show slave status"],
                "force": False,
                "bk_cloud_id": kwargs["bk_cloud_id"],
            }
        )

        # Exactly one address is queried, so only the first entry is relevant.
        # Guard against an empty response instead of failing with IndexError.
        if not res:
            self.log_info("show slave status returned no response for {}".format(address))
            return False

        instance_result = res[0]
        error_msg = instance_result.get("error_msg")
        if error_msg:
            self.log_info("execute sql error {}".format(error_msg))
            return False

        # Tolerate a missing or null result set the same way as an empty one.
        cmd_results = instance_result.get("cmd_results") or [{}]
        rows = cmd_results[0].get("table_data")
        if not rows:
            self.log_info("show slave status is empty")
            return False

        slave_info = rows[0]
        io_running = slave_info.get("Slave_IO_Running")
        sql_running = slave_info.get("Slave_SQL_Running")
        raw_delay = slave_info.get("Seconds_Behind_Master")

        # A NULL delay is treated as 0 here; the thread-state checks below are
        # what reject a replica whose replication is not running.
        try:
            slave_delay = 0 if raw_delay is None else int(raw_delay)
        except (TypeError, ValueError):
            self.log_info("unexpected Seconds_Behind_Master value {!r}".format(raw_delay))
            return False

        if io_running == "Yes" and sql_running == "Yes" and slave_delay <= 300:
            return True

        # Report the observed values so the operator can tell which of the
        # three conditions failed.
        self.log_info(
            "Slave_IO_Running={}, Slave_SQL_Running={}, Seconds_Behind_Master={}".format(
                io_running, sql_running, raw_delay
            )
        )
        # The text below is a translation msgid and is kept verbatim.
        self.log_info(
            _(
                "Slave_IO_Running!=Yes or Slave_SQL_Running=!Yes or Seconds_Behind_Master>300,"
                "请确定slave复制链路正常且延迟不能超过300s。"
            )
        )
        return False


class MySQLCheckSlaveDelayComponent(Component):
    """Component registered under the code ``mysql_check_slave_delay`` and bound to MySQLCheckSlaveDelayService."""

    # The component name is the dotted name of the defining module.
    name = __name__
    # Identifier that flows reference via ``MySQLCheckSlaveDelayComponent.code``.
    code = "mysql_check_slave_delay"
    # Service class bound to this component.
    bound_service = MySQLCheckSlaveDelayService

0 comments on commit d5f6e26

Please sign in to comment.