/usr/bin/mysqlfailover is in mysql-utilities 1.3.5-2.
This file is owned by root:root, with mode 0o755.
The actual contents of the file can be viewed below.
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 | #! /usr/bin/python
#
# Copyright (c) 2012, 2013, Oracle and/or its affiliates. All rights reserved.
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; version 2 of the License.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
#
"""
This file contains the automatic replication health monitoring and failover
utility. It is used to monitor a master and its slaves and to perform failover
when the master fails.
"""
from mysql.utilities.common.tools import check_python_version
# Check Python version compatibility
check_python_version()
import logging
import os.path
import signal
import sys
from mysql.utilities.exception import UtilError, UtilRplError
from mysql.utilities.common.messages import SCRIPT_THRESHOLD_WARNING
from mysql.utilities.common.options import add_verbosity
from mysql.utilities.common.options import add_failover_options, add_rpl_user
from mysql.utilities.common.options import check_server_lists
from mysql.utilities.common.options import UtilitiesParser
from mysql.utilities.common.server import check_hostname_alias
from mysql.utilities.common.tools import check_connector_python
from mysql.utilities.common.topology import parse_failover_connections
from mysql.utilities.command.rpl_admin import RplCommands, purge_log
from mysql.utilities import VERSION_FRM
# Constants
NAME = "MySQL Utilities - mysqlfailover "
DESCRIPTION = ("mysqlfailover - automatic replication health monitoring "
               "and failover")
USAGE = ("%prog --master=root@localhost --discover-slaves-login=root "
         "--candidates=root@host123:3306,root@host456:3306 ")
# Timestamp pattern handed to the logging setup as its date format.
_DATE_FORMAT = "%Y-%m-%d %H:%M:%S %p"
# Presumably the width of a timestamp rendered with _DATE_FORMAT
# (e.g. "2013-01-01 12:00:00 PM" is 22 characters) -- TODO confirm.
_DATE_LEN = 22
# Check for connector/python: stop with exit status 1 when the check fails.
connector_found = check_connector_python()
if not connector_found:
    sys.exit(1)
# Setup a termination handler: SIGTERM on POSIX systems, console control
# events on Windows (which must go through SetConsoleCtrlHandler).

# If posix, save old terminal settings so we can restore them on exit.  The
# value stays None whenever the settings cannot be read (no termios module on
# Windows, or stdin is not attached to a terminal), so the exit handler can
# tell that there is nothing to restore.
old_terminal_settings = None
try:
    # Only valid for *nix systems.
    import tty
    import termios
except ImportError:
    # Ok to fail for Windows
    pass
else:
    try:
        old_terminal_settings = termios.tcgetattr(sys.stdin)
    except Exception:
        # Deliberately broad, best-effort read: stdin may be redirected,
        # closed or replaced by an object without a usable file descriptor.
        # Without saved settings there is simply nothing to restore later.
        old_terminal_settings = None


def set_signal_handler(func):
    """Register func as the handler for termination requests.

    On Windows (os.name == "nt") the handler is registered through the
    kernel32 SetConsoleCtrlHandler function; on every other platform it is
    installed as the SIGTERM signal handler.

    func[in]    callable to invoke when the process is asked to stop
    """
    if os.name == "nt":
        from ctypes import windll
        windll.kernel32.SetConsoleCtrlHandler(func, True)
    else:
        # Install SIGTERM signal handler
        signal.signal(signal.SIGTERM, func)


# ctypes.WINFUNCTYPE only exists on Windows.  When it is available the exit
# handler is wrapped as a console control callback; otherwise (ctypes missing
# or not running on Windows) a plain signal handler is defined instead.
try:
    import ctypes

    @ctypes.WINFUNCTYPE(ctypes.c_int, ctypes.c_uint)
    def on_exit(signal, func=None):
        """Log the shutdown and exit with status 0 (Windows callback).

        signal[in]  value passed in by the console control machinery
        func[in]    unused
        """
        logging.info("Failover console stopped with SIGTERM.")
        sys.exit(0)
except (ImportError, AttributeError):
    def on_exit(signal, func=None):
        """Restore the terminal, log the shutdown and exit with status 0.

        signal[in]  signal number passed in by the signal machinery
        func[in]    second handler argument (the stack frame); unused
        """
        # Only restore the terminal when its settings were actually saved at
        # start-up; they are None when stdin was not a terminal.
        if os.name == "posix" and old_terminal_settings is not None:
            termios.tcsetattr(sys.stdin, termios.TCSADRAIN,
                              old_terminal_settings)
        logging.info("Failover console stopped with SIGTERM.")
        sys.exit(0)

set_signal_handler(on_exit)
# Setup the command parser.  The built-in help option is switched off here
# because --help is registered explicitly right below.
program_name = os.path.basename(sys.argv[0])
parser = UtilitiesParser(
    usage=USAGE,
    description=DESCRIPTION,
    version=VERSION_FRM.format(program=program_name),
    add_help_option=False)

# Default option to provide help information
parser.add_option("--help", action="help",
                  help="display this help message and exit")

# Setup utility-specific options:
add_failover_options(parser)
# Interval for continuous mode
parser.add_option(
    "--interval", "-i", dest="interval", action="store", type="int",
    default="15",
    help="interval in seconds for polling the master for failure and "
         "reporting health. Default = 15 seconds. Lowest value is 5 "
         "seconds.")

# Add failover modes
parser.add_option(
    "--failover-mode", "-f", dest="failover_mode", action="store",
    type="choice", choices=["auto", "elect", "fail"], default="auto",
    help="action to take when the master fails. "
         "'auto' = automatically fail to best slave, "
         "'elect' = fail to candidate list or if no candidate meets "
         "criteria fail, "
         "'fail' = take no action and stop when master fails. "
         "Default = 'auto'.")

# Add failover detection extension point
parser.add_option(
    "--exec-fail-check", dest="exec_fail", action="store", type="string",
    default=None,
    help="name of script to execute on each interval to invoke failover")
# Add force to override registry entry
parser.add_option(
    "--force", dest="force", action="store_true", default=False,
    help="override the registration check on master for multiple "
         "instances of the console monitoring the same master.")

# Add refresh script external point
parser.add_option(
    "--exec-post-failover", dest="exec_post_fail", action="store",
    type="string", default=None,
    help="name of script to execute after failover is complete and "
         "the utility has refreshed the health report.")

# Add rediscover on interval
parser.add_option(
    "--rediscover", dest="rediscover", action="store_true",
    help="rediscover slaves on interval. Allows console to detect "
         "when slaves have been removed or added.")

# Pedantic mode for failing if some inconsistencies are found
parser.add_option(
    "-p", "--pedantic", dest="pedantic", action="store_true", default=False,
    help="fail if some inconsistencies are found (e.g. errant "
         "transactions on slaves).")

# Add no keyboard input
parser.add_option(
    "--no-keyboard", dest="no_keyboard", action="store_true", default=False,
    help="start with no keyboard input support.")
# Add option to run as daemon
parser.add_option(
    "--daemon", dest="daemon", action="store", type="choice",
    choices=("start", "stop", "restart", "nodetach"), default=None,
    help="run on daemon mode. It can be start, stop, restart or nodetach.")

# Add pidfile for the daemon option
parser.add_option(
    "--pidfile", dest="pidfile", action="store", type="string", default=None,
    help="pidfile for running mysqlfailover as a daemon.")

# Add report values for daemon mode
parser.add_option(
    "--report-values", dest="report_values", action="store", type="string",
    default="health",
    help="report values used in mysqlfailover running as a daemon. "
         "It can be health, gtid or uuid. "
         "Multiple values can be used separated by commas. "
         "The default is health.")

# Add verbosity mode
add_verbosity(parser, False)

# Replication user and password
add_rpl_user(parser, None)
# Now we process the rest of the arguments.
opt, args = parser.parse_args()

# The master/slave related checks below are skipped when the request is only
# to stop a running daemon.
stopping_daemon = opt.daemon == "stop"

# Check slaves list
if not stopping_daemon:
    check_server_lists(parser, opt.master, opt.slaves)

# Check for errors
if int(opt.interval) < 5:
    parser.error("The --interval option requires a value greater than or "
                 "equal to 5.")

# The value for --timeout needs to be an integer > 0.
try:
    timeout_value = int(opt.timeout)
except ValueError:
    parser.error("The --timeout option requires an integer value.")
else:
    if timeout_value <= 0:
        parser.error("The --timeout option requires a value greater than 0.")

# A master is mandatory
if not stopping_daemon and opt.master is None:
    parser.error("You must specify a master to monitor.")

# Slaves must be either listed explicitly or discovered
if not stopping_daemon and opt.slaves is None and opt.discover is None:
    parser.error("You must supply a list of slaves or the "
                 "--discover-slaves-login option.")

# The 'elect' mode can only choose among explicitly given candidates
if opt.candidates is None and opt.failover_mode == 'elect':
    parser.error("Failover mode = 'elect' requires at least one candidate.")
# Parse the master, slaves, and candidates connection parameters
try:
    master_val, slaves_val, candidates_val = parse_failover_connections(opt)
except UtilRplError as err:
    print("ERROR: %s" % err.errmsg)
    sys.exit(1)

# Check hostname alias: neither a slave nor a candidate may turn out to be
# the master itself.
if any(check_hostname_alias(master_val, slave) for slave in slaves_val):
    parser.error("The master and one of the slaves are the same host and "
                 "port.")
if any(check_hostname_alias(master_val, cand) for cand in candidates_val):
    parser.error("The master and one of the candidates are the same host "
                 "and port.")
# Create dictionary of options handed over to the replication commands.
options = {
    # Topology and connection settings
    'candidates': candidates_val,
    # ping falls back to 3 and verbosity to 0 when not given
    'ping': opt.ping if opt.ping is not None else 3,
    'verbosity': opt.verbosity if opt.verbosity is not None else 0,
    # External scripts and failover thresholds
    'before': opt.exec_before,
    'after': opt.exec_after,
    'fail_check': opt.exec_fail,
    'max_position': opt.max_position,
    'max_delay': opt.max_delay,
    'discover': opt.discover,
    'timeout': int(opt.timeout),
    'interval': opt.interval,
    'failover_mode': opt.failover_mode,
    # Logging is on only when a log file was given
    'logging': opt.log_file is not None,
    'log_file': opt.log_file,
    'force': opt.force,
    'post_fail': opt.exec_post_fail,
    'rpl_user': opt.rpl_user,
    'rediscover': opt.rediscover,
    'pedantic': opt.pedantic,
    'no_keyboard': opt.no_keyboard,
    # Daemon settings
    'daemon': opt.daemon,
    'pidfile': opt.pidfile,
    'report_values': opt.report_values,
    'script_threshold': opt.script_threshold,
}
# Purge log file of old data (only when a log file is in use)
if opt.log_file is not None:
    if not purge_log(opt.log_file, opt.log_age):
        parser.error("Error purging log file.")

# Setup log file
logging.basicConfig(
    filename=opt.log_file,
    level=logging.INFO,
    datefmt=_DATE_FORMAT,
    format='%(asctime)s %(levelname)s %(message)s')

# Warn user about script threshold checking.
if opt.script_threshold:
    print(SCRIPT_THRESHOLD_WARNING)
# Check if the values specified for the --report-values option are valid.
# The option holds a comma-separated list; each entry is compared
# case-insensitively against the accepted values and the first invalid entry
# aborts the program with a usage error.
for report in opt.report_values.split(','):
    if report.lower() not in ("health", "gtid", "uuid"):
        parser.error("The value for the option --report-values is not valid: "
                     "'{0}', the values allowed are 'health', 'gtid' or 'uuid'"
                     "".format(opt.report_values))
# Check the daemon options
if opt.daemon:
    # Daemon mode is only offered on POSIX systems
    if os.name != "posix":
        parser.error("Running mysqlfailover with --daemon is only available "
                     "for POSIX systems.")

    # Every daemon action except "stop" needs a log file
    if not opt.log_file and opt.daemon != "stop":
        parser.error("The option --log is required when using --daemon.")

    # Test pidfile (no pidfile checks are made for "nodetach")
    if opt.daemon != "nodetach":
        pidfile = os.path.realpath(
            os.path.normpath(opt.pidfile or "./failover_daemon.pid"))

        if opt.daemon == "start":
            # An existing pidfile suggests a daemon that is still running
            if os.path.exists(pidfile):
                parser.error("pidfile {0} already exists. The daemon is "
                             "already running?".format(pidfile))
            # Probe that the pidfile can be written, then remove the probe
            try:
                with open(pidfile, "w") as pid_handle:
                    pid_handle.write("0\n")
                os.remove(pidfile)
            except IOError as err:
                parser.error("Unable to write pidfile: {0}"
                             "".format(err.strerror))
        else:
            # opt.daemon == stop/restart: the pidfile must exist and hold
            # a usable pid
            if not os.path.exists(pidfile):
                parser.error("pidfile {0} does not exist.".format(pidfile))
            pid = None
            try:
                with open(pidfile, "r") as pid_handle:
                    pid = int(pid_handle.read().strip())
            except (IOError, ValueError):
                # Unreadable file or non-numeric content
                pid = None
            # Test pid presence
            if not pid:
                parser.error("Can not read pid from pidfile.")

# A pidfile only makes sense together with --daemon
if not opt.daemon and opt.pidfile:
    parser.error("The option --daemon is required when using --pidfile.")
# Run the failover console, either as a daemon or in the foreground.
try:
    rpl_cmds = RplCommands(master_val, slaves_val, options)
    if opt.daemon:
        rpl_cmds.auto_failover_as_daemon()
    else:
        rpl_cmds.auto_failover(opt.interval)
except UtilError as err:
    # Log the error in case it was an unusual exception
    logging.critical(err.errmsg.strip(' '))
    print("ERROR: %s" % err.errmsg)
    sys.exit(1)
except KeyboardInterrupt:
    # An interrupt from the keyboard ends the run like a normal exit
    pass

sys.exit(0)
|