4.1 创建普通用户
所有服务器上创建普通用户toor、设置密码及sudo授权ifconfig,加入mysql用户组
useradd -u 900 toor
echo "chenliang"|passwd --stdin toor
id toor
sed -i '92a toor ALL=(ALL) NOPASSWD:/sbin/ifconfig' /etc/sudoers
visudo -c
usermod -g mysql toor
4.2 创建密钥对
#切换到toor用户下,生成密钥,复制公钥到其它服务器(包含自身)
#切换到toor普通用户下,生成密钥对,每一台服务器都要操作
[root@db01 ~]# su - toor
[toor@db01 ~]$ ssh-keygen -t rsa -P "" -f /home/toor/.ssh/id_rsa
Generating public/private rsa key pair.
Created directory '/home/toor/.ssh'.
Your identification has been saved in /home/toor/.ssh/id_rsa.
Your public key has been saved in /home/toor/.ssh/id_rsa.pub.
The key fingerprint is:
16:11:a5:3a:6d:f6:9d:a9:69:7f:03:a3:91:95:34:a3 toor@db01
The key's randomart image is:
+--[ RSA 2048]----+
| oo. |
| o + |
| o o + |
| o .E o |
| o S o |
| = .o.oo |
| .o+o |
| oo o |
| .o... . |
+-----------------+
#拷贝公钥到其它服务器,包括自身,在每一台服务器上都要执行以下四条命令
#且是在toor普通用户下
ssh-copy-id -i .ssh/id_rsa.pub "-p 921 toor@172.16.1.11"
ssh-copy-id -i .ssh/id_rsa.pub "-p 921 toor@172.16.1.12"
ssh-copy-id -i .ssh/id_rsa.pub "-p 921 toor@172.16.1.13"
ssh-copy-id -i .ssh/id_rsa.pub "-p 921 toor@172.16.1.14"
4.3 相关命令做软链接
对mysqlbinlog和mysql命令做软链接,所有服务器都需要进行操作,这里以db01为例
[root@db01 ~]# ln -sv /apps/mysql/bin/mysqlbinlog /usr/bin/mysqlbinlog
`/usr/bin/mysqlbinlog' -> `/apps/mysql/bin/mysqlbinlog'
[root@db01 ~]# ln -sv /apps/mysql/bin/mysql /usr/bin/mysql
`/usr/bin/mysql' -> `/apps/mysql/bin/mysql'
[root@db01 ~]# ll /usr/bin/{mysqlbinlog,mysql}
lrwxrwxrwx 1 root root 21 Nov 16 11:32 /usr/bin/mysql -> /apps/mysql/bin/mysql
lrwxrwxrwx 1 root root 27 Nov 16 11:31 /usr/bin/mysqlbinlog -> /apps/mysql/bin/mysqlbinlog
4.4 创建mha用户
这里需要创建mha用户(在mysql里面创建)。因为前面已经配置好了主从复制,所以只需要在
db01(master)服务器上创建,该用户会通过复制自动同步到各个从库。
#在主库上创建mha用户
[root@db01 ~]# mysql -uroot -pchenliang -S /data/3306/mysql.sock
mysql>
mysql> grant all privileges on *.* to 'mha'@'172.16.1.%' identified by 'mha';
Query OK, 0 rows affected, 1 warning (0.08 sec)
mysql> select user,host,authentication_string from mysql.user where user='mha' and host='172.16.1.%';
+------+------------+-------------------------------------------+
| user | host | authentication_string |
+------+------------+-------------------------------------------+
| mha | 172.16.1.% | *F4C9AC49A736981AE2739FC2F4A1FD92B4F07929 |
+------+------------+-------------------------------------------+
1 row in set (0.00 sec)
#在从库(db02、db03、db04)上检查是否有mha用户
mysql> select user,host from mysql.user where user='mha' and host='172.16.1.%';
+------+------------+
| user | host |
+------+------------+
| mha | 172.16.1.% |
+------+------------+
1 row in set (0.00 sec)
4.5 安装mha node包
安装mha node包,所有服务器都需要安装。这里以db01服务器上的安装为例
[root@db01 ~]# yum install perl-DBD-MySQL -y
[root@db01 ~]# cd tools/
[root@db01 tools]# rz
[root@db01 tools]# ll mha4mysql-node-0.56-0.el6.noarch.rpm
-rw-r--r-- 1 root root 36326 Sep 16 2016 mha4mysql-node-0.56-0.el6.noarch.rpm
[root@db01 tools]# rpm -ivh mha4mysql-node-0.56-0.el6.noarch.rpm
Preparing... ########################################### [100%]
1:mha4mysql-node ########################################### [100%]
4.6 安装mha manager包
注意:这里是在db04服务器上安装,其它服务器不用安装
[root@db04 ~]# wget -O /etc/yum.repos.d/epel.repo http://mirrors.aliyun.com/repo/epel-6.repo
[root@db04 ~]# yum install perl-Config-Tiny epel-release perl-Log-Dispatch perl-Parallel-ForkManager perl-Time-HiRes -y
[root@db04 ~]# rpm -qa perl-Config-Tiny epel-release perl-Log-Dispatch perl-Parallel-ForkManager perl-Time-HiRes
perl-Parallel-ForkManager-1.20-1.el6.noarch
perl-Log-Dispatch-2.27-1.el6.noarch
perl-Time-HiRes-1.9721-144.el6.x86_64
perl-Config-Tiny-2.12-7.1.el6.noarch
epel-release-6-8.noarch
[root@db04 ~]# cd tools/
[root@db04 tools]# rz
[root@db04 tools]# ll mha4mysql-manager-0.56-0.el6.noarch.rpm
-rw-r--r-- 1 root root 87119 Sep 16 2016 mha4mysql-manager-0.56-0.el6.noarch.rpm
[root@db04 tools]# rpm -ivh mha4mysql-manager-0.56-0.el6.noarch.rpm
Preparing... ########################################### [100%]
1:mha4mysql-manager ########################################### [100%]
4.7 创建mha相关目录
注意:这里是在db04服务器上创建相应的目录
#创建MHA的工作目录
[root@db04 ~]# mkdir /etc/mha/app/app1 -p
[root@db04 ~]# chown -R toor:toor /etc/mha/app/app1/
[root@db04 ~]# ls -ld /etc/mha/app/app1/
drwxr-xr-x 2 toor toor 4096 Nov 16 12:27 /etc/mha/app/app1/
#创建MHA的日志目录
[root@db04 ~]# mkdir /var/log/mha/app/app1 -p
[root@db04 ~]# chown -R toor:toor /var/log/mha/app/app1/
[root@db04 ~]# ls -ld /var/log/mha/app/app1/
drwxr-xr-x 2 toor toor 4096 Nov 16 12:28 /var/log/mha/app/app1/
4.8 配置mha配置文件
[root@db04 ~]# cd /etc/mha/app/app1/
[root@db04 app1]# vim app1.cnf
[server default]
manager_log=/var/log/mha/app/app1/manager.log
manager_workdir=/var/log/mha/app/app1
master_binlog_dir=/data/3306/binlog
master_ip_failover_script=/server/scripts/master_ip_failover
password=mha
ping_interval=2
repl_password=chenliang
repl_user=rep
ssh_user=toor
ssh_port=921
user=mha
[server1]
hostname=172.16.1.11
port=3306
[server2]
hostname=172.16.1.12
port=3306
[server3]
hostname=172.16.1.13
port=3306
[server4]
hostname=172.16.1.14
no_master=1
port=3306
[root@db04 app1]# chown -R toor:toor /etc/mha/app/app1/app1.cnf
[root@db04 app1]# ll /etc/mha/app/app1/app1.cnf
-rw-r--r-- 1 toor toor 468 Nov 16 12:32 /etc/mha/app/app1/app1.cnf
#配置文件说明
[server default]
manager_log=/var/log/mha/app/app1/manager.log #mha的日志保存路径及文件名
manager_workdir=/var/log/mha/app/app1 #mha的工作目录
master_binlog_dir=/data/3306/binlog #所有mysql 的binlog日志存放路径
master_ip_failover_script=/server/scripts/master_ip_failover #VIP漂移脚本的存放路径
password=mha #mha用户的密码
ping_interval=2 #每隔2秒检测一下Master是否正常
repl_password=chenliang #主从复制用户的密码
repl_user=rep #主从复制的用户
ssh_user=toor #ssh通信的用户
ssh_port=921 #ssh的端口
user=mha #mha的用户名mha
[server1] #服务器1
hostname=172.16.1.11 #hostname最好用ip地址来指定
port=3306 #mysql服务的端口
[server2] #服务器2
hostname=172.16.1.12 #hostname最好用ip地址来指定
port=3306 #mysql服务的端口
[server3] #服务器3
hostname=172.16.1.13 #hostname最好用ip地址来指定
port=3306 #mysql服务的端口
[server4] #服务器4
hostname=172.16.1.14 #hostname最好用ip地址来指定
no_master=1 #不让该服务器提升为master
port=3306 #mysql服务的端口
4.9 配置mha vip飘移脚本
注意:这里也只是在db04服务器上编写脚本
[root@db04 ~]# mkdir /server/scripts/ -p
[root@db04 ~]# cd /server/scripts/
[root@db04 scripts]# rz
[root@db04 scripts]# ll master_ip_failover
-rw-r--r-- 1 root root 3049 Nov 8 20:30 master_ip_failover
[root@db04 scripts]# cat master_ip_failover
#!/usr/bin/env perl
# master_ip_failover: hook script that moves a virtual IP (VIP) between MySQL
# masters. It parses the options given on the command line, then hands control
# to main(), whose exit status becomes the exit status of the script.
use strict;
use warnings FATAL => 'all';
use Getopt::Long;

# Filled in from the command line by GetOptions below.
my $command;
my $ssh_user;
my $orig_master_host;
my $orig_master_ip;
my $orig_master_port;
my $new_master_host;
my $new_master_ip;
my $new_master_port;

# Fixed settings for this deployment.
my $ssh_port = '921';               # SSH port used when connecting to a master
my $vip      = '172.16.1.10/24';    # the virtual IP, in address/prefix form
my $key      = "1";                 # alias number: the VIP is bound to eth1:$key

# Remote commands run over SSH to bind / unbind the VIP.
my $ssh_start_vip = " sudo /sbin/ifconfig eth1:$key $vip";
my $ssh_stop_vip  = "sudo /sbin/ifconfig eth1:$key down";

# Option name => destination variable, in the order the options are documented.
# NOTE(review): the recorded masterha_check_repl run also passes
# --orig_master_ssh_port, which is not declared here, so Getopt::Long prints
# "Unknown option: orig_master_ssh_port". The return value of GetOptions is not
# checked, so the script carries on regardless.
my @option_spec = (
    'command=s'          => \$command,
    'ssh_user=s'         => \$ssh_user,
    'orig_master_host=s' => \$orig_master_host,
    'orig_master_ip=s'   => \$orig_master_ip,
    'orig_master_port=i' => \$orig_master_port,
    'new_master_host=s'  => \$new_master_host,
    'new_master_ip=s'    => \$new_master_ip,
    'new_master_port=i'  => \$new_master_port,
);
GetOptions(@option_spec);

exit &main();
# Dispatches on the --command value and never returns (every path calls exit).
#
#   stop | stopssh  remove the VIP from the old master;
#                   exit 0 on success, 1 if an error was raised
#   start           bind the VIP on the new master;
#                   exit 0 on success, 10 if an error was raised
#   status          print an OK line, run the VIP start command on the
#                   original master and exit 0
#   anything else   (including a missing --command) call usage() and exit 1
sub main {

    #print "\n\nIN SCRIPT TEST====$ssh_stop_vip==$ssh_start_vip===\n\n";

    # Warnings are fatal in this script, so comparing an undefined $command
    # with eq would abort with "Use of uninitialized value" before the usage
    # branch could run. Treat a missing --command as an unrecognised one.
    my $action = defined $command ? $command : '';

    if ( $action eq "stop" || $action eq "stopssh" ) {

        # $orig_master_host, $orig_master_ip, $orig_master_port are passed.
        # If you manage master ip address at global catalog database,
        # invalidate orig_master_ip here.
        my $exit_code = 1;
        eval {
            print "\n\n\n***************************************************************\n";
            print "Disabling the VIP - $vip on old master: $orig_master_host\n";
            print "***************************************************************\n\n\n\n";
            &stop_vip();
            $exit_code = 0;
        };

        # $exit_code is still 1 here if anything inside the eval died.
        warn "Got Error: $@\n" if $@;
        exit $exit_code;
    }
    elsif ( $action eq "start" ) {

        # all arguments are passed.
        # If you manage master ip address at global catalog database,
        # activate new_master_ip here.
        # You can also grant write access (create user, set read_only=0, etc) here.
        my $exit_code = 10;
        eval {
            print "\n\n\n***************************************************************\n";
            print "Enabling the VIP - $vip on new master: $new_master_host \n";
            print "***************************************************************\n\n\n\n";
            &start_vip();
            $exit_code = 0;
        };

        # $exit_code is still 10 here if anything inside the eval died.
        warn $@ if $@;
        exit $exit_code;
    }
    elsif ( $action eq "status" ) {
        print "Checking the Status of the script.. OK \n";

        # Runs the VIP start command on the original master; the command
        # output and exit status are ignored.
        `ssh -p$ssh_port $ssh_user\@$orig_master_host \" $ssh_start_vip \"`;
        exit 0;
    }
    else {
        &usage();
        exit 1;
    }
}
# Binds the VIP on the new master: runs $ssh_start_vip on $new_master_host
# over SSH as $ssh_user. The exit status of ssh is not inspected.
sub start_vip() {
    my $target = "$ssh_user\@$new_master_host";
    qx{ssh -p$ssh_port $target " $ssh_start_vip "};
}
# Unbinds the VIP on the old master: runs $ssh_stop_vip on $orig_master_host
# over SSH as $ssh_user. The exit status of ssh is not inspected.
sub stop_vip() {
    my $target = "$ssh_user\@$orig_master_host";
    qx{ssh -p$ssh_port $target " $ssh_stop_vip "};
}
# Prints the command-line synopsis to STDOUT and returns the same text.
# The text used to be a bare string expression, so nothing was ever shown;
# it was also split across two lines and had lost the characters between
# "-new_master_ip=ip" and "-new_master_port".
sub usage {
    my $synopsis =
        "Usage: master_ip_failover -command=start|stop|stopssh|status"
      . " -orig_master_host=host -orig_master_ip=ip -orig_master_port=port"
      . " -new_master_host=host -new_master_ip=ip -new_master_port=port\n";
    print $synopsis;
    return $synopsis;
}
[root@db04 scripts]# chmod +x master_ip_failover
[root@db04 scripts]# chown toor:toor master_ip_failover
[root@db04 scripts]# ll master_ip_failover
-rwxr-xr-x 1 toor toor 3049 Nov 16 12:47 master_ip_failover
4.10 配置VIP地址
注意:这里是在Master(db01)服务器上配置vip地址
[root@db01 ~]# ifconfig eth1:1 172.16.1.10/24
[root@db01 ~]# ifconfig eth1:1
eth1:1 Link encap:Ethernet HWaddr 00:0C:29:6B:2E:55
inet addr:172.16.1.10 Bcast:172.16.1.255 Mask:255.255.255.0
UP BROADCAST RUNNING MULTICAST MTU:1500 Metric:1
[root@db01 ~]# cp -a /etc/sysconfig/network-scripts/ifcfg-eth1 /etc/sysconfig/network-scripts/ifcfg-eth1:1
[root@db01 ~]# vim /etc/sysconfig/network-scripts/ifcfg-eth1:1
DEVICE=eth1:1
TYPE=Ethernet
ONBOOT=yes
NM_CONTROLLED=yes
BOOTPROTO=none
IPADDR=172.16.1.10
NETMASK=255.255.255.0
USERCTL=no
PEERDNS=yes
IPV6INIT=no
4.11 检查mha的配置
注意:这里是在db04服务器上的toor普通用户下进行操作
#检查ssh免密钥登录是否正常
[toor@db04 ~]$ masterha_check_ssh --conf=/etc/mha/app/app1/app1.cnf
Fri Nov 16 12:57:21 2018 - [warning] Global configuration file /etc/masterha_default.cnf not found. Skipping.
Fri Nov 16 12:57:21 2018 - [info] Reading application default configuration from /etc/mha/app/app1/app1.cnf..
Fri Nov 16 12:57:21 2018 - [info] Reading server configuration from /etc/mha/app/app1/app1.cnf..
Fri Nov 16 12:57:21 2018 - [info] Starting SSH connection tests..
Fri Nov 16 12:57:22 2018 - [debug]
Fri Nov 16 12:57:21 2018 - [debug] Connecting via SSH from toor@172.16.1.11(172.16.1.11:921) to toor@172.16.1.12(172.16.1.12:921)..
Fri Nov 16 12:57:22 2018 - [debug] ok.
Fri Nov 16 12:57:22 2018 - [debug] Connecting via SSH from toor@172.16.1.11(172.16.1.11:921) to toor@172.16.1.13(172.16.1.13:921)..
Fri Nov 16 12:57:22 2018 - [debug] ok.
Fri Nov 16 12:57:22 2018 - [debug] Connecting via SSH from toor@172.16.1.11(172.16.1.11:921) to toor@172.16.1.14(172.16.1.14:921)..
Fri Nov 16 12:57:22 2018 - [debug] ok.
Fri Nov 16 12:57:23 2018 - [debug]
Fri Nov 16 12:57:22 2018 - [debug] Connecting via SSH from toor@172.16.1.12(172.16.1.12:921) to toor@172.16.1.11(172.16.1.11:921)..
Fri Nov 16 12:57:22 2018 - [debug] ok.
Fri Nov 16 12:57:22 2018 - [debug] Connecting via SSH from toor@172.16.1.12(172.16.1.12:921) to toor@172.16.1.13(172.16.1.13:921)..
Fri Nov 16 12:57:22 2018 - [debug] ok.
Fri Nov 16 12:57:22 2018 - [debug] Connecting via SSH from toor@172.16.1.12(172.16.1.12:921) to toor@172.16.1.14(172.16.1.14:921)..
Fri Nov 16 12:57:23 2018 - [debug] ok.
Fri Nov 16 12:57:23 2018 - [debug]
Fri Nov 16 12:57:22 2018 - [debug] Connecting via SSH from toor@172.16.1.13(172.16.1.13:921) to toor@172.16.1.11(172.16.1.11:921)..
Fri Nov 16 12:57:23 2018 - [debug] ok.
Fri Nov 16 12:57:23 2018 - [debug] Connecting via SSH from toor@172.16.1.13(172.16.1.13:921) to toor@172.16.1.12(172.16.1.12:921)..
Fri Nov 16 12:57:23 2018 - [debug] ok.
Fri Nov 16 12:57:23 2018 - [debug] Connecting via SSH from toor@172.16.1.13(172.16.1.13:921) to toor@172.16.1.14(172.16.1.14:921)..
Fri Nov 16 12:57:23 2018 - [debug] ok.
Fri Nov 16 12:57:24 2018 - [debug]
Fri Nov 16 12:57:23 2018 - [debug] Connecting via SSH from toor@172.16.1.14(172.16.1.14:921) to toor@172.16.1.11(172.16.1.11:921)..
Fri Nov 16 12:57:23 2018 - [debug] ok.
Fri Nov 16 12:57:23 2018 - [debug] Connecting via SSH from toor@172.16.1.14(172.16.1.14:921) to toor@172.16.1.12(172.16.1.12:921)..
Fri Nov 16 12:57:24 2018 - [debug] ok.
Fri Nov 16 12:57:24 2018 - [debug] Connecting via SSH from toor@172.16.1.14(172.16.1.14:921) to toor@172.16.1.13(172.16.1.13:921)..
Fri Nov 16 12:57:24 2018 - [debug] ok.
Fri Nov 16 12:57:24 2018 - [info] All SSH connection tests passed successfully.
#检查主从复制是否正常
[toor@db04 ~]$ masterha_check_repl --conf=/etc/mha/app/app1/app1.cnf
Fri Nov 16 12:59:03 2018 - [warning] Global configuration file /etc/masterha_default.cnf not found. Skipping.
Fri Nov 16 12:59:03 2018 - [info] Reading application default configuration from /etc/mha/app/app1/app1.cnf..
Fri Nov 16 12:59:03 2018 - [info] Reading server configuration from /etc/mha/app/app1/app1.cnf..
Fri Nov 16 12:59:03 2018 - [info] MHA::MasterMonitor version 0.56.
Fri Nov 16 12:59:04 2018 - [info] GTID failover mode = 1
Fri Nov 16 12:59:04 2018 - [info] Dead Servers:
Fri Nov 16 12:59:04 2018 - [info] Alive Servers:
Fri Nov 16 12:59:04 2018 - [info] 172.16.1.11(172.16.1.11:3306)
Fri Nov 16 12:59:04 2018 - [info] 172.16.1.12(172.16.1.12:3306)
Fri Nov 16 12:59:04 2018 - [info] 172.16.1.13(172.16.1.13:3306)
Fri Nov 16 12:59:04 2018 - [info] 172.16.1.14(172.16.1.14:3306)
Fri Nov 16 12:59:04 2018 - [info] Alive Slaves:
Fri Nov 16 12:59:04 2018 - [info] 172.16.1.12(172.16.1.12:3306) Version=5.7.19-log (oldest major version between slaves) log-bin:enabled
Fri Nov 16 12:59:04 2018 - [info] GTID ON
Fri Nov 16 12:59:04 2018 - [info] Replicating from 172.16.1.11(172.16.1.11:3306)
Fri Nov 16 12:59:04 2018 - [info] 172.16.1.13(172.16.1.13:3306) Version=5.7.19-log (oldest major version between slaves) log-bin:enabled
Fri Nov 16 12:59:04 2018 - [info] GTID ON
Fri Nov 16 12:59:04 2018 - [info] Replicating from 172.16.1.11(172.16.1.11:3306)
Fri Nov 16 12:59:04 2018 - [info] 172.16.1.14(172.16.1.14:3306) Version=5.7.19-log (oldest major version between slaves) log-bin:enabled
Fri Nov 16 12:59:04 2018 - [info] GTID ON
Fri Nov 16 12:59:04 2018 - [info] Replicating from 172.16.1.11(172.16.1.11:3306)
Fri Nov 16 12:59:04 2018 - [info] Not candidate for the new Master (no_master is set)
Fri Nov 16 12:59:04 2018 - [info] Current Alive Master: 172.16.1.11(172.16.1.11:3306)
Fri Nov 16 12:59:04 2018 - [info] Checking slave configurations..
Fri Nov 16 12:59:04 2018 - [info] read_only=1 is not set on slave 172.16.1.12(172.16.1.12:3306).
Fri Nov 16 12:59:04 2018 - [info] read_only=1 is not set on slave 172.16.1.13(172.16.1.13:3306).
Fri Nov 16 12:59:04 2018 - [info] read_only=1 is not set on slave 172.16.1.14(172.16.1.14:3306).
Fri Nov 16 12:59:04 2018 - [info] Checking replication filtering settings..
Fri Nov 16 12:59:04 2018 - [info] binlog_do_db= , binlog_ignore_db=
Fri Nov 16 12:59:04 2018 - [info] Replication filtering check ok.
Fri Nov 16 12:59:04 2018 - [info] GTID (with auto-pos) is supported. Skipping all SSH and Node package checking.
Fri Nov 16 12:59:04 2018 - [info] Checking SSH publickey authentication settings on the current master..
Fri Nov 16 12:59:04 2018 - [info] HealthCheck: SSH to 172.16.1.11 is reachable.
Fri Nov 16 12:59:04 2018 - [info]
172.16.1.11(172.16.1.11:3306) (current master)
+--172.16.1.12(172.16.1.12:3306)
+--172.16.1.13(172.16.1.13:3306)
+--172.16.1.14(172.16.1.14:3306)
Fri Nov 16 12:59:04 2018 - [info] Checking replication health on 172.16.1.12..
Fri Nov 16 12:59:04 2018 - [info] ok.
Fri Nov 16 12:59:04 2018 - [info] Checking replication health on 172.16.1.13..
Fri Nov 16 12:59:04 2018 - [info] ok.
Fri Nov 16 12:59:04 2018 - [info] Checking replication health on 172.16.1.14..
Fri Nov 16 12:59:04 2018 - [info] ok.
Fri Nov 16 12:59:04 2018 - [info] Checking master_ip_failover_script status:
Fri Nov 16 12:59:04 2018 - [info] /server/scripts/master_ip_failover --command=status --ssh_user=toor --orig_master_host=172.16.1.11 --orig_master_ip=172.16.1.11 --orig_master_port=3306 --orig_master_ssh_port=921
Unknown option: orig_master_ssh_port
Checking the Status of the script.. OK
Fri Nov 16 12:59:04 2018 - [info] OK.
Fri Nov 16 12:59:04 2018 - [warning] shutdown_script is not defined.
Fri Nov 16 12:59:04 2018 - [info] Got exit code 0 (Not master dead).
MySQL Replication Health is OK
4.12 编写mha的启动命令
注意:这里是在db04服务器上的root用户下进行操作
#把启动命令写入到一个文件中(使用>重定向,会覆盖同名文件)
[root@db04 ~]# echo "nohup masterha_manager --conf=/etc/mha/app/app1/app1.cnf --remove_dead_master_conf --ignore_last_failover </dev/null> /var/log/mha/app/app1/manager.log 2>&1 &" >mha
[root@db04 ~]# cat mha
nohup masterha_manager --conf=/etc/mha/app/app1/app1.cnf --remove_dead_master_conf --ignore_last_failover </dev/null> /var/log/mha/app/app1/manager.log 2>&1 &
[root@db04 ~]# ll mha
-rw-r--r-- 1 root root 159 Nov 16 13:49 mha
[root@db04 ~]# chown toor:toor mha
[root@db04 ~]# chmod 700 mha
[root@db04 ~]# mv mha /usr/bin/
[root@db04 ~]# ll /usr/bin/mha
-rwx------ 1 toor toor 159 Nov 16 13:49 /usr/bin/mha
4.13 启动mha服务
注意:这里是在db04服务器上进行操作
[root@db04 ~]# su - toor
[toor@db04 ~]$ mha
[toor@db04 ~]$ ps -ef|grep mha
toor 5220 1 8 13:51 pts/0 00:00:00 perl /usr/bin/masterha_manager --conf=/etc/mha/app/app1/app1.cnf --remove_dead_master_conf --ignore_last_failover
toor 5232 5191 1 13:51 pts/0 00:00:00 grep --color=auto mha