一、关系图
 
二、安装mysql-mmm
1)安装epel
相关文档参见:http://fedoraproject.org/wiki/EPEL
2) monitor软件安装
[root@localhost ~]# yum install -y mysql-mmm-monitor-*
包如下:
[root@localhost ~]# rpm -qa|grep mysql
mysql-mmm-monitor-2.2.1-1.el5
mysql-mmm-2.2.1-1.el5
mysql-5.0.77-4.el5_5.4
3)数据库所在机器安装(包括master,slave)
[root@localhost ~]# yum install -y mysql-mmm-agent*
包如下:
[root@localhost ~]# rpm -qa|grep mysql
mysql-test-5.0.77-4.el5_5.4
mysql-mmm-agent-2.2.1-1.el5
mysql-5.0.77-4.el5_5.4
mysql-server-5.0.77-4.el5_5.4
mysql-devel-5.0.77-4.el5_5.4
mysql-bench-5.0.77-4.el5_5.4
mysql-mmm-2.2.1-1.el5
mysql-connector-odbc-3.51.26r1127-1.el5
 
三、配置文件
1)monitor配置文件
[root@localhost ~]# vi /etc/mysql-mmm/mmm_mon.conf
include mmm_common.conf
 
<monitor>
    ip                  127.0.0.1
    pid_path            /var/run/mysql-mmm/mmm_mond.pid
    bin_path            /usr/libexec/mysql-mmm
    status_path         /var/lib/mysql-mmm/mmm_mond.status
    ping_ips            172.16.71.128,172.16.71.130 #master,slave实际数据库ip
    auto_set_online     60
</monitor>
 
<host default>
    monitor_user        mmm_monitor
    monitor_password    10jqka 
</host>
 
Debug
 
2)通用的配置文件,在monitor及master,slave上放置的这个文件都一致
[root@localhost ~]# vi /etc/mysql-mmm/mmm_common.conf
active_master_role       writer
 
<host default>
    cluster_interface       eth0
    pid_path                /var/run/mysql-mmm/mmm_agentd.pid
    bin_path                /usr/libexec/mysql-mmm/
    replication_user        replicant
    replication_password    10jqka
    agent_user              mmm_agent
    agent_password          10jqka
</host>
 
<host db1>
    ip      172.16.71.128 #真实master数据库ip
    mode    master
    peer    db2
</host>
 
<host db2>
     ip      172.16.71.130 #真实master数据库ip
    mode    master
    peer    db1
</host>
 
#<host db3>
#     ip      192.168.100.51 #真实slave数据库ip
#     mode    slave
#</host>
<role writer>
    hosts   db1, db2
    ips     172.16.71.253 #虚拟写数据库ip
    mode    exclusive
</role>
 
<role reader>
    hosts   db1, db2
    ips     172.16.71.251,172.16.71.252 #虚拟读数据库ip
    mode    balanced
</role>
 
3)master,slave配置文件
[root@localhost ~]# vi /etc/mysql-mmm/mmm_agent.conf
include mmm_common.conf
 
# The 'this' variable refers to this server. Proper operation requires
# that 'this' server (db1 by default), as well as all other servers, have the
# proper IP addresses set in mmm_common.conf.
this db1 #如为第一台master db则为db1,如为第二台则为db2,须与mmm_common.conf里的机器名对应
 
 
 
三、查看效果
1)启动db1的相关服务
service mysqld start
service mysql-mmm-agent start
数据库授权:所有数据库的授权一致
GRANT REPLICATION CLIENT ON *.* TO 'mmm_monitor'@'172.16.71.%' IDENTIFIED BY '10jqka';
GRANT SUPER, REPLICATION CLIENT, PROCESS ON *.* TO 'mmm_agent'@'172.16.71.%'    IDENTIFIED BY '10jqka';
grant all on *.* to replicant@'172.16.71.%' identified by '10jqka';
flush privileges;
2)启动monitor相关服务
service mysql-mmm-monitor start
查看状态:
mmm_control show
把db1设置为online状态:
mmm_control set_online db1
开放mmm_agentd端口9989
真实机器查看分配的vip地址
[root@localhost ~]# ip a
1: lo: <LOOPBACK,UP,LOWER_UP> mtu 16436 qdisc noqueue
    link/loopback 00:00:00:00:00:00 brd 00:00:00:00:00:00
    inet 127.0.0.1/8 scope host lo
    inet6 ::1/128 scope host
       valid_lft forever preferred_lft forever
2: eth0: <BROADCAST,MULTICAST,UP,LOWER_UP> mtu 1500 qdisc pfifo_fast qlen 1000
    link/ether 00:0c:29:ef:79:70 brd ff:ff:ff:ff:ff:ff
    inet 172.16.71.132/24 brd 172.16.71.255 scope global eth0
    inet 172.16.71.251/32 scope global eth0
    inet 172.16.71.253/32 scope global eth0
    inet6 fe80::20c:29ff:feef:7970/64 scope link
       valid_lft forever preferred_lft forever
 
四、主主(master-master)同步配置
1)172.16.71.132机器my.cnf
skip-name-resolve
server_id            = 132
set-variable = key_buffer_size=512M
set-variable = table_cache=32
set-variable = sort_buffer_size=32M
set-variable = read_buffer_size=32M
set-variable = max_connections=2100
set-variable = log_slow_queries=/var/lib/mysql/log/mysql-slow.log
set-variable = log_bin=/var/lib/mysql/log/mysql-bin
set-variable = long_query_time=1
set-variable = thread_concurrency=16
set-variable = tmp_table_size=4000000000
set-variable = slave_skip_errors=all
#replicate-ignore-db=mysql
#replicate-ignore-db=test #发觉加上这个ignore选项后,会导致mmm接管时出现一些小问题,原因不明
log-slave-updates
sync_binlog=1
auto_increment_increment=2
auto_increment_offset=1
进入mysql配置设置为从
 
mysql> change master to master_host='172.16.71.128';
mysql>change master to master_user='repl';
mysql>change master to master_password='10jqka';
mysql>start slave;
主(master)服务器配置:
GRANT REPLICATION SLAVE ON *.* TO 'repl'@'172.16.71.%' IDENTIFIED BY '10jqka';
 
 
2)172.16.71.128机器my.cnf配置
skip-name-resolve
server_id            = 1
set-variable = key_buffer_size=512M
set-variable = table_cache=32
set-variable = sort_buffer_size=32M
set-variable = read_buffer_size=32M
set-variable = max_connections=2100
set-variable = log_slow_queries=/var/lib/mysql/log/mysql-slow.log
set-variable = log_bin=/var/lib/mysql/log/mysql-bin
set-variable = long_query_time=1
set-variable = thread_concurrency=16
set-variable = tmp_table_size=4000000000
set-variable = slave_skip_errors=all
#replicate-ignore-db=mysql
#replicate-ignore-db=test
log-slave-updates
sync_binlog=1
auto_increment_increment=2
auto_increment_offset=2
 
进入mysql配置设置为从
 
mysql> change master to master_host='172.16.71.132';
mysql>change master to master_user='repl';
mysql>change master to master_password='10jqka';
mysql>start slave;
主(master)服务器配置:
GRANT REPLICATION SLAVE ON *.* TO 'repl'@'172.16.71.%' IDENTIFIED BY '10jqka';
 
五、其它从 (slave)服务器配置:
my.cnf配置
skip-name-resolve
server_id            = 1
set-variable = key_buffer_size=512M
set-variable = table_cache=32
set-variable = sort_buffer_size=32M
set-variable = read_buffer_size=32M
set-variable = max_connections=2100
set-variable = log_slow_queries=/var/lib/mysql/log/mysql-slow.log
set-variable = log_bin=/var/lib/mysql/log/mysql-bin
set-variable = long_query_time=1
set-variable = thread_concurrency=16
set-variable = tmp_table_size=4000000000
set-variable = slave_skip_errors=all
 
mysql>change master to master_host='172.16.71.253';
mysql>change master to master_user='repl';
mysql>change master to master_password='10jqka';
mysql>change master to master_log_file='mysql-bin.000001';
mysql>change master to master_log_pos=128;
mysql>start slave;
或者在my.cnf加入
server-id=2
master-host=172.16.71.253
master-user=repl
master-password=10jqka
 
问题1:
两台机器互为对方的主,此时不能使用master的VIP作为这两台机器的主。如果使用VIP作为master,而又没有一台机器先启动并持有该VIP,就会导致monitor不能使用,日志如下:
2010/12/06 16:29:46 WARN db1 is not replicating from db2
2010/12/06 16:29:46 WARN db2 is not replicating from db1
 
问题2:
当/etc/mysql-mmm/mmm_mon.conf中auto_set_online(形如 auto_set_online 3)的时间设置得较长时,如果瞬间关闭现有的主、同时开启尚未启动的备,会导致monitor不能自动切换VIP,从而导致mmm不可用,需要手工设置online状态,有时候甚至会导致monitor启动出问题。为防止这种情况发生,可以把该时间设置得短些,或者先让其中的一台主起来后,再关闭另一台。
 
 
问题3:ERROR:Can't connect to monitor daemon
查看进程,一般会发现少了perl相关进程。原因不太直观,经多次尝试试验,一般都是装有agent的那些mysql机器上的配置问题,另外还与monitor的auto_set_online时间设置有关。
[root@localhost ~]# ps axu|grep mmm
root       3113 0.0 7.6 14000 8956 ?        S    16:27   0:00 mmm_mond
root       3115 0.9 33.2 106440 38976 ?        Sl   16:27   0:00 mmm_mond
root       3136 0.4 5.5 10388 6456 ?        S    16:28   0:00 perl /usr/libexec/mysql-mmm/monitor/checker ping_ip
root       3140 0.4 6.5 15208 7640 ?        S    16:28   0:00 perl /usr/libexec/mysql-mmm/monitor/checker mysql
root       3141 0.3 5.4 10388 6448 ?        S    16:28   0:00 perl /usr/libexec/mysql-mmm/monitor/checker ping
root       3142 0.5 6.5 15208 7636 ?        S    16:28   0:00 perl /usr/libexec/mysql-mmm/monitor/checker rep_backlog
root       3144 0.6 6.4 15208 7592 ?        S    16:28   0:00 perl /usr/libexec/mysql-mmm/monitor/checker rep_threads
root       3148 0.0 0.5   3916   652 pts/0    R+   16:28   0:00 grep mmm
 
 
 
六、其它补充资料
主从状态查看:
查看master的状态
SHOW MASTER STATUS;
Position不应为0
查看slave的状态
show slave status;
Slave_IO_Running | Slave_SQL_Running这两个字段 应为YES|YES.
show processlist;查看进程
 
slave start; #启动从复制
STOP SLAVE; #停止从复制
RESET MASTER; #重设master日志
RESET SLAVE;#重设slave日志
 
当 Slave_IO_Running 为 No、从服务器无法同步时,操作如下:
SLAVE STOP;#停止 slave
CHANGE MASTER TO MASTER_LOG_FILE='mysql-bin.000001', MASTER_LOG_POS=0;
#把 master_log_file 设置为在主库上执行 show master status; 得到的日志名,POS设置为0
SLAVE START;#再次启用 slave
 
 
Mysql 普通主从配置(未使用mmm参考)
配置主从my.cnf文件:
skip-innodb
skip-name-resolve
server_id            = 132
set-variable = key_buffer_size=512M
set-variable = table_cache=32
set-variable = sort_buffer_size=32M
set-variable = read_buffer_size=32M
set-variable = max_connections=2100
set-variable = log_slow_queries=/var/lib/mysql/log/mysql-slow.log
set-variable = log_bin=/var/lib/mysql/log/mysql-bin#从库这条语句注释掉
set-variable = long_query_time=1
set-variable = thread_concurrency=16
set-variable = tmp_table_size=4000000000
set-variable = slave_skip_errors=all
因为mysql版本不同,在从服务器上开启了下面的选项,导致同步不能进行:
replicate-ignore-db=mysql
replicate-do-db =test