# 最近集群不太稳定，应用经常挂掉，手动重启太麻烦，于是写了个自动重启的脚本，分享一下。
#!--encoding=utf-8
import os
import shlex
import subprocess
from apscheduler.schedulers.blocking import BlockingScheduler
# Maps each monitored application name to the command line used to start it
# again. Each command has the form "<start script> <jar path>".
restart_dict = {
    "app_mr":
        "/app/mr/start.sh /app/mr/jars/app_mr.jar",
    "app_streaming":
        "/app/streaming/start.sh /app/streaming/jars/app_streaming.jar",
}
def _list_running_apps():
    """Return the application names printed by ``yarn application -list``.

    Returns:
        A set of names taken from the second whitespace-separated column of
        every output line after the first two, or ``None`` when the command
        could not be run or exited with a non-zero status.
    """
    try:
        proc = subprocess.Popen(
            ["yarn", "application", "-list"],
            stdout=subprocess.PIPE,
            universal_newlines=True,  # text output on both Python 2 and 3
        )
    except OSError as err:
        print("cannot run 'yarn application -list': %s" % err)
        return None

    # communicate() drains and closes the pipe and waits for the child.
    output, _ = proc.communicate()
    if proc.returncode != 0:
        print("'yarn application -list' exited with status %s"
              % proc.returncode)
        return None

    names = set()
    # Skip the first two lines and keep the second field of each remaining
    # line (same selection as: awk '{print $2}' | tail -n +3).
    for line in output.splitlines()[2:]:
        fields = line.split()
        if len(fields) > 1:
            names.add(fields[1])
    return names


def task():
    """Start every application in ``restart_dict`` that YARN does not list.

    When the application list cannot be obtained, nothing is restarted:
    treating a failed query as "no application is running" would launch
    duplicates of applications that are in fact still alive.
    """
    running = _list_running_apps()
    if running is None:
        return

    for app_name, start_cmd in restart_dict.items():
        if app_name in running:
            continue
        try:
            # The launcher is started but not waited on, so a slow start
            # script does not hold up the remaining restarts.
            subprocess.Popen(shlex.split(start_cmd))
        except OSError as err:
            # Keep going: one broken start command must not prevent the
            # other applications from being restarted.
            print("failed to start %s (%s): %s" % (app_name, start_cmd, err))
if __name__ == "__main__":
    scheduler = BlockingScheduler()
    # Cron trigger: run task whenever the seconds field matches */30.
    scheduler.add_job(task, 'cron', second='*/30')
    try:
        # Blocks until the scheduler is shut down or an exception escapes.
        scheduler.start()
    except (KeyboardInterrupt, SystemExit):
        # Ctrl-C / exit request: the normal way to stop this script.
        pass
    except Exception as ex:
        print(ex)
    finally:
        # shutdown() raises if the scheduler never reached the running
        # state, so only call it when there is something to stop.
        if scheduler.running:
            scheduler.shutdown()