最近集群不太稳定，应用总是挂掉，手动重启太麻烦，于是写了个自动重启的脚本，分享一下。
# -*- coding: utf-8 -*-
"""Watchdog that relaunches YARN applications missing from the YARN listing.

Twice a minute the script runs ``yarn application -list`` and, for every entry
of ``restart_dict`` whose name does not appear in that listing, executes the
configured start command.
"""
import os
import shlex
import subprocess

# app_name -> restart command line: "<start script> <jar path>".
restart_dict = {
    "app_mr": "/app/mr/start.sh /app/mr/jars/app_mr.jar",
    "app_streaming": "/app/streaming/start.sh /app/streaming/jars/app_streaming.jar",
}

# The former ``tail -n +3`` stage dropped the first two lines of the listing
# (presumably the summary line and the column header -- confirm against the
# output of the Hadoop version in use).
LISTING_HEADER_LINES = 2


def parse_app_names(listing):
    """Return the set of application names found in a YARN listing.

    Equivalent to the former ``awk '{print $2}' | tail -n +3`` pipeline: the
    first ``LISTING_HEADER_LINES`` lines are skipped and the second
    whitespace-separated field of every remaining line is collected.

    Args:
        listing: Text printed by ``yarn application -list``.

    Returns:
        A set of strings; lines with fewer than two fields contribute nothing.
    """
    names = set()
    for line in listing.splitlines()[LISTING_HEADER_LINES:]:
        fields = line.split()
        if len(fields) > 1:
            names.add(fields[1])
    return names


def task():
    """Relaunch every application of ``restart_dict`` absent from YARN.

    The round is skipped entirely when the listing cannot be obtained:
    an empty or failed listing would otherwise make every application look
    dead and trigger duplicate launches.
    """
    try:
        listing = subprocess.check_output(
            ["yarn", "application", "-list"], universal_newlines=True
        )
    except (OSError, subprocess.CalledProcessError) as ex:
        print("yarn application -list failed, skipping this round: %s" % ex)
        return

    running = parse_app_names(listing)
    for name, command in restart_dict.items():
        if name in running:
            continue
        try:
            # Fire and forget: the start command is not waited for, so a
            # long-running start script cannot stall the scheduler job.
            subprocess.Popen(shlex.split(command))
        except OSError as ex:
            # A broken start command must not prevent the remaining
            # applications from being relaunched.
            print("failed to restart %s: %s" % (name, ex))


def main():
    """Run ``task`` on a 30-second cron schedule until interrupted."""
    # Imported here so that importing this module (e.g. to reuse ``task``)
    # does not require APScheduler to be installed.
    from apscheduler.schedulers.blocking import BlockingScheduler

    scheduler = BlockingScheduler()
    # Cron field ``*/30`` on seconds: fire every 30 seconds.
    scheduler.add_job(task, 'cron', second='*/30')
    try:
        scheduler.start()
    except (KeyboardInterrupt, SystemExit):
        # Normal ways of stopping a blocking scheduler; nothing to report.
        pass
    except Exception as ex:
        print(ex)
    finally:
        # shutdown() raises if the scheduler is not running, so guard it.
        if scheduler.running:
            scheduler.shutdown()


if __name__ == "__main__":
    main()