基于zookeeper实现任务调度(1)

最近公司发生了服务定时同步的机制异常,看着公司的分布式任务调度组件,想着自己实现一个 github地址

业务背景

A模块中的定时器每隔30s执行一次任务(任务内容是远程获取消息并处理发送)。原计划是将A模块部署到两台服务器上,但目前两个A模块实例独立运行时,总会获取到相同的远程消息,导致同一条消息被重复处理两次。

实际场景

公司采用Spring quartz 建立定时任务模块。 当任务模块进行了分布式部署,通常会出现定时任务重复执行的情况。 怎么避免这种情况呢,是否可以构建一个任务注册中心,Quartz负责注册任务,但不具体执行任务内的业务逻辑。


target.png

解决问题

任务注册中心解决任务重复注册的问题,同时将任务分配给若干处理器进行具体的业务处理,保证在同一个时间内,一个任务只会被一个处理器进行处理。

实现方式

利用ZooKeeper的Master选举机制实现。 注册任务就相当于在ZooKeeper中创建或更新一个节点。通过更新节点的内容,来记录任务的执行状态。

过程说明

任务调度,从管理器分配任务,根据不同的任务Id进行注册

public class ZKScheduleManager extends ThreadPoolTaskScheduler implements ApplicationContextAware {

    /**
     * 
     */
    private static final long serialVersionUID = 1L;
    
    private static final int DEFAULT_POOL_SIZE = 20;

    private static final transient Logger LOGGER = LoggerFactory.getLogger(ZKScheduleManager.class);
    
    private final CountDownLatch downLatch = new CountDownLatch(1);

    private Map zkConfig;
    
    protected ZKManager zkManager;

    private IScheduleDataManager scheduleDataManager;

    /**
     * 当前调度服务的信息
     */
    protected ScheduleServer currenScheduleServer;

    /**
     * 是否启动调度管理,如果只是做系统管理,应该设置为false,对应key值为onlyAdmin
     */
    public boolean start = true;

    /**
     * 心跳间隔
     */
    private int timerInterval = 1000;

    /**
     * 是否注册成功
     */
    private boolean isScheduleServerRegister = true;

    private static ApplicationContext applicationcontext;
    
    private Map isOwnerMap = new ConcurrentHashMap();

    private Timer hearBeatTimer;
    private Lock initLock = new ReentrantLock();
    private boolean isStopSchedule = false;
    private Lock registerLock = new ReentrantLock();
    
    private List initTaskDefines = new ArrayList();
    
    private volatile String errorMessage = "No config Zookeeper connect information";
    private InitialThread initialThread;

    public ZKScheduleManager() {
        this.currenScheduleServer = ScheduleServer.createScheduleServer(null);
    }

    public void init() throws Exception {
        if(this.zkConfig != null){
            for (Map.Entry e : this.zkConfig.entrySet()) {
                ConsoleManager.properties.put(e.getKey(), e.getValue());
            }
        }
        if(ConsoleManager.properties.containsKey("onlyClient")){
            String val = String.valueOf(ConsoleManager.properties.get("onlyClient"));
            if(StringUtils.isNotBlank(val)){
                start = Boolean.valueOf(val);
            }
        }
        this.setPoolSize(DEFAULT_POOL_SIZE);
        if(ConsoleManager.properties.containsKey("poolSize")){
            String val = String.valueOf(ConsoleManager.properties.get("poolSize"));
            if(StringUtils.isNotBlank(val)){
                this.setPoolSize(Integer.valueOf(val));
            }
        }
        System.out.println("properties:"+ConsoleManager.properties);
        this.init(ConsoleManager.properties);
    }

    public void init(Properties p) throws Exception {
        if (this.initialThread != null) {
            this.initialThread.stopThread();
        }
        this.initLock.lock();
        try {
            this.scheduleDataManager = null;
            if (this.zkManager != null) {
                this.zkManager.close();
            }
            this.zkManager = new ZKManager(p);
            this.errorMessage = "Zookeeper connecting ......"
                    + this.zkManager.getConnectStr();
            initialThread = new InitialThread(this);
            initialThread.setName("ScheduleManager-initialThread");
            initialThread.start();
        } finally {
            this.initLock.unlock();
        }
    }

    private void rewriteScheduleInfo() throws Exception {
        registerLock.lock();
        try {
            if (this.isStopSchedule) {
                if (LOGGER.isDebugEnabled()) {
                    LOGGER.debug("外部命令终止调度,不在注册调度服务,避免遗留垃圾数据:"
                            + currenScheduleServer.getUuid());
                }
                return;
            }
            // 先发送心跳信息
            if (errorMessage != null) {
                this.currenScheduleServer.setDealInfoDesc(errorMessage);
            }
            if (!this.scheduleDataManager
                    .refreshScheduleServer(this.currenScheduleServer)) {
                // 更新信息失败,清除内存数据后重新注册
                this.clearMemoInfo();
                this.scheduleDataManager.registerScheduleServer(this.currenScheduleServer);
            }
            isScheduleServerRegister = true;
        } finally {
            registerLock.unlock();
        }
    }

    /**
     * 清除内存中所有的已经取得的数据和任务队列,在心态更新失败,或者发现注册中心的调度信息被删除
     */
    public void clearMemoInfo() {
        try {

        } finally {
        }

    }

    /**
     * 根据当前调度服务器的信息,重新计算分配所有的调度任务
     * 任务的分配是需要加锁,避免数据分配错误。为了避免数据锁带来的负面作用,通过版本号来达到锁的目的
     * 
     * 1、获取任务状态的版本号 2、获取所有的服务器注册信息和任务队列信息 3、清除已经超过心跳周期的服务器注册信息 3、重新计算任务分配
     * 4、更新任务状态的版本号【乐观锁】 5、根系任务队列的分配信息
     * 
     * @throws Exception
     */
    public void assignScheduleTask() throws Exception {
        scheduleDataManager.clearExpireScheduleServer();
        List serverList = scheduleDataManager.loadScheduleServerNames();
        if (!scheduleDataManager.isLeader(this.currenScheduleServer.getUuid(),
                serverList)) {
            if (LOGGER.isDebugEnabled()) {
                LOGGER.debug(this.currenScheduleServer.getUuid()
                        + ":不是负责任务分配的Leader,直接返回");
            }
            return;
        }
        //黑名单
        for(String ip:zkManager.getIpBlacklist()){
            int index = serverList.indexOf(ip);
            if (index > -1){
                serverList.remove(index);
            }
        }
        // 设置初始化成功标准,避免在leader转换的时候,新增的线程组初始化失败
        scheduleDataManager.assignTask(this.currenScheduleServer.getUuid(), serverList);
    }

    /**
     * 定时向数据配置中心更新当前服务器的心跳信息。 如果发现本次更新的时间如果已经超过了,服务器死亡的心跳周期,则不能在向服务器更新信息。
     * 而应该当作新的服务器,进行重新注册。
     * 
     * @throws Exception
     */
    public void refreshScheduleServer() throws Exception {
        try {
            rewriteScheduleInfo();
            // 如果任务信息没有初始化成功,不做任务相关的处理
            if (!this.isScheduleServerRegister) {
                return;
            }

            // 重新分配任务
            this.assignScheduleTask();
            // 检查本地任务
            this.checkLocalTask();
        } catch (Throwable e) {
            // 清除内存中所有的已经取得的数据和任务队列,避免心跳线程失败时候导致的数据重复
            this.clearMemoInfo();
            if (e instanceof Exception) {
                throw (Exception) e;
            } else {
                throw new Exception(e.getMessage(), e);
            }
        }
    }
    
    public void checkLocalTask() throws Exception {
        // 检查系统任务执行情况
        scheduleDataManager.checkLocalTask(this.currenScheduleServer.getUuid());
    }

    /**
     * 在Zk状态正常后回调数据初始化
     * 
     * @throws Exception
     */
    public void initialData() throws Exception {
        this.zkManager.initial();
        this.scheduleDataManager = new ScheduleDataManager4ZK(this.zkManager);
        checkScheduleDataManager();
        if (this.start) {
            // 注册调度管理器
            this.scheduleDataManager.registerScheduleServer(this.currenScheduleServer);
            if (hearBeatTimer == null) {
                hearBeatTimer = new Timer("ScheduleManager-"
                        + this.currenScheduleServer.getUuid() + "-HearBeat");
            }
            hearBeatTimer.schedule(new HeartBeatTimerTask(this), 1000, this.timerInterval);
            
            //初始化启动数据
            if(initTaskDefines != null && initTaskDefines.size() > 0){
                for(TaskDefine taskDefine : initTaskDefines){
                    scheduleDataManager.addTask(taskDefine);
                }
            }
        }
    }
    
    private Runnable taskWrapper(final Runnable task){
        return new Runnable(){
            public void run(){
                TaskDefine taskDefine = resolveTaskName(task);
                String name = taskDefine.stringKey();
                if(StringUtils.isNotEmpty(name)){
                    boolean isOwner = false;
                    boolean isRunning = true;
                    try {
                        if(!isScheduleServerRegister){
                            Thread.sleep(1000);
                        }
                        if(zkManager.checkZookeeperState()){
                            isOwner = scheduleDataManager.isOwner(name, currenScheduleServer.getUuid());
                            isOwnerMap.put(name, isOwner);
                            isRunning = scheduleDataManager.isRunning(name);
                        }else{
                            // 如果zk不可用,使用历史数据
                            if(null != isOwnerMap){
                                isOwner = isOwnerMap.get(name);
                            }
                        }
                        if(isOwner && isRunning){
                            String msg = null;
                            try {
                                task.run();
                                LOGGER.info("Cron job has been executed.");
                            } catch (Exception e) {
                                msg = e.getLocalizedMessage();
                            }
                            scheduleDataManager.saveRunningInfo(name, currenScheduleServer.getUuid(), taskDefine.getRunTimes(), msg);
                        }
                    } catch (Exception e) {
                        LOGGER.error("Check task owner error.", e);
                    }
                }
            }
        };
    }
    
    private TaskDefine resolveTaskName(final Runnable task) {
        Method targetMethod = null;
        TaskDefine taskDefine = new TaskDefine();
        if(task instanceof ScheduledMethodRunnable){
            ScheduledMethodRunnable runnable = (ScheduledMethodRunnable)task;
            taskDefine.setType(TaskDefine.TYPE_UNCODE_SINGLE_TASK);
            taskDefine.valueOf(runnable.getTaskDefine());
            taskDefine.setRunTimes(runnable.getRunTimes());
        }else if(task instanceof ScheduledDistributedSubRunnable){
            ScheduledDistributedSubRunnable runnable = (ScheduledDistributedSubRunnable)task;
            taskDefine.setType(TaskDefine.TYPE_UNCODE_MULTI_SUB_TASK);
            taskDefine.valueOf(runnable.getTaskDefine());
            taskDefine.setRunTimes(runnable.getRunTimes());
        }else if(task instanceof ScheduledDistributedMainRunnable){
            ScheduledDistributedMainRunnable runnable = (ScheduledDistributedMainRunnable)task;
            taskDefine.valueOf(runnable.getTaskDefine());
            taskDefine.setRunTimes(runnable.getRunTimes());
            taskDefine.setType(TaskDefine.TYPE_UNCODE_MULTI_MAIN_TASK);
        }else{
            org.springframework.scheduling.support.ScheduledMethodRunnable springScheduledMethodRunnable = (org.springframework.scheduling.support.ScheduledMethodRunnable)task;
            targetMethod = springScheduledMethodRunnable.getMethod();
            taskDefine.setType(TaskDefine.TYPE_SPRING_TASK);
            String[] beanNames = applicationcontext.getBeanNamesForType(targetMethod.getDeclaringClass());
            if(null != beanNames && StringUtils.isNotEmpty(beanNames[0])){
                taskDefine.setTargetBean(beanNames[0]);
                taskDefine.setTargetMethod(targetMethod.getName());
            }
        }
        
        return taskDefine;
    }

    class HeartBeatTimerTask extends java.util.TimerTask {
        private transient final Logger log = LoggerFactory.getLogger(HeartBeatTimerTask.class);
        ZKScheduleManager manager;

        public HeartBeatTimerTask(ZKScheduleManager aManager) {
            manager = aManager;
        }

        public void run() {
            try {
                Thread.currentThread().setPriority(Thread.MAX_PRIORITY);
                manager.refreshScheduleServer();
            } catch (Exception ex) {
                log.error(ex.getMessage(), ex);
            }
        }
    }

    class InitialThread extends Thread {
        private transient Logger log = LoggerFactory.getLogger(InitialThread.class);
        ZKScheduleManager sm;

        public InitialThread(ZKScheduleManager sm) {
            this.sm = sm;
        }

        boolean isStop = false;

        public void stopThread() {
            this.isStop = true;
        }

        @Override
        public void run() {
            sm.initLock.lock();
            try {
                int count = 0;
                while (!sm.zkManager.checkZookeeperState()) {
                    count = count + 1;
                    if (count % 50 == 0) {
                        sm.errorMessage = "Zookeeper connecting ......"
                                + sm.zkManager.getConnectStr() + " spendTime:"
                                + count * 20 + "(ms)";
                        log.error(sm.errorMessage);
                    }
                    Thread.sleep(20);
                    if (this.isStop) {
                        return;
                    }
                }
                sm.initialData();
            } catch (Throwable e) {
                log.error(e.getMessage(), e);
            } finally {
                sm.initLock.unlock();
            }

        }

    }

    public IScheduleDataManager getScheduleDataManager() {
        return scheduleDataManager;
    }

    @Override
    public void setApplicationContext(ApplicationContext applicationcontext)
            throws BeansException {
        ZKScheduleManager.applicationcontext = applicationcontext;
    }
    
    public void setZkManager(ZKManager zkManager) {
        this.zkManager = zkManager;
    }
    
    public ZKManager getZkManager() {
        return zkManager;
    }

    public void setZkConfig(Map zkConfig) {
        this.zkConfig = zkConfig;
    }
    
    /**
     * 使用fixedRate的方式提交任务调度请求
     * 
     * 任务首次启动时间未设置,任务池将会尽可能早的启动任务 
     * 
* * @param task 待执行的任务  * @param period 两次任务启动时间之间的间隔时间,默认单位是毫秒 * @return 任务句柄 */ public ScheduledFuture scheduleAtFixedRate(Runnable task, long period) { try { TaskDefine taskDefine = resolveTaskName(task); taskDefine.setPeriod(period); checkScheduleDataManager(); boolean rt = isUncodeTask(task); if(rt == false){ scheduleDataManager.addTask(taskDefine); } LOGGER.debug(currenScheduleServer.getUuid() +":自动向集群注册任务[" + taskDefine.stringKey() + "]"); } catch (Exception e) { LOGGER.error("update task error", e); } return super.scheduleAtFixedRate(taskWrapper(task), period); } /** * 提交任务调度请求 * * @param task 待执行任务   * @param trigger 使用Trigger指定任务调度规则 * @return 任务句柄 */ public ScheduledFuture schedule(Runnable task, Trigger trigger) { try { TaskDefine taskDefine = resolveTaskName(task); String cronEx = trigger.toString(); int index = cronEx.indexOf(":"); if(index >= 0){ cronEx = cronEx.substring(index + 1); taskDefine.setCronExpression(cronEx.trim()); } checkScheduleDataManager(); boolean rt = isUncodeTask(task); if(rt == false){ scheduleDataManager.addTask(taskDefine); } LOGGER.debug(currenScheduleServer.getUuid() +":自动向集群注册任务[" + taskDefine.getSingalKey() + "]"); } catch (Exception e) { LOGGER.error("update task error", e); } return super.schedule(taskWrapper(task), trigger); } /** * 提交任务调度请求 *
     * 注意任务只执行一次,使用startTime指定其启动时间  
     * 
* @param task 待执行任务 * @param startTime 任务启动时间 * @return 任务句柄 */ public ScheduledFuture schedule(Runnable task, Date startTime) { try { TaskDefine taskDefine = resolveTaskName(task); taskDefine.setStartTime(startTime); checkScheduleDataManager(); boolean rt = isUncodeTask(task); if(rt == false){ scheduleDataManager.addTask(taskDefine); } LOGGER.debug(currenScheduleServer.getUuid() +":自动向集群注册任务[" + taskDefine.getSingalKey() + "]"); } catch (Exception e) { LOGGER.error("update task error", e); } return super.schedule(taskWrapper(task), startTime); } private void checkScheduleDataManager() throws InterruptedException { if(scheduleDataManager == null){ downLatch.await(1000, TimeUnit.MILLISECONDS); }else{ downLatch.countDown(); } } private boolean isUncodeTask(Runnable task){ if(task instanceof ScheduledMethodRunnable){ return true; }else if(task instanceof ScheduledDistributedSubRunnable){ return true; }else if(task instanceof ScheduledDistributedMainRunnable){ return true; } return false; } /** * 使用fixedRate的方式提交任务调度请求 *
     * 任务首次启动时间由传入参数指定 
     * 
* @param task 待执行的任务  * @param startTime 任务启动时间 * @param period 两次任务启动时间之间的间隔时间,默认单位是毫秒 * @return 任务句柄 */ public ScheduledFuture scheduleAtFixedRate(Runnable task, Date startTime, long period) { try { TaskDefine taskDefine = resolveTaskName(task); taskDefine.setStartTime(startTime); taskDefine.setPeriod(period); checkScheduleDataManager(); boolean rt = isUncodeTask(task); if(rt == false){ scheduleDataManager.addTask(taskDefine); } LOGGER.debug(currenScheduleServer.getUuid() +":自动向集群注册任务[" + taskDefine.getSingalKey() + "]"); } catch (Exception e) { LOGGER.error("update task error", e); } return super.scheduleAtFixedRate(taskWrapper(task), startTime, period); } /** * 使用fixedDelay的方式提交任务调度请求 *
     *  任务首次启动时间由传入参数指定 
     * 
* @param task 待执行任务 * @param startTime 任务启动时间 * @param delay 上一次任务结束时间与下一次任务开始时间的间隔时间,单位默认是毫秒 * @return 任务句柄 */ public ScheduledFuture scheduleWithFixedDelay(Runnable task, Date startTime, long delay) { try { TaskDefine taskDefine = resolveTaskName(task); taskDefine.setStartTime(startTime); taskDefine.setPeriod(delay); checkScheduleDataManager(); boolean rt = isUncodeTask(task); if(rt == false){ scheduleDataManager.addTask(taskDefine); } LOGGER.debug(currenScheduleServer.getUuid() +":自动向集群注册任务[" + taskDefine.getSingalKey() + "]"); } catch (Exception e) { LOGGER.error("update task error", e); } return super.scheduleWithFixedDelay(taskWrapper(task), startTime, delay); } /** * 使用fixedDelay的方式提交任务调度请求 *
     * 任务首次启动时间未设置,任务池将会尽可能早的启动任务 
     * 
* @param task 待执行任务 * @param delay 上一次任务结束时间与下一次任务开始时间的间隔时间,单位默认是毫秒 * @return 任务句柄 */ public ScheduledFuture scheduleWithFixedDelay(Runnable task, long delay) { try { TaskDefine taskDefine = resolveTaskName(task); taskDefine.setPeriod(delay); checkScheduleDataManager(); boolean rt = isUncodeTask(task); if(rt == false){ scheduleDataManager.addTask(taskDefine); } LOGGER.debug(currenScheduleServer.getUuid() +":自动向集群注册任务[" + taskDefine.getSingalKey() + "]"); } catch (Exception e) { LOGGER.error("update task error", e); } return super.scheduleWithFixedDelay(taskWrapper(task), delay); } public boolean checkAdminUser(String account, String password){ if(StringUtils.isBlank(account) || StringUtils.isBlank(password)){ return false; } String name = zkConfig.get(ZKManager.KEYS.userName.key); String pwd = zkConfig.get(ZKManager.KEYS.password.key); if(account.equals(name) && password.equals(pwd)){ return true; } return false; } public String getScheduleServerUUid(){ if(null != currenScheduleServer){ return currenScheduleServer.getUuid(); } return null; } public Map getIsOwnerMap() { return isOwnerMap; } public static ApplicationContext getApplicationcontext() { return ZKScheduleManager.applicationcontext; } public void setInitTaskDefines(List initTaskDefines) { this.initTaskDefines = initTaskDefines; } public void destroy() { try { if (this.initialThread != null) { this.initialThread.stopThread(); } if (this.scheduleDataManager != null) { this.scheduleDataManager.clearExpireScheduleServer(); } if (this.hearBeatTimer != null) { this.hearBeatTimer.cancel(); } } catch (Exception e) { e.printStackTrace(); } finally { if (this.zkManager != null) { try { this.zkManager.close(); } catch (Exception e) { e.printStackTrace(); } } } } }

任务注册

/**
 * Static facade for managing schedule tasks through the {@link ZKScheduleManager}
 * bean obtained from the application context.
 */
public class ConsoleManager {

    private static final Logger log = LoggerFactory.getLogger(ConsoleManager.class);

    /** Lazily resolved manager; volatile so the double-checked lookup below is safe. */
    private static volatile ZKScheduleManager scheduleManager;

    static Properties properties = new Properties();

    /**
     * Adds all entries of the given properties to the shared configuration.
     *
     * @param prop entries to add
     */
    public static void setProperties(Properties prop) {
        properties.putAll(prop);
    }

    /**
     * Returns the schedule manager, looking it up in the application context on first use.
     *
     * @return the {@link ZKScheduleManager} bean
     * @throws Exception if the bean lookup fails
     */
    public static ZKScheduleManager getScheduleManager() throws Exception {
        ZKScheduleManager manager = ConsoleManager.scheduleManager;
        if (null == manager) {
            synchronized (ConsoleManager.class) {
                // Re-check inside the lock: another thread may have resolved it meanwhile.
                manager = ConsoleManager.scheduleManager;
                if (null == manager) {
                    manager = ZKScheduleManager.getApplicationcontext().getBean(ZKScheduleManager.class);
                    ConsoleManager.scheduleManager = manager;
                }
            }
        }
        return manager;
    }

    /**
     * Adds a task. Failures are logged, not propagated.
     *
     * @param taskDefine the task definition
     */
    public static void addScheduleTask(TaskDefine taskDefine) {
        try {
            log.info("添加任务:" + taskDefine.getSingalKey());
            ConsoleManager.getScheduleManager().getScheduleDataManager().addTask(taskDefine);
        } catch (Exception e) {
            log.error(e.getMessage(), e);
        }
    }

    /**
     * Deletes a task. Failures are logged, not propagated.
     *
     * @param taskDefine the task definition
     */
    public static void delScheduleTask(TaskDefine taskDefine) {
        try {
            // Go through the getter so the manager is resolved even on first use.
            ConsoleManager.getScheduleManager().getScheduleDataManager().delTask(taskDefine);
        } catch (Exception e) {
            log.error(e.getMessage(), e);
        }
    }

    /**
     * Deletes a task identified by bean and method name. Failures are logged, not propagated.
     *
     * @param targetBean   the bean name
     * @param targetMethod the method name
     * @deprecated marked as not usable by the original author; see
     *             {@link #delScheduleTask(TaskDefine)}
     */
    @Deprecated
    public static void delScheduleTask(String targetBean, String targetMethod) {
        try {
            ConsoleManager.getScheduleManager().getScheduleDataManager().delTask(targetBean, targetMethod);
        } catch (Exception e) {
            log.error(e.getMessage(), e);
        }
    }

    /**
     * Updates a task. Failures are logged, not propagated.
     *
     * @param taskDefine the task definition
     */
    public static void updateScheduleTask(TaskDefine taskDefine) {
        try {
            ConsoleManager.getScheduleManager().getScheduleDataManager().updateTask(taskDefine);
        } catch (Exception e) {
            log.error(e.getMessage(), e);
        }
    }

    /**
     * Queries all tasks.
     *
     * @return a new list with the tasks; empty when the query fails (the failure is logged)
     */
    public static List<TaskDefine> queryScheduleTask() {
        List<TaskDefine> taskDefines = new ArrayList<TaskDefine>();
        try {
            List<TaskDefine> tasks = ConsoleManager.getScheduleManager().getScheduleDataManager().selectTask();
            taskDefines.addAll(tasks);
        } catch (Exception e) {
            log.error(e.getMessage(), e);
        }
        return taskDefines;
    }

    /**
     * Tells whether a task exists.
     *
     * @param taskDefine the task definition
     * @return {@code true} when the data manager reports the task as existing
     * @throws Exception if the lookup fails
     */
    public static boolean isExistsTask(TaskDefine taskDefine) throws Exception {
        return ConsoleManager.getScheduleManager().getScheduleDataManager().isExistsTask(taskDefine);
    }

    /**
     * Queries the task matching the given definition.
     *
     * @param taskDefine the task definition used as the lookup key
     * @return the task information returned by the data manager
     * @throws Exception if the lookup fails
     */
    public static TaskDefine queryScheduleTask(TaskDefine taskDefine) throws Exception {
        return ConsoleManager.getScheduleManager().getScheduleDataManager().selectTask(taskDefine);
    }

    /**
     * Tells whether the given task belongs to the current node.
     *
     * @param taskDefine the task definition
     * @return {@code true} when the data manager reports this server as the owner
     * @throws Exception if the lookup fails
     */
    public static boolean isOwner(TaskDefine taskDefine) throws Exception {
        ZKScheduleManager manager = ConsoleManager.getScheduleManager();
        return manager.getScheduleDataManager().isOwner(taskDefine.getSingalKey(),
                manager.getScheduleServerUUid());
    }

}

你可能感兴趣的:(基于zookeeper实现任务调度(1))