標籤:lis auto ken 並發 obs sleep form cancel serial
Quartz.Net的叢集部署詳解
標籤(空格分隔): Quartz.Net Job
最近工作上要用Job,公司的job有些不滿足個人的使用,於是就想自己搞一個Job站練練手,網上看了一下,發現Quartz,於是就瞭解了一下。
第一版
目前個人使用的是Asp.net Core,在core2.0下面進行的開發。
第一版自己簡單的寫了一個調度器。
// Process-wide access point to one lazily created Quartz scheduler, plus helpers
// that wrap scheduler calls and report the outcome through a BaseResponse
// (IsSuccess / Msg) instead of letting exceptions escape.
public static class SchedulerManage
{
    private static IScheduler _scheduler = null;

    // Gate used only while the scheduler is being created for the first time.
    // readonly so the lock target can never be replaced.
    private static readonly object obj = new object();

    // Returns the shared scheduler, creating and starting it on first access.
    public static IScheduler Scheduler
    {
        get
        {
            // Same Volatile access as inside the lock, so the unlocked check
            // observes the value published by Volatile.Write below.
            var scheduler = Volatile.Read(ref _scheduler);
            if (scheduler == null)
            {
                lock (obj)
                {
                    // Re-read under the lock: another thread may have created
                    // the scheduler between the first check and lock entry.
                    scheduler = Volatile.Read(ref _scheduler);
                    if (scheduler == null)
                    {
                        // A property getter cannot await. GetAwaiter().GetResult()
                        // rethrows the original exception, whereas .Result would
                        // wrap it in an AggregateException and hide the real
                        // message from the catch blocks of the callers below.
                        scheduler = GetScheduler().GetAwaiter().GetResult();
                        Volatile.Write(ref _scheduler, scheduler);
                    }
                }
            }
            return scheduler;
        }
    }

    // Schedules the job with the trigger, or resumes it when a job with the same
    // key is already known to the scheduler.
    // On success Msg holds a timestamp: the value returned by ScheduleJob for a
    // new job, or the current local time for a resumed one.
    // On failure IsSuccess keeps its default and Msg holds the exception message.
    public static async Task<BaseResponse> RunJob(IJobDetail job, ITrigger trigger)
    {
        var response = new BaseResponse();
        try
        {
            var isExist = await Scheduler.CheckExists(job.Key);
            var time = DateTimeOffset.Now;
            if (isExist)
            {
                // Resume the job that already exists.
                await Scheduler.ResumeJob(job.Key);
            }
            else
            {
                time = await Scheduler.ScheduleJob(job, trigger);
            }
            response.IsSuccess = true;
            response.Msg = time.ToString("yyyy-MM-dd HH:mm:ss");
        }
        catch (Exception ex)
        {
            response.Msg = ex.Message;
        }
        return response;
    }

    // Pauses the job when it exists. A missing job is still reported as success.
    public static async Task<BaseResponse> StopJob(JobKey jobKey)
    {
        var response = new BaseResponse();
        try
        {
            var isExist = await Scheduler.CheckExists(jobKey);
            if (isExist)
            {
                await Scheduler.PauseJob(jobKey);
            }
            response.IsSuccess = true;
            response.Msg = "暫停成功!!";
        }
        catch (Exception ex)
        {
            response.Msg = ex.Message;
        }
        return response;
    }

    // Deletes the job when it exists; IsSuccess is the result of DeleteJob.
    // When the job does not exist the response is returned untouched, i.e.
    // IsSuccess keeps its default value and Msg is not set.
    public static async Task<BaseResponse> DelJob(JobKey jobKey)
    {
        var response = new BaseResponse();
        try
        {
            var isExist = await Scheduler.CheckExists(jobKey);
            if (isExist)
            {
                response.IsSuccess = await Scheduler.DeleteJob(jobKey);
            }
        }
        catch (Exception ex)
        {
            response.IsSuccess = false;
            response.Msg = ex.Message;
        }
        return response;
    }

    // Builds a scheduler from a factory configured only with the binary
    // serializer, and starts it before returning.
    private static async Task<IScheduler> GetScheduler()
    {
        NameValueCollection props = new NameValueCollection()
        {
            { "quartz.serializer.type", "binary" }
        };
        StdSchedulerFactory factory = new StdSchedulerFactory(props);
        var scheduler = await factory.GetScheduler();
        await scheduler.Start();
        return scheduler;
    }
}
簡單地實現了動態運行Job、暫停Job、添加Job。弄完以後,發現貌似沒啥問題,只要自己把運行中的Job資訊找張表儲存一下,好像都OK了。
輪到發布的時候,突然發現現實中機器不止一台,是通過Nginx進行反向代理的。於是發現了以下幾個問題:
1,多台機器很有可能一個Job在多台機器上運行。
2,當進行部署的時候,必須得停掉機器,如何在機器停掉以後重新部署的時候自動恢復正在運行的Job。
3,如何均衡的運行所有job。
個人當時的想法
1,第一個問題:由於是經過Nginx的反向代理,添加Job和運行Job的請求只會落到一台伺服器上,基本沒啥問題。個人控制好RunJob的介面,運行了一次,就把JobDetail那張表的運行狀態改成已運行,也就不存在多台機器同時運行的情況。
2,在第一個問題解決的情況下,由於我們公司的Nginx反向代理的邏輯是均衡策略,所以均衡運行所有Job也沒啥問題。
3,重點來了!!!!
如何在部署的時候恢復正在運行的Job?
由於我們已經有了一張JobDetail表,從裡面可以擷取到哪些是正在運行的Job,那麼我們把它們找出來,直接在程式啟動的時候運行一下不就好了嘛。
下面是個人實現的:
// HostedService: a service executed when the host starts and when it stops.
// On start it re-runs every job recorded as running, guarded by a Redis key so
// that only one instance does so.
public class HostedService : IHostedService
{
    private ISchedulerJob _schedulerJob = null;

    public HostedService(ISchedulerJob schedulerCenter)
    {
        _schedulerJob = schedulerCenter;
    }

    // Tries to create the "RedisJobLock" key; only the instance that succeeds
    // restarts the recorded jobs.
    public async Task StartAsync(CancellationToken cancellationToken)
    {
        // The original logged an undeclared `env` identifier; Kernel.Environment
        // is the environment value used by SchedulerCenter.StartAllRuningJob.
        LogHelper.WriteLog("開啟Hosted+Env:" + Kernel.Environment);
        var reids = new RedisOperation();
        if (reids.SetNx("RedisJobLock", "1"))
        {
            await _schedulerJob.StartAllRuningJob();
        }
        // Executed whether or not this instance created the key, so every
        // start-up re-arms the expiry.
        // NOTE(review): 300 is presumably seconds - confirm against RedisOperation.Expire.
        reids.Expire("RedisJobLock", 300);
    }

    // Removes the "RedisJobLock" key if it is still present and logs the result.
    public async Task StopAsync(CancellationToken cancellationToken)
    {
        LogHelper.WriteLog("結束Hosted");
        var redis = new RedisOperation();
        if (redis.RedisExists("RedisJobLock"))
        {
            var count = redis.DelKey("RedisJobLock");
            LogHelper.WriteLog("刪除Reidskey-RedisJobLock結果:" + count);
        }
    }
}

// Attribute used for dependency-injection registration.
[ServiceDescriptor(typeof(ISchedulerJob), ServiceLifetime.Transient)]
public class SchedulerCenter : ISchedulerJob
{
    private ISchedulerJobFacade _schedulerJobFacade = null;

    public SchedulerCenter(ISchedulerJobFacade schedulerJobFacade)
    {
        _schedulerJobFacade = schedulerJobFacade;
    }

    // Marks the job record with DataFlag = 0, then deletes the job from the
    // scheduler. If the scheduler reports failure the record is set back to
    // DataFlag = 1 and the response of that second Modify call is returned.
    public async Task<BaseResponse> DelJob(SchedulerJobModel jobModel)
    {
        var response = new BaseResponse();
        if (jobModel != null && jobModel.JobId != 0 && jobModel.JobName != null)
        {
            response = await _schedulerJobFacade.Modify(new SchedulerJobModifyRequest() { JobId = jobModel.JobId, DataFlag = 0 });
            if (response.IsSuccess)
            {
                response = await SchedulerManage.DelJob(GetJobKey(jobModel));
                if (!response.IsSuccess)
                {
                    response = await _schedulerJobFacade.Modify(new SchedulerJobModifyRequest() { JobId = jobModel.JobId, DataFlag = 1 });
                }
            }
        }
        else
        {
            response.Msg = "請求參數有誤";
        }
        return response;
    }

    // Builds a cron trigger and job detail from the model, hands them to
    // SchedulerManage.RunJob and, on success, records JobState = 1. If that
    // record update fails the job is paused again.
    public async Task<BaseResponse> RunJob(SchedulerJobModel jobModel)
    {
        if (jobModel != null)
        {
            var jobKey = GetJobKey(jobModel);
            var triggleBuilder = TriggerBuilder.Create()
                .WithIdentity(jobModel.JobName + "Trigger", jobModel.JobGroup)
                .WithCronSchedule(jobModel.JobCron)
                .StartAt(jobModel.JobStartTime);

            // Apply an end time only when a real one is set. 1900-01-01 and
            // 0001-01-01 are both treated as "no end time". The original compared
            // the last term with ==, so EndAt was applied only for the empty
            // 0001-01-01 value and never for a genuine end time.
            if (jobModel.JobEndTime != null
                && jobModel.JobEndTime != new DateTime(1900, 1, 1)
                && jobModel.JobEndTime != new DateTime(1, 1, 1))
            {
                triggleBuilder.EndAt(jobModel.JobEndTime);
            }
            triggleBuilder.ForJob(jobKey);
            var triggle = triggleBuilder.Build();

            var data = new JobDataMap();
            data.Add("***", "***");
            data.Add("***", "***");
            data.Add("***", "***");
            var job = JobBuilder.Create<SchedulerJob>().WithIdentity(jobKey).SetJobData(data).Build();

            var result = await SchedulerManage.RunJob(job, triggle);
            if (result.IsSuccess)
            {
                var response = await _schedulerJobFacade.Modify(new SchedulerJobModifyRequest() { JobId = jobModel.JobId, JobState = 1 });
                if (!response.IsSuccess)
                {
                    // The record could not be updated, so do not leave the job running.
                    await SchedulerManage.StopJob(jobKey);
                }
                return response;
            }
            else
            {
                return result;
            }
        }
        else
        {
            return new BaseResponse() { Msg = "Job名稱為空白!!" };
        }
    }

    // Records JobState = 2, then pauses the job in the scheduler. If the
    // scheduler reports failure the record is set back to JobState = 1 (the
    // value RunJob writes), mirroring the rollback in DelJob. The original
    // wrote JobState = 2 again, which rolled nothing back.
    public async Task<BaseResponse> StopJob(SchedulerJobModel jobModel)
    {
        var response = new BaseResponse();
        if (jobModel != null && jobModel.JobId != 0 && jobModel.JobName != null)
        {
            response = await _schedulerJobFacade.Modify(new SchedulerJobModifyRequest() { JobId = jobModel.JobId, JobState = 2 });
            if (response.IsSuccess)
            {
                response = await SchedulerManage.StopJob(GetJobKey(jobModel));
                if (!response.IsSuccess)
                {
                    response = await _schedulerJobFacade.Modify(new SchedulerJobModifyRequest() { JobId = jobModel.JobId, JobState = 1 });
                }
            }
        }
        else
        {
            response.Msg = "請求參數有誤";
        }
        return response;
    }

    // Job key is "<JobId>_<JobName>" within the model's job group.
    private JobKey GetJobKey(SchedulerJobModel jobModel)
    {
        return new JobKey($"{jobModel.JobId}_{jobModel.JobName}", jobModel.JobGroup);
    }

    // Queries the job records with DataFlag = 1 and JobState = 1 for the current
    // environment and calls RunJob for each one. The individual RunJob results
    // are not inspected; only a failed query or an exception yields a failure.
    public async Task<BaseResponse> StartAllRuningJob()
    {
        try
        {
            var jobListResponse = await _schedulerJobFacade.QueryList(new SchedulerJobListRequest() { DataFlag = 1, JobState = 1, Environment = Kernel.Environment.ToLower() });
            if (!jobListResponse.IsSuccess)
            {
                return jobListResponse;
            }
            var jobList = jobListResponse.Models;
            foreach (var job in jobList)
            {
                await RunJob(job);
            }
            return new BaseResponse() { IsSuccess = true, Msg = "程式啟動時,啟動所有運行中的job成功!!" };
        }
        catch (Exception ex)
        {
            LogHelper.WriteExceptionLog(ex);
            return new BaseResponse() { IsSuccess = false, Msg = "程式啟動時,啟動所有運行中的job失敗!!" };
        }
    }
}
在程式啟動的時候,把所有的Job運行一遍,當中為了避免重複運行用到了Redis的分布式鎖:先在啟動的時候鎖住,不讓別的機器運行,在程式卸載的時候再把鎖釋放掉!!感覺沒啥問題,主要是負載平衡可能有問題,Job全打到一台伺服器上去了,勉強能夠快速地達到效果。當然高可用什麼的就先犧牲掉了。
坑點又來了
大家知道,在稍微大點的公司,運維和開發是分開的,公司用的是Docker進行部署,在程式停止的時候,不會調用
HostedService的StopAsync方法!!
當時心裡真是一萬個和諧和諧奔騰而過!!
個人也就懶得和運維去扯這些東西了。最後的最後就是:設定一個Redis分布式鎖的到期時間,大概預估一個部署的時間,只要在部署期間鎖還在就行了,然後每次部署的間隔要大於鎖的到期時間。好麻煩,說多了都是淚!!
Quartz.Net的分布式叢集運用Schedule配置
// Creates a scheduler from a factory configured for a clustered, database-backed
// job store (Quartz AdoJobStore on SQL Server). The scheduler is returned
// without being started.
// NOTE(review): the connection string, including credentials, is hard-coded
// below; consider loading it from configuration instead.
public async Task<IScheduler> GetScheduler()
{
    var settings = new NameValueCollection
    {
        { "quartz.serializer.type", "binary" },
        // Job store type.
        { "quartz.jobStore.type", "Quartz.Impl.AdoJobStore.JobStoreTX, Quartz" },
        // Table name prefix.
        { "quartz.jobStore.tablePrefix", "QRTZ_" },
        // Driver delegate type.
        { "quartz.jobStore.driverDelegateType", "Quartz.Impl.AdoJobStore.SqlServerDelegate, Quartz" },
        // Name of the data source.
        { "quartz.jobStore.dataSource", "SchedulJob" },
        // Connection string, in the form:
        // Data Source = myServerAddress;Initial Catalog = myDataBase;User Id = myUsername;Password = myPassword;
        { "quartz.dataSource.SchedulJob.connectionString", "Data Source =.; Initial Catalog = SchedulJob;User ID = sa; Password = Ld309402556;" },
        // SQL Server provider (under .NET Core there are no 20/21 versioned providers any more).
        { "quartz.dataSource.SchedulJob.provider", "SqlServer" },
        // Whether to run clustered; must be "true" in cluster mode.
        { "quartz.jobStore.clustered", "true" },
        { "quartz.scheduler.instanceName", "TestScheduler" },
        // In cluster mode use AUTO so every instance gets its own id; the ids
        // must differ between nodes, otherwise automatic recovery does not happen.
        { "quartz.scheduler.instanceId", "AUTO" },
        { "quartz.threadPool.type", "Quartz.Simpl.SimpleThreadPool, Quartz" },
        { "quartz.threadPool.threadCount", "25" },
        { "quartz.threadPool.threadPriority", "Normal" },
        { "quartz.jobStore.misfireThreshold", "60000" },
        { "quartz.jobStore.useProperties", "false" }
    };

    ISchedulerFactory schedulerFactory = new StdSchedulerFactory(settings);
    var clusteredScheduler = await schedulerFactory.GetScheduler();
    return clusteredScheduler;
}
然後是測試代碼:
// Demo: schedules two recoverable jobs that repeat every 5 seconds, starts the
// scheduler, keeps it running for one hour and then shuts it down.
public async Task TestJob()
{
    var sched = await GetScheduler();

    // To begin from an empty job store, clear existing jobs/triggers here
    // (await sched.Clear()).
    Console.WriteLine("------- Initialization Complete -----------");
    Console.WriteLine("------- Scheduling Jobs ------------------");

    // Group name for jobs and triggers (sched.SchedulerInstanceId is the alternative).
    string schedId = sched.SchedulerName;

    // Every scheduler call returns a Task. They are awaited so that failures
    // surface here and Start() cannot run before the jobs are stored.
    await ScheduleRecoveryJob(sched, schedId, 1, 1);
    await ScheduleRecoveryJob(sched, schedId, 2, 2);

    // Jobs don't start firing until Start() has been called.
    Console.WriteLine("------- Starting Scheduler ---------------");
    await sched.Start();
    Console.WriteLine("------- Started Scheduler ----------------");

    Console.WriteLine("------- Waiting for one hour... ----------");
    // Task.Delay instead of Thread.Sleep: waits without blocking a thread.
    await Task.Delay(TimeSpan.FromHours(1));

    Console.WriteLine("------- Shutting Down --------------------");
    await sched.Shutdown();
    Console.WriteLine("------- Shutdown Complete ----------------");
}

// Schedules one SimpleRecoveryJob named "job_<count>" with trigger
// "triger_<count>", first firing startDelaySeconds from now and then repeating
// 1000 times at 5-second intervals.
private async Task ScheduleRecoveryJob(IScheduler sched, string schedId, int count, int startDelaySeconds)
{
    IJobDetail job = JobBuilder.Create<SimpleRecoveryJob>()
        // Put jobs/triggers in a group named after the scheduler, just to
        // distinguish (in logging) what was scheduled from where.
        .WithIdentity("job_" + count, schedId)
        // Ask the scheduler to re-execute this job if it was in progress when
        // the scheduler went down.
        .RequestRecovery()
        .Build();

    ISimpleTrigger trigger = (ISimpleTrigger)TriggerBuilder.Create()
        .WithIdentity("triger_" + count, schedId)
        .StartAt(DateBuilder.FutureDate(startDelaySeconds, IntervalUnit.Second))
        .WithSimpleSchedule(x => x.WithRepeatCount(1000).WithInterval(TimeSpan.FromSeconds(5)))
        .Build();

    Console.WriteLine("{0} will run at: {1} and repeat: {2} times, every {3} seconds", job.Key, trigger.GetNextFireTimeUtc(), trigger.RepeatCount, trigger.RepeatInterval.TotalSeconds);
    await sched.ScheduleJob(job, trigger);
}
測試添加兩個job,每隔5s執行一次。
在圖中可以看到:job1和job2不會重複執行;當我停掉運行job2的那個執行個體時,job2也會轉到運行job1的執行個體當中運行。
這樣就可以解決分布式部署時的問題了,Quartz.Net的資料庫結構(建表腳本)隨便在網上找一下,運行一下就好了。
截取幾個資料庫的資料圖:基本上就儲存了一些這樣的資訊
JobDetail
觸發器的資料
這個是調度器的
這個是鎖的
下一期:
1.Job的介紹:有狀態Job,無狀態Job。
2.MisFire
3.Trigger,Cron介紹
4.第一部分的改造,自己實現一個基於在HostedService能夠進行分布式調度的Job類,其實只要實現了這個,其他的上面講的都沒有問題。棄用Quartz的表的行級鎖。因為這並發高了比較慢!!
個人問題
個人還是沒有測試出來這個RequestRecovery到底是怎麼用的!!
Quartz.Net分布式運用