using System; using System.Collections.Generic; using System.Linq; using System.Text; using Quartz; using SCC.Common; using SCC.Models; using SCC.Interface; using HtmlAgilityPack; using Newtonsoft.Json; using Newtonsoft.Json.Linq; namespace SCC.Crawler.GP { /// /// 数据爬取类 /// 山东群英会 /// [DisallowConcurrentExecution] [PersistJobDataAfterExecution] public class SDQYHJob : IJob { /// /// 构造函数 /// public SDQYHJob() { log = new LogHelper(); services = IOC.Resolve(); email = IOC.Resolve(); } /// /// 作业执行入口 /// /// 作业执行上下文 public void Execute(IJobExecutionContext context) { Config = CommonHelper.GetConfigFromDataMap(context.JobDetail.JobDataMap); //预设节假日不开奖 if (Config.SkipDate.Contains(CommonHelper.SCCSysDateTime.ToString("yyyyMMdd"))) return; LatestQiHao = context.JobDetail.JobDataMap.GetString("LatestQiHao"); try { //服务启动时配置初始数据 if (string.IsNullOrEmpty(LatestQiHao)) { var lastItem = services.GetLastItem(currentLottery); if (lastItem != null) { LatestQiHao = lastItem.Term.ToString(); } } //第一次启动服务或最新期号为昨天的开奖期号,则自检昨天开奖数据是否抓取完毕(否则插入邮件数据),并重置当天期号和失败列表 if (string.IsNullOrEmpty(LatestQiHao) || !LatestQiHao.StartsWith(CommonHelper.SCCSysDateTime.ToString("yyMMdd"))) { CheckingYesterdayTheLotteryData(); LatestQiHao = CommonHelper.GenerateTodayQiHaoYYMMDDQQQ(0); } //当最新期号不符合当天总期数,执行当天作业 if (Convert.ToInt32(LatestQiHao.Substring(6)) != Config.TimesPerDay) { DoTodayJobByMainUrl(); DoTodayJobByBackUrl(); } } catch (Exception ex) { log.Error(typeof(SDQYHJob), string.Format("【{0}】抓取时发生错误,错误信息【{1}】", Config.Area + Config.LotteryName, ex.Message)); } //保存最新期号和失败期号列表 context.JobDetail.JobDataMap["LatestQiHao"] = LatestQiHao; } /// /// 自检昨天开奖数据 /// private void CheckingYesterdayTheLotteryData() { if (Config.SkipDate.Contains(CommonHelper.SCCSysDateTime.AddDays(-1).ToString("yyyyMMdd"))) return;//如果昨日设定不开奖则不自检昨日开奖数据 //从数据库中获取昨天数据抓取失败列表 FailedQiHaoList = services.GetYesterdayFailQQQList(currentLottery, Config.TimesPerDay); if (FailedQiHaoList.Count > 0) { DoYesterdayFailedListByMainUrl(); DoYesterdayFailedListByBackUrl(); foreach (var fQiHao in FailedQiHaoList) { //将抓取失败数据推送至邮件列表,待邮件服务发送至配置管理员的邮箱中 if (email.AddEmail(Config.Area + Config.LotteryName, fQiHao, CommonHelper.GenerateYesterdayOpenTime(Config, fQiHao))) log.Error(typeof(SDQYHJob), CommonHelper.GetJobLogError(Config, fQiHao)); } } } /// /// 通过主站点抓取开奖数据 /// (山东福彩网) /// private void DoTodayJobByMainUrl() { if (!string.IsNullOrEmpty(Config.MainUrl)) { var OpenList = GetTodayOpenListFromMainUrl(); if (OpenList.Count == 0) return;//无抓取数据 var newestQiHao = OpenList.First().Key; var startQiNum = Convert.ToInt32(LatestQiHao.Substring(6)) + 1; var newestQiNum = Convert.ToInt32(newestQiHao.Substring(6)); if (startQiNum > newestQiNum) return;//无最新数据 //处理最新开奖数据 string getQiHao = string.Empty; for (var i = startQiNum; i <= newestQiNum; i++) { getQiHao = CommonHelper.GenerateTodayQiHaoYYMMDDQQQ(i); var matchItem = OpenList.Where(R => R.Key == getQiHao).FirstOrDefault(); if (matchItem.Key != null && SaveRecord(getQiHao, matchItem.Value, false)) { //处理成功写入日志 log.Info(typeof(SDQYHJob), CommonHelper.GetJobMainLogInfo(Config, getQiHao)); LatestQiHao = getQiHao; } } } } /// /// 通过主站抓取错误期号列表中每一个期号 /// (山东福彩网) /// private void DoYesterdayFailedListByMainUrl() { if (!string.IsNullOrEmpty(Config.MainUrl) && FailedQiHaoList.Count > 0) { var OpenList = GetYesterdayOpenListFromMainUrl(); if (OpenList.Count == 0) return;//无抓取数据 var SuccessList = new List(); foreach (string failedQiHao in FailedQiHaoList) { var matchItem = OpenList.Where(R => R.Key == failedQiHao).FirstOrDefault(); if (matchItem.Key != null && SaveRecord(failedQiHao, matchItem.Value, true)) { //处理成功写入日志 log.Info(typeof(SDQYHJob), CommonHelper.GetJobMainLogInfo(Config, failedQiHao)); SuccessList.Add(failedQiHao); continue; } } foreach (var successQiHao in SuccessList) { FailedQiHaoList.Remove(successQiHao); } } } /// /// 通过主站点抓取今日最新开奖列表 /// /// private Dictionary GetTodayOpenListFromMainUrl() { var postdata = string.Format("q1={0}&q2={1}&method=tjtQyhNew", string.Empty, string.Empty); return GetOpenListFromMainUrl(postdata); } /// /// 通过主站点抓取昨日开奖列表 /// /// private Dictionary GetYesterdayOpenListFromMainUrl() { var yesterdayFirst = CommonHelper.SCCSysDateTime.AddDays(-1).ToString("yyMMdd") + "K001"; var yesterdayLast = CommonHelper.SCCSysDateTime.AddDays(-1).ToString("yyMMdd") + "K" + Config.TimesPerDay.ToString().PadLeft(3, '0'); var postdata = string.Format("q1={0}&q2={1}&method=tjtQyhNew", yesterdayFirst, yesterdayLast); return GetOpenListFromMainUrl(postdata); } /// /// 通过主站点抓取开奖列表 /// /// 请求数据 /// private Dictionary GetOpenListFromMainUrl(string postdata) { Dictionary result = new Dictionary(); try { var HtmlResource = NetHelper.GetUrlResponse(Config.MainUrl, "POST", postdata, Encoding.GetEncoding("gb2312")); if (!string.IsNullOrWhiteSpace(HtmlResource)) { HtmlDocument doc = new HtmlDocument(); doc.LoadHtml(HtmlResource); var tables = doc.DocumentNode.SelectNodes("//table"); if (tables.Count < 2) return result; var trs = tables[1].ChildNodes.Where(node => node.Name == "tr").ToList(); string matchQiHao = string.Empty; string matchKJHaoMa = string.Empty; List tds = null; for (var i = 1; i < trs.Count - 1; i++)//第一行是表头,最后一行也是表头内容 { var trstyle = trs[i].Attributes["style"]; if (trstyle != null && trstyle.Value == "display:none") { continue; } tds = trs[i].ChildNodes.Where(node => node.Name == "td").ToList(); matchQiHao = tds[0].InnerText.Trim().Replace("K", ""); matchKJHaoMa = tds[3].InnerText.Trim().Replace(" ", ","); result.Add(matchQiHao, matchKJHaoMa); } } } catch (Exception ex) { log.Error(typeof(SDQYHJob), string.Format("【{0}】通过主站点抓取开奖列表时发生错误,错误信息【{1}】", Config.Area + Config.LotteryName, ex.Message)); } return result; } /// /// 通过备用站点抓取开奖数据 /// (彩乐乐) /// private void DoTodayJobByBackUrl() { if (!string.IsNullOrEmpty(Config.BackUrl)) { var OpenList = GetTodayOpenListFromBackUrl(); if (OpenList.Count == 0) return;//无抓取数据 var newestQiHao = OpenList.Last().Key; var startQiNum = Convert.ToInt32(LatestQiHao.Substring(6)) + 1; var newestQiNum = Convert.ToInt32(newestQiHao.Substring(6)); if (startQiNum > newestQiNum) return;//无最新数据 //处理最新开奖数据 var getQiHao = string.Empty; for (var i = startQiNum; i <= newestQiNum; i++) { getQiHao = CommonHelper.GenerateTodayQiHaoYYMMDDQQQ(i); var matchItem = OpenList.Where(R => R.Key == getQiHao).FirstOrDefault(); if (matchItem.Key != null && SaveRecord(getQiHao, matchItem.Value, false)) { //处理成功写入日志 log.Info(typeof(SDQYHJob), CommonHelper.GetJobBackLogInfo(Config, getQiHao)); LatestQiHao = getQiHao; } } } } /// /// 通过备用地址抓取错误期号列表中每一个期号 /// (彩乐乐) /// private void DoYesterdayFailedListByBackUrl() { if (!string.IsNullOrEmpty(Config.BackUrl) && FailedQiHaoList.Count > 0) { var OpenList = GetYesterdayOpenListFromBackUrl(); if (OpenList.Count == 0) return;//无抓取数据 var SuccessList = new List(); foreach (var failedQiHao in FailedQiHaoList) { var matchItem = OpenList.Where(R => R.Key == failedQiHao).FirstOrDefault(); if (matchItem.Key != null && SaveRecord(failedQiHao, matchItem.Value, true)) { //处理成功写入日志 log.Info(typeof(SDQYHJob), CommonHelper.GetJobBackLogInfo(Config, failedQiHao)); SuccessList.Add(failedQiHao); continue; } } foreach (var successQiHao in SuccessList) { FailedQiHaoList.Remove(successQiHao); } } } /// /// 通过备用站点抓取今日最新开奖数据 /// /// private Dictionary GetTodayOpenListFromBackUrl() { var requestUrl = string.Format(Config.BackUrl, 0); return GetOpenListFromBackUrl(requestUrl); } /// /// 通过备用站点抓取昨日开奖数据 /// /// private Dictionary GetYesterdayOpenListFromBackUrl() { var requestUrl = string.Format(Config.BackUrl, 1); return GetOpenListFromBackUrl(requestUrl); } /// /// 通过备用站点抓取开奖数据 /// /// 备用站点 /// private Dictionary GetOpenListFromBackUrl(string requestUrl) { Dictionary result = new Dictionary(); try { var HtmlResource = NetHelper.GetUrlResponse(requestUrl); if (!string.IsNullOrWhiteSpace(HtmlResource)) { HtmlDocument doc = new HtmlDocument(); doc.LoadHtml(HtmlResource); var tbody = doc.GetElementbyId("cpdata_new"); if (tbody == null) return result; var trs = tbody.ChildNodes.Where(node => node.Name == "tr").ToList(); string matchQiHao = string.Empty; string matchKJHaoMa = string.Empty; for (var i = 0; i < trs.Count; i++)//第一行是表头 { var trstyle = trs[i].Attributes["style"]; if (trstyle != null && trstyle.Value == "display:none") { continue; } var tds = trs[i].ChildNodes.Where(node => node.Name == "td").ToList(); matchQiHao = tds[0].InnerText.Trim(); matchKJHaoMa = string.Format("{0},{1},{2},{3},{4}", tds[1].InnerText.Trim(), tds[2].InnerText.Trim(), tds[3].InnerText.Trim(), tds[4].InnerText.Trim(), tds[5].InnerText.Trim()); result.Add(matchQiHao, matchKJHaoMa); } } } catch (Exception ex) { log.Error(typeof(HLJ11X5Job), string.Format("【{0}】通过备用站点抓取开奖列表时发生错误,错误信息【{1}】", Config.Area + Config.LotteryName, ex.Message)); } return result; } /// /// 将此彩种指定期号和开奖号码保存至数据库 /// /// 期号 /// 开奖号码(形如01,02,03,04,05) /// 是否是保存昨天的记录 /// private bool SaveRecord(string QiHao, string OpenCode, bool IsYesterdayRecord) { if (!string.IsNullOrWhiteSpace(QiHao) && !string.IsNullOrWhiteSpace(OpenCode)) { OpenCode5Model model = new OpenCode5Model(); model.Term = Convert.ToInt64(QiHao); var haoMaArray = OpenCode.Split(new char[] { ',' }); model.OpenCode1 = Convert.ToInt32(haoMaArray[0]); model.OpenCode2 = Convert.ToInt32(haoMaArray[1]); model.OpenCode3 = Convert.ToInt32(haoMaArray[2]); model.OpenCode4 = Convert.ToInt32(haoMaArray[3]); model.OpenCode5 = Convert.ToInt32(haoMaArray[4]); if (IsYesterdayRecord) model.OpenTime = CommonHelper.GenerateYesterdayOpenTime(Config, QiHao); else model.OpenTime = CommonHelper.GenerateTodayOpenTime(Config, QiHao); return services.AddOpen5Code(currentLottery, model); } return false; } #region Attribute /// /// 配置信息 /// private SCCConfig Config = null; /// /// 当天抓取的最新一期期号 /// private string LatestQiHao = null; /// /// 当天抓取失败列表 /// private List FailedQiHaoList = null; /// /// 日志对象 /// private LogHelper log = null; /// /// 数据服务 /// private IOpen5Code services = null; /// /// 当前彩种 /// private SCCLottery currentLottery { get { return SCCLottery.ShanDongQYH; } } /// /// 邮件接口 /// private IEmail email = null; #endregion } }