using System;
using System.Collections.Generic;
using System.Linq;
using System.Text;
using System.Text.RegularExpressions;
using HtmlAgilityPack;
using Quartz;
using SCC.Common;
using SCC.Crawler.Tools;
using SCC.Interface;
using SCC.Models;

namespace SCC.Crawler.DT
{
    /// <summary>
    /// Quartz job that crawls draw results of the Jiangsu Sports Lottery "7-digit" game
    /// (<see cref="SCCLottery.JiangSuTC7WS"/>) and stores every term that is newer than
    /// the last stored one. The main site is tried first, then the backup site.
    /// </summary>
    /// <remarks>
    /// The most recently stored record is kept in the job data map under the key
    /// "LatestItem" so that the next execution can continue from it.
    /// NOTE(review): generic type arguments in this file (IOC.Resolve, List, JsonToEntity,
    /// GetListS) were reconstructed from how the values are used - confirm against the
    /// declarations in SCC.Interface / SCC.Common.
    /// </remarks>
    [DisallowConcurrentExecution]
    [PersistJobDataAfterExecution]
    public class JSTC7WSJob : IJob
    {
        /// <summary>
        /// Upper bound on the number of result pages requested from the main site in one
        /// crawl. It only exists to guarantee that the paging loop terminates.
        /// </summary>
        private const int MaxMainPages = 200;

        /// <summary>Prize level names read from the detail page of the main site.</summary>
        private static readonly HashSet<string> MainPrizeLevels = new HashSet<string>
        {
            "特等奖", "一等奖", "二等奖", "三等奖", "四等奖", "五等奖"
        };

        // Sales figure used by terms up to 2016-182. The parentheses and the colon are
        // matched literally (ASCII or full-width); written unescaped they would form a
        // capture group and "$1" would no longer be the amount.
        private static readonly Regex ProvinceSalesRegex =
            new Regex(@"本省[((]区、市[))]销售额[::]([\s\S]*?)元");

        // Sales figure used by terms from 2016-183 onwards.
        private static readonly Regex TermSalesRegex =
            new Regex(@"本期销售金额[::]([\s\S]*?)元");

        // NOTE(review): the markup inside the original jackpot literals was lost; the "+ 4"
        // offset used with it suggests a 4-character line-break tag. All common spellings
        // of that tag are accepted here - confirm against a live detail page.
        private static readonly Regex LineBreakRegex =
            new Regex(@"<br\s*/?>", RegexOptions.IgnoreCase);

        private static readonly Regex JackpotRegex =
            new Regex(@"<br\s*/?>([\s\S]*?)元", RegexOptions.IgnoreCase);

        /// <summary>
        /// Creates the job and resolves the logger, the data service and the e-mail service.
        /// </summary>
        public JSTC7WSJob()
        {
            log = new LogHelper();
            services = IOC.Resolve<IDTOpenCode>();
            email = IOC.Resolve<IEmail>();
        }

        /// <summary>
        /// Job entry point: loads the configuration, restores the last stored record and
        /// crawls both sites when the configuration says a draw has to be fetched.
        /// </summary>
        /// <param name="context">Quartz execution context carrying the job data map.</param>
        public void Execute(IJobExecutionContext context)
        {
            Config = CommonHelper.GetConfigFromDataMap(context.JobDetail.JobDataMap);

            // Configured skip dates (holidays without a draw): nothing to do.
            if (Config.SkipDate.Contains(CommonHelper.SCCSysDateTime.ToString("yyyyMMdd")))
            {
                return;
            }

            LatestItem = context.JobDetail.JobDataMap["LatestItem"] as OpenCode7DTModel;
            try
            {
                // First run after service start: take the last stored record, or start
                // from term 0 of the current year when nothing is stored yet.
                if (LatestItem == null)
                {
                    LatestItem = services.GetOpenCode7DTLastItem(currentLottery) ?? CreateYearStartItem();
                }

                // Catch-up pass: the helper decides from the configuration whether an
                // earlier draw still has to be fetched.
                isGetData = false;
                if (CommonHelper.CheckDTIsNeedGetData(Config))
                {
                    DoMainUrl();
                    DoBackUrl();
                }

                // A record from another year cannot be continued: restart numbering.
                var currentYearPrefix = CommonHelper.SCCSysDateTime.ToString("yy");
                if (!LatestItem.Term.ToString().StartsWith(currentYearPrefix, StringComparison.Ordinal))
                {
                    LatestItem = CreateYearStartItem();
                }

                // Today's draw.
                // NOTE(review): the original comment said "after 8 pm" but the condition
                // checks for hour > 12 - confirm which one is intended.
                if (CommonHelper.CheckTodayIsOpenDay(Config) && CommonHelper.SCCSysDateTime.Hour > 12)
                {
                    DoMainUrl();
                    DoBackUrl();
                }

                // Trend chart generation (TrendChartHelper.GenerateJSTC7WSTrendChart) is
                // currently disabled.
            }
            catch (Exception ex)
            {
                log.Error(typeof(JSTC7WSJob),
                    string.Format("【{0}】抓取时发生错误,错误信息【{1}】", Config.Area + currentLottery, ex.Message));
            }

            // Remember the newest stored record for the next execution.
            context.JobDetail.JobDataMap["LatestItem"] = LatestItem;
        }

        /// <summary>
        /// Builds the placeholder record "term 0 of the current year, drawn on January 1st".
        /// </summary>
        private static OpenCode7DTModel CreateYearStartItem()
        {
            return new OpenCode7DTModel
            {
                Term = CommonHelper.GenerateQiHaoYYQQQ(0),
                OpenTime = new DateTime(CommonHelper.SCCSysDateTime.Year, 1, 1)
            };
        }

        /// <summary>
        /// Crawls the main site (Jiangsu Sports Lottery web site) and stores new terms.
        /// Does nothing when no main URL is configured.
        /// </summary>
        private void DoMainUrl()
        {
            if (string.IsNullOrEmpty(Config.MainUrl))
            {
                return;
            }

            SaveNewTerms(GetOpenListFromMainUrl(Config.MainUrl), true);
        }

        /// <summary>
        /// Crawls the backup site (Baidu Lecai) and stores new terms.
        /// Does nothing when no backup URL is configured.
        /// </summary>
        private void DoBackUrl()
        {
            if (string.IsNullOrEmpty(Config.BackUrl))
            {
                return;
            }

            SaveNewTerms(GetOpenListFromBackUrl(), false);
        }

        /// <summary>
        /// Stores every crawled term between the one after <see cref="LatestItem"/> and the
        /// newest crawled term. A term is a two-digit year followed by a three-digit sequence.
        /// </summary>
        /// <param name="openList">Crawled records, newest first.</param>
        /// <param name="fromMainSite">
        /// True for main-site records: their prize details are fetched before saving and a
        /// record whose details cannot be fetched is not saved.
        /// </param>
        private void SaveNewTerms(List<OpenCode7DTModel> openList, bool fromMainSite)
        {
            if (openList.Count == 0)
            {
                return; // nothing crawled
            }

            var newestQiHao = openList.First().Term.ToString();
            var latestQiHao = LatestItem.Term.ToString();
            var startQiNum = Convert.ToInt32(latestQiHao.Substring(2)) + 1;
            var newestQiNum = Convert.ToInt32(newestQiHao.Substring(2));
            if (startQiNum > newestQiNum)
            {
                return; // nothing newer than what is already stored
            }

            // Every saved record shares this prefix, so it is computed once.
            var yearPrefix = latestQiHao.Substring(0, 2);
            for (var i = startQiNum; i <= newestQiNum; i++)
            {
                var getQiHao = yearPrefix + i.ToString().PadLeft(3, '0');
                var matchItem = openList.FirstOrDefault(r => r.Term.ToString() == getQiHao);
                if (matchItem == null)
                {
                    continue;
                }

                if (fromMainSite && !OptimizeMainModel(ref matchItem))
                {
                    continue;
                }

                if (!services.AddDTOpen7Code(currentLottery, matchItem))
                {
                    continue;
                }

                if (fromMainSite)
                {
                    log.Info(typeof(JSTC7WSJob), CommonHelper.GetJobMainLogInfo(Config, getQiHao));
                }
                else
                {
                    log.Info(typeof(JSTC7WSJob), CommonHelper.GetJobBackLogInfo(Config, getQiHao));
                }

                LatestItem = matchItem;
                isGetData = true;
            }
        }

        /// <summary>
        /// Downloads the paged result list of the main site and returns the records that do
        /// not belong to the previous year.
        /// </summary>
        /// <param name="mainUrl">Address of the main site list service.</param>
        /// <returns>
        /// Crawled records, newest term first. On an error the records collected so far are
        /// returned in download order and the error is logged.
        /// </returns>
        private List<OpenCode7DTModel> GetOpenListFromMainUrl(string mainUrl)
        {
            var result = new List<OpenCode7DTModel>();
            try
            {
                const string postData = "current_page={0}&all_count=0&num=";
                var resourceUrl = new Uri(mainUrl);

                // Same clock as the rest of the job, so that "last year" agrees with the
                // year prefix check done in Execute.
                var lastYear = (CommonHelper.SCCSysDateTime.Year - 1).ToString().Substring(2);

                for (var pageIndex = 1; pageIndex <= MaxMainPages; pageIndex++)
                {
                    var htmlResource = NetHelper.GetUrlResponse(resourceUrl.AbsoluteUri, "POST",
                        string.Format(postData, pageIndex), Encoding.UTF8);
                    var jsonData = htmlResource.JsonToEntity<dynamic>();
                    var dataList = jsonData["items"];

                    var itemsOnPage = 0;
                    var reachedLastYear = false;
                    foreach (var data in dataList)
                    {
                        itemsOnPage++;
                        if (data["num"].Value.StartsWith(lastYear))
                        {
                            reachedLastYear = true;
                            break;
                        }

                        // "yyyyMMdd" -> "yyyy-MM-dd"
                        string openTime = data["date_publish"].Value.Insert(6, "-").Insert(4, "-");
                        result.Add(new OpenCode7DTModel
                        {
                            Term = Convert.ToInt32(data["num"].Value),
                            OpenCode1 = Convert.ToInt32(data["one"].Value),
                            OpenCode2 = Convert.ToInt32(data["two"].Value),
                            OpenCode3 = Convert.ToInt32(data["three"].Value),
                            OpenCode4 = Convert.ToInt32(data["four"].Value),
                            OpenCode5 = Convert.ToInt32(data["five"].Value),
                            OpenCode6 = Convert.ToInt32(data["six"].Value),
                            OpenCode7 = Convert.ToInt32(data["seven"].Value),
                            OpenTime = Convert.ToDateTime(openTime),
                            DetailUrl = string.Format(
                                "http://www.js-lottery.com/Article/news/group_id/3/article_id/{0}.html",
                                data["article_id"].Value)
                        });
                    }

                    // Stop at the first record of last year, and also when a page is empty:
                    // without the second condition a feed that never shows a record of
                    // last year would be requested forever.
                    if (reachedLastYear || itemsOnPage == 0)
                    {
                        break;
                    }
                }

                result = VerifyAndSort(result);
            }
            catch (Exception ex)
            {
                log.Error(typeof(JSTC7WSJob),
                    string.Format("【{0}】通过主站点抓取开奖列表时发生错误,错误信息【{1}】", Config.Area + currentLottery,
                        ex.Message));
            }

            return result;
        }

        /// <summary>
        /// Passes the stored and the crawled draw codes to <see cref="CheckDataHelper"/> and
        /// returns the crawled records ordered by term, newest first.
        /// </summary>
        /// <param name="items">Crawled records in any order.</param>
        private List<OpenCode7DTModel> VerifyAndSort(List<OpenCode7DTModel> items)
        {
            var checkDataHelper = new CheckDataHelper();
            var dbdata = services.GetListS<OpenCode7DTModel>(currentLottery)
                .ToDictionary(w => w.Term.ToString(), w => w.GetCodeStr());

            // Grouping first keeps a term that was crawled twice (e.g. because the list
            // shifted between two page requests) from failing the dictionary build.
            var crawled = items
                .GroupBy(w => w.Term.ToString())
                .ToDictionary(g => g.Key, g => g.First().GetCodeStr());

            checkDataHelper.CheckData(dbdata, crawled, Config.Area, currentLottery);
            return items.OrderByDescending(s => s.Term).ToList();
        }

        /// <summary>
        /// Fills <c>Spare</c> of a backup-site record with the sales amount and the three
        /// prize levels found in the cells of its table row.
        /// </summary>
        /// <param name="model">Record to complete.</param>
        /// <param name="tr">Table row the record was read from.</param>
        /// <returns>True when the details were written, false when the row could not be read.</returns>
        private bool OptimizeBackModel(ref OpenCode7DTModel model, HtmlNode tr)
        {
            try
            {
                var tds = tr.ChildNodes.Where(w => w.Name == "td").ToList();
                var entity = new KaijiangDetailsEntity
                {
                    KaiJiangItems = new List<Kaijiangitem>
                    {
                        new Kaijiangitem { Name = "特等奖", Total = tds[3].InnerText.Trim(), TotalMoney = tds[4].InnerText },
                        new Kaijiangitem { Name = "一等奖", Total = tds[5].InnerText.Trim(), TotalMoney = tds[6].InnerText },
                        new Kaijiangitem { Name = "二等奖", Total = tds[7].InnerText.Trim(), TotalMoney = tds[8].InnerText }
                    },
                    // No jackpot value is read from the backup site row.
                    Gdje = "",
                    Trje = tds[2].InnerText.Trim().Replace(",", "").Replace("元", "")
                };

                model.Spare = entity.TryToJson();
                return true;
            }
            catch (Exception ex)
            {
                log.Error(typeof(JSTC7WSJob),
                    string.Format("【{0}】通过备用站点优化开奖列表时发生错误,错误信息【{1}】", Config.Area + currentLottery,
                        ex.Message));
            }

            return false;
        }

        /// <summary>
        /// Downloads the detail page of a main-site record and fills <c>Spare</c> with the
        /// prize levels, the sales amount and the jackpot found on it.
        /// </summary>
        /// <param name="model">Record to complete; its <c>DetailUrl</c> is downloaded.</param>
        /// <returns>
        /// True when the details were written; false when the page is empty, has fewer than
        /// two tables, or parsing failed (the failure is logged).
        /// </returns>
        private bool OptimizeMainModel(ref OpenCode7DTModel model)
        {
            try
            {
                var htmlResource = NetHelper.GetUrlResponse(model.DetailUrl);
                if (string.IsNullOrEmpty(htmlResource))
                {
                    return false;
                }

                var doc = new HtmlDocument();
                doc.LoadHtml(htmlResource);
                var tables = doc.DocumentNode.SelectNodes("//table");
                if (tables == null || tables.Count <= 1)
                {
                    return false;
                }

                // The second table of the page holds the prize levels.
                var prizeTable = tables[1];
                var entity = new KaijiangDetailsEntity { KaiJiangItems = new List<Kaijiangitem>() };

                var rows = prizeTable.ChildNodes.First(n => IsTag(n, "tbody")).ChildNodes
                    .Where(n => IsTag(n, "tr"));
                foreach (var row in rows)
                {
                    var tds = row.ChildNodes.Where(n => IsTag(n, "td")).ToList();

                    // Rows without the three expected cells (name, count, amount) and rows
                    // of other levels are skipped.
                    if (tds.Count < 3 || !MainPrizeLevels.Contains(tds[0].InnerText))
                    {
                        continue;
                    }

                    entity.KaiJiangItems.Add(new Kaijiangitem
                    {
                        Name = tds[0].InnerText,
                        Total = tds[1].InnerText.Replace(",", string.Empty).Replace("注", string.Empty),
                        TotalMoney = tds[2].InnerText.Replace("元", string.Empty).Replace("--", "0")
                            .Replace(",", "").Trim()
                    });
                }

                // Sales amount: old page layout first, then the current one.
                var salesMatch = ProvinceSalesRegex.Match(htmlResource);
                if (!salesMatch.Success)
                {
                    salesMatch = TermSalesRegex.Match(htmlResource);
                }

                if (salesMatch.Success)
                {
                    entity.Trje = salesMatch.Groups[1].Value;
                }

                // Jackpot: read from the last paragraph next to the prize table.
                var paragraphs = prizeTable.ParentNode.ChildNodes.Where(n => IsTag(n, "p")).ToList();
                var potMatch = JackpotRegex.Match(paragraphs.Last().InnerHtml);
                if (potMatch.Success)
                {
                    // NOTE(review): the original removed one kind of blank here; which one
                    // (plain space, no-break space or its HTML entity) cannot be told from
                    // the source, so all three are removed.
                    var potValue = potMatch.Groups[1].Value
                        .Replace("&nbsp;", string.Empty)
                        .Replace("\u00A0", string.Empty)
                        .Replace(" ", string.Empty);

                    // When the captured text still contains a line break, the amount is
                    // what follows the first one.
                    var innerBreak = LineBreakRegex.Match(potValue);
                    entity.Gdje = innerBreak.Success
                        ? potValue.Substring(innerBreak.Index + innerBreak.Length)
                        : potValue;
                }

                model.Spare = entity.TryToJson();
                return true;
            }
            catch (Exception ex)
            {
                log.Error(typeof(JSTC7WSJob),
                    string.Format("【{0}】通过主站点优化开奖列表时发生错误,错误信息【{1}】", Config.Area + currentLottery,
                        ex.Message));
            }

            return false;
        }

        /// <summary>Case-insensitive comparison of an HTML node name with a tag name.</summary>
        private static bool IsTag(HtmlNode node, string tagName)
        {
            return string.Equals(node.Name, tagName, StringComparison.OrdinalIgnoreCase);
        }

        /// <summary>
        /// Downloads the first result page of the backup site and converts every table row
        /// without a class attribute into a record.
        /// </summary>
        /// <returns>
        /// Crawled records, newest term first. On an error the records collected so far are
        /// returned in page order and the error is logged.
        /// </returns>
        private List<OpenCode7DTModel> GetOpenListFromBackUrl()
        {
            var result = new List<OpenCode7DTModel>();
            try
            {
                var url = Config.BackUrl + "?lid=10048&page=1";
                var htmlResource = NetHelper.GetBaiDuLeCaiResponse(url);
                if (htmlResource == null)
                {
                    return result;
                }

                var doc = new HtmlDocument();
                doc.LoadHtml(htmlResource);
                var table = doc.DocumentNode.SelectSingleNode("//table");
                if (table == null)
                {
                    return result;
                }

                // Rows carrying a class attribute are not data rows.
                var dataRows = table.ChildNodes
                    .Where(node => node.Name == "tr" && node.GetAttributeValue("class", "") == "");
                foreach (var item in dataRows)
                {
                    var tds = item.ChildNodes.Where(w => w.Name == "td").ToList();

                    // Cells 0 (term), 1 (numbers) and 9 (draw time) are read below; a row
                    // with fewer cells is skipped instead of aborting the whole crawl.
                    if (tds.Count < 10)
                    {
                        continue;
                    }

                    // The first two characters of the term cell are dropped to get the
                    // same term format the rest of the job uses.
                    var qihao = tds[0].InnerText.Trim().Substring(2);
                    var kaijianghao = tds[1].InnerText.Trim();
                    var opentime = tds[9].InnerText.Trim();

                    var tmp = new OpenCode7DTModel
                    {
                        Term = long.Parse(qihao),
                        OpenTime = DateTime.Parse(opentime),
                        OpenCode1 = int.Parse(kaijianghao.Substring(0, 1)),
                        OpenCode2 = int.Parse(kaijianghao.Substring(1, 1)),
                        OpenCode3 = int.Parse(kaijianghao.Substring(2, 1)),
                        OpenCode4 = int.Parse(kaijianghao.Substring(3, 1)),
                        OpenCode5 = int.Parse(kaijianghao.Substring(4, 1)),
                        OpenCode6 = int.Parse(kaijianghao.Substring(5, 1)),
                        OpenCode7 = int.Parse(kaijianghao.Substring(6, 1))
                    };

                    // Best effort: the record is kept even when its details cannot be read.
                    OptimizeBackModel(ref tmp, item);
                    result.Add(tmp);
                }

                result = VerifyAndSort(result);
            }
            catch (Exception ex)
            {
                log.Error(typeof(JSTC7WSJob),
                    string.Format("【{0}】通过备用站点抓取开奖列表时发生错误,错误信息【{1}】", Config.Area + currentLottery,
                        ex.Message));
            }

            return result;
        }

        #region Attribute

        /// <summary>
        /// Job configuration read from the job data map at the start of each execution.
        /// </summary>
        private SCCConfig Config;

        /// <summary>
        /// Newest draw record stored so far.
        /// </summary>
        private OpenCode7DTModel LatestItem;

        /// <summary>
        /// List of terms that failed to be crawled today. Not used by this job.
        /// NOTE(review): element type reconstructed - confirm.
        /// </summary>
        private List<string> FailedQiHaoList = null;

        /// <summary>
        /// Logger.
        /// </summary>
        private readonly LogHelper log;

        /// <summary>
        /// Data service used to read and store draw records.
        /// </summary>
        private readonly IDTOpenCode services;

        /// <summary>
        /// Lottery handled by this job.
        /// </summary>
        private SCCLottery currentLottery => SCCLottery.JiangSuTC7WS;

        /// <summary>
        /// E-mail service. Resolved in the constructor; not used by this job directly.
        /// </summary>
        private IEmail email;

        /// <summary>
        /// Whether the current execution stored at least one draw record.
        /// </summary>
        private bool isGetData;

        #endregion
    }
}