// QXCJob.cs
  1. using System;
  2. using System.Collections.Generic;
  3. using System.Linq;
  4. using System.Text;
  5. using HtmlAgilityPack;
  6. using Quartz;
  7. using SCC.Common;
  8. using SCC.Crawler.Tools;
  9. using SCC.Interface;
  10. using SCC.Models;
  11. namespace SCC.Crawler.QG
  12. {
  13. /// <summary>
  14. /// 七星彩
  15. /// </summary>
  16. public class QXCJob : IJob
  17. {
  /// <summary>
  /// Creates the job and wires up its collaborators: a new <see cref="LogHelper"/>,
  /// plus the <see cref="IDTOpenCode"/> and <see cref="IEmail"/> implementations
  /// resolved through <c>IOC.Resolve</c>.
  /// </summary>
  public QXCJob()
  {
      this.log = new LogHelper();
      this.services = IOC.Resolve<IDTOpenCode>();
      this.email = IOC.Resolve<IEmail>();
  }
  24. #region QXC执行入口
  /// <summary>
  /// Quartz entry point for the QXC crawl job. Loads the job configuration,
  /// restores the last stored draw, runs the crawl when the configuration helpers
  /// say one is due, and writes the latest draw back into the job data map so the
  /// next run can continue from it.
  /// </summary>
  /// <param name="context">
  /// Job execution context; its <c>JobDataMap</c> supplies the configuration and
  /// carries the <c>"LatestItem"</c> entry between runs.
  /// </param>
  public void Execute(IJobExecutionContext context)
  {
      Config = CommonHelper.GetConfigFromDataMap(context.JobDetail.JobDataMap);

      // Dates listed in Config.SkipDate (formatted yyyyMMdd) are skipped entirely;
      // the original comment describes them as preset holidays without a draw.
      if (Config.SkipDate.Contains(CommonHelper.SCCSysDateTime.ToString("yyyyMMdd"))) return;

      LatestItem = context.JobDetail.JobDataMap["LatestItem"] as OpenCode7DTModel;
      try
      {
          // First run after service start: seed from the data service, falling back
          // to a placeholder for the start of the current year.
          if (LatestItem == null)
          {
              LatestItem = services.GetOpenCode7DTLastItem(currentLottery) ?? CreateYearStartItem();
          }

          // Catch-up pass; the original comment says this checks, on the following
          // day, whether a draw happened yesterday (decided by CheckDTIsNeedGetData).
          isGetData = false;
          if (CommonHelper.CheckDTIsNeedGetData(Config)) DoMainUrl();

          // Year rollover: terms are built as YYYYQQQ (GenerateQiHaoYYYYQQQ, and the
          // "20" prefix applied while scraping), so the prefix must be compared with
          // the four-digit year. Comparing against "yy" reset LatestItem on every
          // run in any year other than 2020.
          if (!LatestItem.Term.ToString()
                  .StartsWith(CommonHelper.SCCSysDateTime.ToString("yyyy"), StringComparison.Ordinal))
          {
              LatestItem = CreateYearStartItem();
          }

          // Crawl on draw days once the hour is 13 or later.
          // NOTE(review): the original comment said "after 8 PM" but the code has
          // always tested Hour > 12 - confirm which threshold is intended.
          if (CommonHelper.CheckTodayIsOpenDay(Config) && CommonHelper.SCCSysDateTime.Hour > 12) DoMainUrl();
      }
      catch (Exception ex)
      {
          // Failures are logged and swallowed here rather than rethrown.
          log.Error(GetType(), string.Format("【{0}】抓取时发生错误,错误信息【{1}】", Config.Area + currentLottery, ex.Message));
      }

      // Persist the latest draw for the next execution.
      context.JobDetail.JobDataMap["LatestItem"] = LatestItem;
  }

  /// <summary>
  /// Builds the placeholder used when no draw is known for the current year:
  /// the term produced by <c>GenerateQiHaoYYYYQQQ(0)</c>, dated 1 January.
  /// </summary>
  private static OpenCode7DTModel CreateYearStartItem()
  {
      return new OpenCode7DTModel
      {
          Term = CommonHelper.GenerateQiHaoYYYYQQQ(0),
          OpenTime = new DateTime(CommonHelper.SCCSysDateTime.Year, 1, 1)
      };
  }
  69. #endregion
  70. #region
  /// <summary>
  /// Scrapes the draw list from <c>Config.MainUrl</c> and stores every draw whose
  /// term lies between the current <c>LatestItem</c> term and the first scraped
  /// term (both inclusive), in ascending term order. Each draw that is stored
  /// successfully becomes the new <c>LatestItem</c> and sets <c>isGetData</c>.
  /// </summary>
  private void DoMainUrl()
  {
      if (string.IsNullOrEmpty(Config.MainUrl)) return;

      var openList = GetOpenListFromMainUrl(Config.MainUrl);
      if (openList.Count == 0) return; // nothing scraped

      // Terms are parsed as Int64, matching how they are produced while scraping.
      var newestQiHao = Convert.ToInt64(openList.First().Term.ToString());
      var startQiNum = Convert.ToInt64(LatestItem.Term.ToString());
      if (startQiNum > newestQiHao) return; // nothing newer than what is stored

      // Walk the scraped draws directly instead of counting through every integer
      // in [start, newest] and searching the list each time: the work is bounded by
      // the list size even if the two terms are far apart. GroupBy keeps source
      // order inside a group, so First() is the first scraped row for that term.
      var pending = openList
          .Select(item => new { Item = item, QiHao = Convert.ToInt64(item.Term.ToString()) })
          .Where(x => x.QiHao >= startQiNum && x.QiHao <= newestQiHao)
          .GroupBy(x => x.QiHao)
          .OrderBy(g => g.Key)
          .Select(g => g.First());

      foreach (var candidate in pending)
      {
          if (!services.AddDTOpen7Code(currentLottery, candidate.Item)) continue;

          log.Info(GetType(), CommonHelper.GetJobMainLogInfo(Config, candidate.QiHao.ToString()));
          LatestItem = candidate.Item;
          isGetData = true;
      }
  }
  /// <summary>
  /// Downloads the main listing page and parses the first <c>&lt;table&gt;</c> on
  /// it into draw records, fetching the detail JSON for each row. The parsed
  /// list is handed to <c>CheckDataHelper.CheckData</c> together with the stored
  /// draws, then sorted by term, newest first.
  /// </summary>
  /// <param name="mainUrl">Address of the listing page.</param>
  /// <returns>
  /// The parsed draws; empty when the page or its table is unavailable. If an
  /// exception interrupts parsing it is logged and the rows parsed so far are
  /// returned unsorted.
  /// </returns>
  private List<OpenCode7DTModel> GetOpenListFromMainUrl(string mainUrl)
  {
      var result = new List<OpenCode7DTModel>();
      try
      {
          var htmlResource = NetHelper.GetUrlResponse(mainUrl, Encoding.GetEncoding("utf-8"));
          if (htmlResource == null) return result;

          var doc = new HtmlDocument();
          doc.LoadHtml(htmlResource);
          var table = doc.DocumentNode.SelectSingleNode("//table");
          if (table == null) return result;

          foreach (var tr in table.ChildNodes.Where(node => node.Name == "tr"))
          {
              // Hidden rows and rows with fewer than 12 cells are not draw rows.
              var trstyle = tr.Attributes["style"];
              if (trstyle != null && trstyle.Value == "display:none") continue;

              var tds = tr.ChildNodes.Where(node => node.Name == "td").ToList();
              if (tds.Count < 12) continue;

              var model = new OpenCode7DTModel();

              // Terms of up to 7 characters get a "20" century prefix.
              // NOTE(review): a 7-character term presumably already carries a
              // four-digit year; confirm whether the threshold should be lower.
              var termText = tds[0].InnerText.Trim();
              model.Term = Convert.ToInt64(termText.Length <= 7 ? "20" + termText : termText);

              // Only the first five characters of the date cell are parsed.
              model.OpenTime = Convert.ToDateTime(tds[1].InnerText.Substring(0, 5));

              // Rows without a complete seven-digit result are skipped instead of
              // throwing and aborting the whole page.
              var digits = ExtractOpenCodeDigits(tds[2]);
              if (digits == null) continue;

              model.OpenCode1 = Convert.ToInt32(digits.Substring(0, 1));
              model.OpenCode2 = Convert.ToInt32(digits.Substring(1, 1));
              model.OpenCode3 = Convert.ToInt32(digits.Substring(2, 1));
              model.OpenCode4 = Convert.ToInt32(digits.Substring(3, 1));
              model.OpenCode5 = Convert.ToInt32(digits.Substring(4, 1));
              model.OpenCode6 = Convert.ToInt32(digits.Substring(5, 1));
              model.OpenCode7 = Convert.ToInt32(digits.Substring(6, 1));

              // The detail page is addressed by the full term.
              model.Spare = GetKaijiangDetails(model.Term.ToString());
              result.Add(model);
          }

          // Compare the stored draws with the freshly scraped ones.
          var checkDataHelper = new CheckDataHelper();
          var dbdata = services.GetListS<OpenCode7DTModel>(currentLottery)
              .ToDictionary(w => w.Term.ToString(), w => w.GetCodeStr());
          checkDataHelper.CheckData(dbdata, result.ToDictionary(w => w.Term.ToString(), w => w.GetCodeStr()),
              Config.Area, currentLottery);

          result = result.OrderByDescending(item => item.Term).ToList();
      }
      catch (Exception ex)
      {
          log.Error(GetType(),
              string.Format("【{0}】通过主站抓取开奖列表时发生错误,错误信息【{1}】", Config.Area + currentLottery, ex.Message));
      }
      return result;
  }

  /// <summary>
  /// Reads the draw result from a result cell: the text of the first
  /// <c>&lt;span&gt;</c> inside the first <c>&lt;b&gt;</c> child, with all
  /// whitespace removed.
  /// </summary>
  /// <param name="codeCell">The table cell expected to hold the result markup.</param>
  /// <returns>
  /// The cleaned text, or <c>null</c> when the markup is missing or the text has
  /// fewer than seven characters.
  /// </returns>
  private static string ExtractOpenCodeDigits(HtmlNode codeCell)
  {
      var bold = codeCell.ChildNodes
          .FirstOrDefault(n => string.Equals(n.Name, "b", StringComparison.OrdinalIgnoreCase));
      if (bold == null) return null;

      var span = bold.ChildNodes
          .FirstOrDefault(n => string.Equals(n.Name, "span", StringComparison.OrdinalIgnoreCase));
      if (span == null) return null;

      var digits = new string(span.InnerText.Where(c => !char.IsWhiteSpace(c)).ToArray());
      return digits.Length < 7 ? null : digits;
  }
  /// <summary>
  /// Downloads the detail page for one draw and serialises its figures to JSON:
  /// the rolled-over pool amount, the sales amount, and one entry per prize row.
  /// </summary>
  /// <param name="optimizeUrl">
  /// The path segment inserted into the detail URL; callers in this class pass
  /// the draw term.
  /// </param>
  /// <returns>
  /// The JSON produced by <c>TryToJson</c>, or <c>null</c> when the page cannot be
  /// downloaded or lacks the expected <c>div.text-16</c> block with at least three
  /// paragraphs.
  /// </returns>
  private string GetKaijiangDetails(string optimizeUrl)
  {
      var url = "https://www.8200.cn/kjh/qxc/" + optimizeUrl + ".htm";
      var htmlResource = NetHelper.GetUrlResponse(url, Encoding.GetEncoding("utf-8"));
      if (htmlResource == null) return null; // LoadHtml rejects null input

      var doc = new HtmlDocument();
      doc.LoadHtml(htmlResource);
      var div = doc.DocumentNode.SelectSingleNode("//div[@class='text-16']");
      if (div == null) return null;

      // Paragraph 1 holds the sales amount and paragraph 2 the rolled-over pool.
      var jiangjin = div.ChildNodes.Where(node => node.Name == "p").ToList();
      if (jiangjin.Count < 3) return null;

      var gdje = jiangjin[2].InnerText.Replace(" 万元", "").Replace("奖池滚存:", "").Replace("--", "0").Replace(",", "")
          .Trim();
      var trje = jiangjin[1].InnerText.Replace(" 万元", "").Replace("本期销量:", "").Replace("--", "0").Replace(",", "")
          .Trim();

      // The page gives both figures in units of 10,000 (万元); store them in units of 1.
      var entity = new KaijiangDetailsEntity
      {
          Gdje = ScaleAmount(gdje, 10000),
          Trje = ScaleAmount(trje, 10000)
      };

      // Prize rows: name, amount, winner count. A missing table yields an empty list.
      var list = new List<Kaijiangitem>();
      var table = doc.DocumentNode.SelectSingleNode("//table");
      if (table != null)
      {
          foreach (var tr in table.ChildNodes.Where(node => node.Name == "tr"))
          {
              var tds = tr.ChildNodes.Where(node => node.Name == "td").ToList();
              if (tds.Count < 3) continue; // e.g. a header row without <td> cells

              var totalMoney = tds[1].InnerText.Replace("元", "").Replace("--", "0").Replace(",", "").Trim();
              list.Add(new Kaijiangitem
              {
                  Name = tds[0].InnerText.Trim(),
                  TotalMoney = ScaleAmount(totalMoney, 1),
                  Total = tds[2].InnerText.Trim().Replace(" 注", "").Replace("--", "0").Trim()
              });
          }
      }

      entity.KaiJiangItems = list;
      return entity.TryToJson();
  }

  /// <summary>
  /// Parses a cleaned amount and multiplies it by <paramref name="factor"/>.
  /// The literal "0" is returned unchanged. Parsing and formatting use the
  /// invariant culture because the scraped text uses '.' as the decimal separator
  /// regardless of the server's regional settings.
  /// </summary>
  private static string ScaleAmount(string amount, double factor)
  {
      if (amount == "0") return "0";

      var invariant = System.Globalization.CultureInfo.InvariantCulture;
      return (double.Parse(amount, invariant) * factor).ToString(invariant);
  }
  211. #endregion
  212. #region QXC初始化
  /// <summary>
  /// Crawler configuration; reloaded from the job data map at the start of every
  /// <c>Execute</c> call.
  /// </summary>
  private SCCConfig Config;
  /// <summary>
  /// Most recent draw known to the job. Restored from and written back to the
  /// job data map under the key "LatestItem".
  /// </summary>
  private OpenCode7DTModel LatestItem;
  /// <summary>
  /// List of terms that failed to crawl today. Declared but not referenced
  /// anywhere else in this class.
  /// </summary>
  private List<string> FailedQiHaoList = null;
  /// <summary>
  /// Logger.
  /// </summary>
  private readonly LogHelper log;
  /// <summary>
  /// Data service used to read and store draws.
  /// </summary>
  private readonly IDTOpenCode services;
  /// <summary>
  /// Lottery handled by this job.
  /// </summary>
  private SCCLottery currentLottery => SCCLottery.QXC;
  /// <summary>
  /// E-mail service. Only assigned in the constructor (hence readonly, like
  /// <c>log</c> and <c>services</c>); not otherwise used in this class.
  /// </summary>
  private readonly IEmail email;
  /// <summary>
  /// Whether the current run stored at least one draw. Reset in <c>Execute</c>
  /// and set in <c>DoMainUrl</c>; never read within this class.
  /// </summary>
  private bool isGetData;
  245. #endregion
  246. }
  247. }