SSQJob.cs 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364
  1. using System;
  2. using System.Collections.Generic;
  3. using System.Linq;
  4. using System.Text;
  5. using HtmlAgilityPack;
  6. using Quartz;
  7. using SCC.Common;
  8. using SCC.Crawler.Tools;
  9. using SCC.Interface;
  10. using SCC.Models;
  11. namespace SCC.Crawler.QG
  12. {
  13. /// <summary>
  14. /// 双色球
  15. /// </summary>
  16. public class SSQJob : IJob
  17. {
  /// <summary>
  /// Creates the job: constructs the log helper and resolves the data service
  /// and the e-mail service from the IOC container.
  /// </summary>
  public SSQJob()
  {
      this.log = new LogHelper();
      this.services = IOC.Resolve<IDTOpenCode>();
      this.email = IOC.Resolve<IEmail>();
  }
  27. #region SSQ作业执行入口
  /// <summary>
  /// Job entry point.
  /// </summary>
  /// <remarks>
  /// Loads the job configuration, returns immediately on configured skip dates, makes sure
  /// <see cref="LatestItem"/> is initialised, crawls draw results when the
  /// <see cref="CommonHelper"/> checks say a crawl is due, refreshes the machine numbers and
  /// finally writes <see cref="LatestItem"/> back into the job data map.
  /// Exceptions raised inside the crawl section are logged and not rethrown.
  /// </remarks>
  /// <param name="context">Execution context of the running job.</param>
  public void Execute(IJobExecutionContext context)
  {
      Config = CommonHelper.GetConfigFromDataMap(context.JobDetail.JobDataMap);

      // Pre-configured dates (e.g. holidays) on which no draw takes place.
      if (Config.SkipDate.Contains(CommonHelper.SCCSysDateTime.ToString("yyyyMMdd")))
      {
          return;
      }

      LatestItem = context.JobDetail.JobDataMap["LatestItem"] as OpenCode7DTModel;
      try
      {
          // Nothing in the job data map yet: seed from the database, or fall back
          // to a placeholder positioned at the start of the current year.
          if (LatestItem == null)
          {
              LatestItem = services.GetOpenCode7DTLastItem(currentLottery);
              if (LatestItem == null)
              {
                  LatestItem = CreateYearStartItem();
              }
          }

          // Catch-up crawl (e.g. the day after a draw), as decided by the configuration check.
          isGetData = false;
          if (CommonHelper.CheckDTIsNeedGetData(Config))
          {
              DoMainUrl();
          }

          // Year rollover: a latest term from another year is replaced by the placeholder.
          if (!IsTermOfCurrentYear(LatestItem.Term.ToString()))
          {
              LatestItem = CreateYearStartItem();
          }

          // Crawl when today is a draw day and the hour is past 12 (i.e. from 13:00 on).
          // NOTE(review): the original comment said "after 8 pm" but the code has always
          // checked Hour > 12 - confirm which one is intended.
          if (CommonHelper.CheckTodayIsOpenDay(Config) && CommonHelper.SCCSysDateTime.Hour > 12)
          {
              DoMainUrl();
          }

          // Refresh the machine numbers of the most recent terms.
          CheckGetKaiJiHao();
      }
      catch (Exception ex)
      {
          log.Error(GetType(), string.Format("【{0}】抓取时发生错误,错误信息【{1}】", Config.Area + currentLottery, ex.Message));
      }

      // Hand the latest term over to the next execution.
      context.JobDetail.JobDataMap["LatestItem"] = LatestItem;
  }

  /// <summary>
  /// Builds the placeholder item used when no draw of the current year is known:
  /// term number 0 of the current year, dated 1 January.
  /// </summary>
  private static OpenCode7DTModel CreateYearStartItem()
  {
      return new OpenCode7DTModel
      {
          Term = CommonHelper.GenerateQiHaoYYYYQQQ(0),
          OpenTime = new DateTime(CommonHelper.SCCSysDateTime.Year, 1, 1)
      };
  }

  /// <summary>
  /// Tells whether a term number carries the current year as its prefix.
  /// </summary>
  /// <remarks>
  /// The original check compared every term against the two-digit year ("yy"). A term in
  /// the YYYYQQQ layout named by <c>GenerateQiHaoYYYYQQQ</c> starts with "20", so it only
  /// passed that check in 2020 and the latest item was reset on every other run.
  /// Terms of seven or more characters are therefore compared against the four-digit year;
  /// shorter terms keep the original two-digit comparison.
  /// NOTE(review): assumes a three-digit sequence part - confirm against GenerateQiHaoYYYYQQQ.
  /// </remarks>
  /// <param name="term">Term number rendered as text.</param>
  private static bool IsTermOfCurrentYear(string term)
  {
      var now = CommonHelper.SCCSysDateTime;
      var yearPrefix = term.Length >= 7 ? now.ToString("yyyy") : now.ToString("yy");
      return term.StartsWith(yearPrefix, StringComparison.Ordinal);
  }
  73. #endregion
  74. #region SSQ爬取开机号数据
  /// <summary>
  /// Fetches the machine numbers via <see cref="GetKaiJiHao"/> and writes each one to
  /// the database, logging success or failure per term.
  /// </summary>
  /// <remarks>
  /// Never throws: any exception is logged and swallowed so that a failure here does
  /// not affect the caller.
  /// </remarks>
  private void CheckGetKaiJiHao()
  {
      try
      {
          List<KaiJiangHao> kai = GetKaiJiHao();

          // GetKaiJiHao can return null when the page or its table is unavailable.
          // Iterating null used to surface as a NullReferenceException in the log;
          // report the real cause instead.
          if (kai == null)
          {
              log.Error(GetType(), $"获取{Config.LotteryName}开机号数据失败!");
              return;
          }

          foreach (var item in kai)
          {
              var isSucc = services.UpdateSSQDetailByTerm(currentLottery, item.QiHao, item.Kaijianghao);
              if (isSucc)
              {
                  log.Info(GetType(), $"更新{Config.LotteryName}第{ item.QiHao}期开机号成功!");
              }
              else
              {
                  log.Error(GetType(), $"更新{Config.LotteryName}第{ item.QiHao}期开机号失败!");
              }
          }
      }
      catch (Exception e)
      {
          log.Error(GetType(), e);
      }
  }
  /// <summary>
  /// Downloads the machine-number page and parses at most the first 16 rows of its
  /// first table.
  /// </summary>
  /// <returns>
  /// One entry per parsed row. The list is empty (never null) when the page cannot be
  /// downloaded, is empty, or contains no table.
  /// </returns>
  private List<KaiJiangHao> GetKaiJiHao()
  {
      // The original loop read rows 0..15; keep that cap but never index past the table.
      const int maxRows = 16;
      // Everything that may separate two numbers inside the number cell.
      char[] separators = { ' ', '\t', '\r', '\n', '+', ',' };

      var result = new List<KaiJiangHao>();
      var url = "https://www.8200.cn/kjh/ssq/kjih.htm?size=30";
      var htmlResource = NetHelper.GetUrlResponse(url, Encoding.GetEncoding("utf-8"));
      if (string.IsNullOrEmpty(htmlResource))
      {
          return result;
      }

      var doc = new HtmlDocument();
      doc.LoadHtml(htmlResource);
      var table = doc.DocumentNode.SelectSingleNode("//table");
      if (table == null)
      {
          return result;
      }

      var trs = table.ChildNodes.Where(node => node.Name == "tr").ToList();
      var rowCount = Math.Min(trs.Count, maxRows);
      for (var i = 0; i < rowCount; i++)
      {
          var tds = trs[i].ChildNodes
              .Where(node => string.Equals(node.Name, "td", StringComparison.OrdinalIgnoreCase))
              .ToList();

          // Rows without the term cell (index 0) and the number cell (index 2) are skipped.
          if (tds.Count < 3)
          {
              continue;
          }

          int qiHao;
          if (!int.TryParse(tds[0].InnerText.Trim(), out qiHao))
          {
              continue; // not a data row
          }

          var model = new KaiJiangHao();
          model.QiHao = qiHao;

          var numberText = tds[2].InnerText;
          if (numberText.Trim() == "--")
          {
              // "--" marks a term whose numbers are not published yet.
              model.Kaijianghao = "";
          }
          else
          {
              // Normalise to a plain comma-separated list. The previous implementation
              // always removed the first character when the text contained a comma, which
              // cut off the first digit whenever the cell had no leading space.
              var numbers = numberText.Split(separators, StringSplitOptions.RemoveEmptyEntries);
              model.Kaijianghao = string.Join(",", numbers);
          }

          result.Add(model);
      }

      return result;
  }
  138. #endregion
  139. #region SSQ爬取开奖号数据
  /// <summary>
  /// Crawls the configured main URL and tries to store every crawled draw whose term lies
  /// between the current latest term and the newest crawled term (both inclusive).
  /// Each stored draw becomes the new <see cref="LatestItem"/>.
  /// </summary>
  private void DoMainUrl()
  {
      if (string.IsNullOrEmpty(Config.MainUrl))
      {
          return;
      }

      var crawled = GetOpenListFromMainUrl(Config.MainUrl);
      if (crawled.Count == 0)
      {
          return; // nothing was crawled
      }

      // Newest crawled term: the first element of the crawled list.
      var lastTerm = Convert.ToInt32(crawled.First().Term.ToString());
      // Term currently held as the latest one.
      var firstTerm = Convert.ToInt32(LatestItem.Term.ToString());
      if (firstTerm > lastTerm)
      {
          return; // nothing newer than what is already known
      }

      var term = firstTerm;
      while (term <= lastTerm)
      {
          var termText = term.ToString();
          var candidate = crawled.FirstOrDefault(r => r.Term.ToString() == termText);
          if (candidate != null && services.AddDTOpen7Code(currentLottery, candidate))
          {
              // Stored successfully: log it and move the latest item forward.
              log.Info(GetType(), CommonHelper.GetJobMainLogInfo(Config, termText));
              LatestItem = candidate;
              isGetData = true;
          }

          term++;
      }
  }
  /// <summary>
  /// Crawls the draw list page and parses every usable table row into an
  /// <see cref="OpenCode7DTModel"/>, including the per-term details stored in Spare.
  /// </summary>
  /// <remarks>
  /// A row that fails to parse is logged and skipped; it no longer aborts the whole crawl.
  /// The list is sorted before the database cross-check so that the caller gets the newest
  /// term first even when that check throws.
  /// NOTE(review): one extra HTTP request is issued per row through GetKaijiangDetails.
  /// </remarks>
  /// <param name="mainUrl">Address of the draw list page.</param>
  /// <returns>Parsed draws ordered by term, newest first. Empty when nothing could be parsed; never null.</returns>
  private List<OpenCode7DTModel> GetOpenListFromMainUrl(string mainUrl)
  {
      var result = new List<OpenCode7DTModel>();
      try
      {
          // Kept from the original: throws into the catch below when mainUrl is null or
          // not a valid absolute URI, before any request is made.
          new Uri(mainUrl);

          var htmlResource = NetHelper.GetUrlResponse(mainUrl, Encoding.GetEncoding("utf-8"));
          if (htmlResource == null)
          {
              return result;
          }

          var doc = new HtmlDocument();
          doc.LoadHtml(htmlResource);
          var table = doc.DocumentNode.SelectSingleNode("//table");
          if (table == null)
          {
              return result;
          }

          var trs = table.ChildNodes.Where(node => node.Name == "tr").ToList();
          for (var i = 0; i < trs.Count; i++)
          {
              try
              {
                  var model = ParseOpenCodeRow(trs[i]);
                  if (model != null)
                  {
                      result.Add(model);
                  }
              }
              catch (Exception rowEx)
              {
                  log.Error(GetType(),
                      string.Format("【{0}】解析第{1}行开奖数据时发生错误,错误信息【{2}】", Config.Area + currentLottery, i,
                          rowEx.Message));
              }
          }

          result = result.OrderByDescending(S => S.Term).ToList();

          // Cross-check the crawled numbers against what the database already holds.
          var checkDataHelper = new CheckDataHelper();
          var dbdata = services.GetListS<OpenCode7DTModel>(currentLottery)
              .ToDictionary(w => w.Term.ToString(), w => w.GetCodeStr());
          checkDataHelper.CheckData(dbdata, result.ToDictionary(w => w.Term.ToString(), w => w.GetCodeStr()),
              Config.Area, currentLottery);
      }
      catch (Exception ex)
      {
          log.Error(GetType(),
              string.Format("【{0}】通过主站抓取开奖列表时发生错误,错误信息【{1}】", Config.Area + currentLottery, ex.Message));
      }

      return result;
  }

  /// <summary>
  /// Parses one row of the draw list table.
  /// </summary>
  /// <param name="tr">The table row node.</param>
  /// <returns>
  /// The parsed draw, or null for rows that are not draw rows (hidden rows, rows with fewer
  /// than eight cells, rows whose number cell is empty).
  /// </returns>
  /// <exception cref="FormatException">The row looks like a draw row but its cells do not have the expected content.</exception>
  private OpenCode7DTModel ParseOpenCodeRow(HtmlNode tr)
  {
      var style = tr.Attributes["style"];
      if (style != null && style.Value == "display:none")
      {
          return null;
      }

      var tds = tr.ChildNodes.Where(node => node.Name == "td").ToList();
      if (tds.Count < 8 || tds[2].ChildNodes.Count == 0)
      {
          return null;
      }

      var bolds = tds[2].ChildNodes.Where(n => n.Name.ToLower() == "b").ToList();
      if (bolds.Count == 0)
      {
          throw new FormatException("number cell contains no <b> element");
      }

      var spans = bolds[0].ChildNodes.Where(n => n.Name.ToLower() == "span").ToList();
      if (spans.Count < 2)
      {
          throw new FormatException("number cell contains fewer than two <span> elements");
      }

      // First span: six two-digit numbers; second span: the seventh number.
      var firstSix = spans[0].InnerText.Replace(" ", "");
      var seventh = spans[1].InnerText.Replace(" ", "");
      if (firstSix.Length < 12 || seventh.Length < 2)
      {
          throw new FormatException("number cell holds fewer digits than expected");
      }

      var model = new OpenCode7DTModel();
      model.Term = Convert.ToInt64(tds[0].InnerText.Trim());
      // Only the first five characters of the date cell are parsed.
      // NOTE(review): presumably "MM-dd", in which case the parser assumes the current
      // year - confirm against the page.
      model.OpenTime = Convert.ToDateTime(tds[1].InnerText.Substring(0, 5));
      model.OpenCode1 = Convert.ToInt32(firstSix.Substring(0, 2).Trim());
      model.OpenCode2 = Convert.ToInt32(firstSix.Substring(2, 2).Trim());
      model.OpenCode3 = Convert.ToInt32(firstSix.Substring(4, 2).Trim());
      model.OpenCode4 = Convert.ToInt32(firstSix.Substring(6, 2).Trim());
      model.OpenCode5 = Convert.ToInt32(firstSix.Substring(8, 2).Trim());
      model.OpenCode6 = Convert.ToInt32(firstSix.Substring(10, 2).Trim());
      model.OpenCode7 = Convert.ToInt32(seventh.Substring(0, 2).Trim());
      // The detail page is addressed by the term number.
      model.Spare = GetKaijiangDetails(model.Term.ToString());
      return model;
  }
  /// <summary>
  /// Downloads the detail page of one draw and serialises its sales amount, jackpot
  /// roll-over and prize-tier table to JSON.
  /// </summary>
  /// <param name="optimizeUrl">Term number; used as the file name of the detail page URL.</param>
  /// <returns>
  /// The JSON produced by <c>TryToJson</c> for the details entity, or null when the page
  /// cannot be downloaded or lacks the expected elements (the "text-16" div with at least
  /// four paragraphs, and a table).
  /// </returns>
  /// <exception cref="FormatException">An amount on the page is not numeric.</exception>
  private string GetKaijiangDetails(string optimizeUrl)
  {
      var url = "https://www.8200.cn/kjh/ssq/" + optimizeUrl + ".htm";
      var htmlResource = NetHelper.GetUrlResponse(url, Encoding.GetEncoding("utf-8"));
      if (string.IsNullOrEmpty(htmlResource))
      {
          return null; // LoadHtml rejects null; an empty page has nothing to parse
      }

      var doc = new HtmlDocument();
      doc.LoadHtml(htmlResource);
      var div = doc.DocumentNode.SelectSingleNode("//div[@class='text-16']");
      if (div == null)
      {
          return null;
      }

      // Paragraph 2 carries the sales amount and paragraph 3 the jackpot roll-over.
      var jiangjin = div.ChildNodes.Where(node => node.Name == "p").ToList();
      // The prize tiers are the rows of the first table of the page.
      var table = doc.DocumentNode.SelectSingleNode("//table");
      if (jiangjin.Count < 4 || table == null)
      {
          return null;
      }

      // Page figures are machine data: parse and format them culture-independently.
      var invariant = System.Globalization.CultureInfo.InvariantCulture;

      var list = new List<Kaijiangitem>();
      foreach (var tr in table.ChildNodes.Where(node => node.Name == "tr"))
      {
          var tds = tr.ChildNodes.Where(node => node.Name == "td").ToList();
          if (tds.Count < 3)
          {
              continue; // header or malformed row
          }

          var totalMoney = tds[1].InnerText.Replace("元", "").Replace("--", "0").Replace(",", "").Trim();
          list.Add(new Kaijiangitem
          {
              Name = tds[0].InnerText.Trim(),
              TotalMoney = totalMoney == "0" ? "0" : double.Parse(totalMoney, invariant).ToString(invariant),
              Total = tds[2].InnerText.Trim().Replace(" 注", "")
          });
      }

      var entity = new KaijiangDetailsEntity
      {
          Gdje = ConvertYiToYuan(jiangjin[3].InnerText, "奖池滚存:"),
          Trje = ConvertYiToYuan(jiangjin[2].InnerText, "本期销量:"),
          KaiJiangItems = list
      };
      return entity.TryToJson();
  }

  /// <summary>
  /// Strips the label and unit from an amount paragraph and multiplies the figure by
  /// 100,000,000. "--" is treated as 0.
  /// </summary>
  /// <param name="text">Inner text of the paragraph.</param>
  /// <param name="label">Label preceding the figure; removed before parsing.</param>
  /// <returns>The scaled amount as text, or "0" when the figure is "0" or "--".</returns>
  private static string ConvertYiToYuan(string text, string label)
  {
      var cleaned = text.Replace(" 亿元", "").Replace(label, "").Replace("--", "0").Replace(",", "").Trim();
      if (cleaned == "0")
      {
          return "0";
      }

      var invariant = System.Globalization.CultureInfo.InvariantCulture;
      return (double.Parse(cleaned, invariant) * 100000000).ToString(invariant);
  }
  274. #endregion
  275. #region SSQ初始化
  /// <summary>
  /// Log helper, created in the constructor.
  /// </summary>
  private readonly LogHelper log;

  /// <summary>
  /// Data service, resolved from the IOC container in the constructor.
  /// </summary>
  private readonly IDTOpenCode services;

  /// <summary>
  /// E-mail service, resolved from the IOC container in the constructor.
  /// Not used anywhere else in this class.
  /// </summary>
  private IEmail email;

  /// <summary>
  /// Lottery handled by this job; always <c>SCCLottery.SSQ</c>.
  /// </summary>
  private SCCLottery currentLottery
  {
      get { return SCCLottery.SSQ; }
  }

  /// <summary>
  /// Job configuration; reloaded from the job data map at the start of every Execute call.
  /// </summary>
  private SCCConfig Config;

  /// <summary>
  /// Latest draw known to the job. Read from and written back to the job data map by
  /// Execute, and moved forward by DoMainUrl whenever a draw is stored.
  /// </summary>
  private OpenCode7DTModel LatestItem;

  /// <summary>
  /// List of terms that failed to be crawled. Not referenced anywhere else in this class.
  /// </summary>
  private List<string> FailedQiHaoList;

  /// <summary>
  /// Whether the current run stored any draw: cleared by Execute, set by DoMainUrl.
  /// Not read anywhere in this class.
  /// </summary>
  private bool isGetData;
  308. #endregion
  309. }
  310. }