CloudMonitorBusiness.cs 103 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
7227822792280228122822283228422852286228722882289229022912292229322942295229622972298229923002301230223032304230523062307230823092310231123122313231423152316231723182319232023212322232323242325232623272328232923302331233223332334233523362337233823392340234123422343234423452346234723482349235023512352235323542355235623572358235923602361236223632364236523662367236823692370237123722373237423752376237723782379238023812382
  1. using PMS.BusinessModels.CloudMonitorManage;
  2. using PMS.BusinessModels.SMS;
  3. using PMS.BusinessService.SysManager;
  4. using PMS.DBService.CloudMonitorManage;
  5. using PMS.DBService.SysManager;
  6. using PMS.Interface;
  7. using PMS.Interface.CloudMonitorManage;
  8. using PMS.Interface.MessageManage;
  9. using PMS.Plugins.Common;
  10. using QWPlatform.IService;
  11. using QWPlatform.SystemLibrary;
  12. using QWPlatform.SystemLibrary.LogManager;
  13. using QWPlatform.SystemLibrary.Utils;
  14. using System;
  15. using System.Collections.Generic;
  16. using System.Configuration;
  17. using System.Data;
  18. using System.Linq;
  19. using System.Text;
  20. using System.Threading;
  21. using System.Threading.Tasks;
  22. using static System.Collections.Specialized.BitVector32;
  23. using System.Web.Caching;
  24. namespace PMS.BusinessService.CloudMonitorManage
  25. {
  26. public class CloudMonitorBusiness : ICloudMonitor
  27. {
  // Data-access service used to load and save the cloud-monitor configuration.
  private ConfigDBService configDBService = DataServiceBase.Instance<ConfigDBService>();

  // Data-access service for cloud-monitor servers, indices, alerts and custom alert/API settings.
  private CloudMonitorService dbCloudMonitor = DataServiceBase.Instance<CloudMonitorService>();

  // System configuration service.
  private SysConfigBLLServier configBll = QWPlatform.SystemLibrary.Provider.SingletonProvider<SysConfigBLLServier>.Instance;

  // Message push service.
  private IMessageManage notice = InterfaceFactory.CreateBusinessInstance<IMessageManage>();

  // Publishing address, read from the "PublishingAddress" app setting.
  public static string publishingAddress = ConfigurationManager.AppSettings["PublishingAddress"].ToStringEx();

  private static Logger Log = Logger.Instance;

  /// <summary>
  /// Cached cloud-monitor configuration; null means "not loaded yet / invalidated".
  /// </summary>
  private static CloudMonitorConfig _cloudMonitorConfig;

  /// <summary>
  /// Cache keyed by server id; the value is the server index id.
  /// </summary>
  private static Dictionary<string, string> _cacheIndexId = new Dictionary<string, string>();

  /// <summary>
  /// Cache for sustained (continuous) alerts.
  /// </summary>
  private static Dictionary<string, object> _cacheDuration = new Dictionary<string, object>();

  /// <summary>
  /// Cached custom alert data; null means "not loaded yet / invalidated".
  /// </summary>
  private static List<CustomAlertModel> _cacheCustomAlertList;

  /// <summary>
  /// Cached project monitoring data.
  /// </summary>
  private static List<ProjectMonitorModel> _cacheProjectMonitorList;
  57. #region 云监控配置相关
  /// <summary>
  /// Saves the complete cloud-monitor configuration and invalidates the cached copy.
  /// </summary>
  /// <param name="cloudMonitorConfig">Configuration to persist.</param>
  /// <returns>The result reported by the configuration data service.</returns>
  public bool SaveCloudMonitorConfig(CloudMonitorConfig cloudMonitorConfig)
  {
      // Drop the cached copy up front so readers stop seeing the old value.
      _cloudMonitorConfig = null;
      try
      {
          return configDBService.SaveCloudMonitorConfig(cloudMonitorConfig);
      }
      finally
      {
          // Invalidate again once the write has finished: a reader that reloaded
          // the cache while the save was still in flight may have cached the
          // pre-save configuration, which would otherwise stay cached indefinitely.
          _cloudMonitorConfig = null;
      }
  }
  /// <summary>
  /// Saves the collection (data-gathering) part of the cloud-monitor configuration.
  /// </summary>
  /// <param name="collectionConfig">New collection settings.</param>
  /// <returns>The result of <see cref="SaveCloudMonitorConfig"/>.</returns>
  public bool SaveCollectionConfig(CollectionConfig collectionConfig)
  {
      CloudMonitorConfig merged = GetCloudMonitorConfig();
      merged.CollectionConfig = collectionConfig;

      // Hand the configured frequency to the scheduler before persisting.
      WebUI.Jobs.SchedulerMain.CollectionInterruptJob(collectionConfig.采集服务中断执行频率);

      bool saved = SaveCloudMonitorConfig(merged);
      return saved;
  }
  /// <summary>
  /// Saves the alert part of the cloud-monitor configuration.
  /// </summary>
  /// <param name="alertConfig">New alert settings.</param>
  /// <returns>The result of <see cref="SaveCloudMonitorConfig"/>.</returns>
  public bool SaveAlertConfig(AlertConfig alertConfig)
  {
      CloudMonitorConfig merged = GetCloudMonitorConfig();
      merged.AlertConfig = alertConfig;
      bool saved = SaveCloudMonitorConfig(merged);
      return saved;
  }
  /// <summary>
  /// Returns the cloud-monitor configuration, loading it from the data service
  /// when no cached copy is available.
  /// </summary>
  /// <returns>The cached (or freshly loaded) configuration.</returns>
  public CloudMonitorConfig GetCloudMonitorConfig()
  {
      // Use the cached instance when present; otherwise load it and remember it.
      return _cloudMonitorConfig
          ?? (_cloudMonitorConfig = configDBService.GetCloudMonitorConfig());
  }
  104. #endregion
  105. #region 自定义预警配置相关
  /// <summary>
  /// Gets the custom alert configurations of a project.
  /// </summary>
  /// <param name="itemId">Project id.</param>
  /// <returns>The list returned by the data layer for that project.</returns>
  public List<CustomAlertModel> GetCustomAlertModelByItemId(string itemId)
      => dbCloudMonitor.GetCustomAlertModelByItemId(itemId);
  /// <summary>
  /// Gets the started custom alert configurations of a project.
  /// </summary>
  /// <param name="itemId">Project id.</param>
  /// <returns>The list returned by the data layer for that project.</returns>
  public List<CustomAlertModel> GetCustomAlertModelByItemIdAndStart(string itemId)
      => dbCloudMonitor.GetCustomAlertModelByItemIdAndStart(itemId);
  /// <summary>
  /// Gets the started custom service (API) configurations of a project.
  /// </summary>
  /// <param name="itemId">Project id.</param>
  /// <returns>The list returned by the data layer for that project.</returns>
  public List<CustomAPIModel> GetCustomServerModelByItemIdAndStart(string itemId)
      => dbCloudMonitor.GetCustomServerModelByItemIdAndStart(itemId);
  /// <summary>
  /// Gets the custom alert configurations of a channel.
  /// </summary>
  /// <param name="channelId">Channel id.</param>
  /// <param name="search">Search value forwarded unchanged to the data layer.</param>
  /// <returns>The list returned by the data layer.</returns>
  public List<CustomAlertModel> GetCustomAlertModelByChannelId(string channelId, string search)
      => dbCloudMonitor.GetCustomAlertModelByChannelId(channelId, search);
  /// <summary>
  /// Gets the custom API configurations of a channel.
  /// </summary>
  /// <param name="channelId">Channel id.</param>
  /// <param name="search">Search value forwarded unchanged to the data layer.</param>
  /// <returns>The list returned by the data layer.</returns>
  public List<CustomAPIModel> GetCustomAPIModelByChannelId(string channelId, string search)
      => dbCloudMonitor.GetCustomAPIModelByChannelId(channelId, search);
  /// <summary>
  /// Gets the custom alert configurations created by a given user.
  /// </summary>
  /// <param name="creatorId">Creator id.</param>
  /// <returns>The list returned by the data layer.</returns>
  public List<CustomAlertModel> GetCustomAlertModelByCreatorId(string creatorId)
      => dbCloudMonitor.GetCustomAlertModelByCreatorId(creatorId);
  /// <summary>
  /// Adds a custom alert configuration.
  /// </summary>
  /// <param name="model">Configuration to insert.</param>
  /// <returns>The result reported by the data layer.</returns>
  public bool InsertCustomAlert(CustomAlertModel model)
  {
      // Invalidate the cached custom alert list before writing.
      _cacheCustomAlertList = null;
      return dbCloudMonitor.InsertCustomAlert(model);
  }
  /// <summary>
  /// Adds a custom API configuration.
  /// </summary>
  /// <param name="model">Configuration to insert.</param>
  /// <returns>The result reported by the data layer.</returns>
  public bool InsertCustomAPI(CustomAPIModel model)
  {
      // Invalidate the cached custom alert list before writing.
      _cacheCustomAlertList = null;
      return dbCloudMonitor.InsertCustomAPI(model);
  }
  /// <summary>
  /// Updates a custom alert configuration.
  /// </summary>
  /// <param name="model">Configuration carrying the new values.</param>
  /// <returns>The result reported by the data layer.</returns>
  public bool UpdateCustomAlert(CustomAlertModel model)
  {
      // Invalidate the cached custom alert list before writing.
      _cacheCustomAlertList = null;
      return dbCloudMonitor.UpdateCustomAlert(model);
  }
  /// <summary>
  /// Updates a custom API configuration.
  /// </summary>
  /// <param name="model">Configuration carrying the new values.</param>
  /// <returns>The result reported by the data layer.</returns>
  public bool UpdateCustomAPI(CustomAPIModel model)
  {
      // Invalidate the cached custom alert list before writing.
      _cacheCustomAlertList = null;
      return dbCloudMonitor.UpdateCustomAPI(model);
  }
  /// <summary>
  /// Deletes a custom alert configuration by id.
  /// </summary>
  /// <param name="id">Id of the configuration to delete.</param>
  /// <returns>The result reported by the data layer.</returns>
  public bool DeleteCustomAlertById(string id)
  {
      // Invalidate the cached custom alert list before writing.
      _cacheCustomAlertList = null;
      return dbCloudMonitor.DeleteCustomAlertById(id);
  }
  /// <summary>
  /// Deletes a custom API configuration by id.
  /// </summary>
  /// <param name="id">Id of the configuration to delete.</param>
  /// <returns>The result reported by the data layer.</returns>
  public bool DeleteCustomAPIById(string id)
  {
      // InsertCustomAPI and UpdateCustomAPI both invalidate the cached custom
      // alert list; do the same here so all three mutators behave alike.
      // Clearing the cache only forces a reload on the next read.
      _cacheCustomAlertList = null;
      return dbCloudMonitor.DeleteCustomAPIById(id);
  }
  /// <summary>
  /// Gets all started custom alert configurations, using the cached list when one exists.
  /// </summary>
  /// <returns>The cached (or freshly loaded) list.</returns>
  public List<CustomAlertModel> GetCustomAlertModelByStart()
  {
      // Load once and remember the result until a mutator clears the cache.
      return _cacheCustomAlertList
          ?? (_cacheCustomAlertList = dbCloudMonitor.GetCustomAlertModelByStart());
  }
  241. #endregion
  242. #region 服务器指标信息相关
  /// <summary>
  /// Gets the servers of a project and attaches to each server its database entries.
  /// </summary>
  /// <param name="itemid">Project id.</param>
  /// <returns>The servers returned by the data layer, with their database list filled in.</returns>
  public List<ServerInfoModel> GetServerByItemId(string itemid)
  {
      var servers = dbCloudMonitor.GetServerByItemId(itemid);

      // Comma-separated server ids used to fetch all database rows in one call.
      var joinedIds = string.Join(",", servers.Select(server => server.ID));
      if (string.IsNullOrEmpty(joinedIds))
      {
          return servers;
      }

      var databases = GetDbInfoByServerId(joinedIds);
      foreach (var server in servers)
      {
          server.数据库 = databases.Where(db => server.ID == db.服务器ID).ToList();
      }

      return servers;
  }
  /// <summary>
  /// Gets the index information of all servers, with rounded usage values and status labels applied.
  /// </summary>
  /// <returns>The rows returned by the data layer after <see cref="WorkWithColor"/> processed them.</returns>
  public List<ServerIndexInfoModel> GetServerIndexInfoAll()
  {
      List<ServerIndexInfoModel> rows = dbCloudMonitor.GetServerIndexInfoAll();
      WorkWithColor(rows);
      return rows;
  }
  /// <summary>
  /// Gets server index information filtered by project id, with rounded usage values
  /// and status labels applied.
  /// </summary>
  /// <param name="itemId">Project id.</param>
  /// <returns>The rows returned by the data layer after <see cref="WorkWithColor"/> processed them.</returns>
  public List<ServerIndexInfoModel> GetServerIndexInfoByProjectId(string itemId)
  {
      List<ServerIndexInfoModel> rows = dbCloudMonitor.GetServerIndexInfoByProjectId(itemId);
      WorkWithColor(rows);
      return rows;
  }
  /// <summary>
  /// Gets server index information filtered by channel id, with rounded usage values
  /// and status labels applied.
  /// </summary>
  /// <param name="channelId">Channel id.</param>
  /// <param name="search">Search value forwarded unchanged to the data layer (defaults to an empty string).</param>
  /// <returns>The rows returned by the data layer after <see cref="WorkWithColor"/> processed them.</returns>
  public List<ServerIndexInfoModel> GetServerIndexInfoByChannelId(string channelId, string search = "")
  {
      List<ServerIndexInfoModel> rows = dbCloudMonitor.GetServerIndexInfoByChannelId(channelId, search);
      WorkWithColor(rows);
      return rows;
  }
  /// <summary>
  /// Gets index detail records by index id.
  /// </summary>
  /// <param name="indexId">Index id.</param>
  /// <param name="startTime">Start time forwarded to the data layer.</param>
  /// <param name="endTime">End time forwarded to the data layer.</param>
  /// <returns>The detail records returned by the data layer.</returns>
  public List<ServerIndexDetailModel> GetServerIndexDetailByIndexId(string indexId, DateTime startTime, DateTime endTime)
      => dbCloudMonitor.GetServerIndexDetailByIndexId(indexId, startTime, endTime);
  /// <summary>
  /// Gets index detail records by server id.
  /// </summary>
  /// <param name="serverId">Server id.</param>
  /// <param name="startTime">Start time forwarded to the data layer.</param>
  /// <param name="endTime">End time forwarded to the data layer.</param>
  /// <returns>The detail records returned by the data layer.</returns>
  public List<ServerIndexDetailModel> GetServerIndexDetailByServerId(string serverId, DateTime startTime, DateTime endTime)
      => dbCloudMonitor.GetServerIndexDetailByServerId(serverId, startTime, endTime);
  /// <summary>
  /// Rounds the CPU, memory and disk usage of every row to two decimals and sets the
  /// matching status label when a usage value reaches a configured alert threshold.
  /// </summary>
  /// <remarks>
  /// A status is only written when a threshold is reached; otherwise the existing
  /// status value of the row is left as it is.
  /// </remarks>
  /// <param name="models">Rows to update in place.</param>
  private void WorkWithColor(List<ServerIndexInfoModel> models)
  {
      var thresholds = GetCloudMonitorConfig().AlertConfig;
      foreach (var server in models)
      {
          // CPU usage
          var cpu = Math.Round(server.CPU使用率, 2);
          server.CPU使用率 = cpu;
          if (thresholds.CPU使用高危 <= cpu)
          {
              server.CPU状态 = "高危";
          }
          else if (thresholds.CPU使用濒危 <= cpu && cpu < thresholds.CPU使用高危)
          {
              server.CPU状态 = "濒危";
          }

          // Memory usage
          var memory = Math.Round(server.内存使用率, 2);
          server.内存使用率 = memory;
          if (thresholds.内存使用高危 <= memory)
          {
              server.内存状态 = "高危";
          }
          else if (thresholds.内存使用濒危 <= memory && memory < thresholds.内存使用高危)
          {
              server.内存状态 = "濒危";
          }

          // Disk usage
          var disk = Math.Round(server.磁盘使用率, 2);
          server.磁盘使用率 = disk;
          if (thresholds.磁盘使用高危 <= disk)
          {
              server.磁盘状态 = "高危";
          }
          else if (thresholds.磁盘使用濒危 <= disk && disk < thresholds.磁盘使用高危)
          {
              server.磁盘状态 = "濒危";
          }
      }
  }
  351. #endregion
  352. #region 服务器预警相关
  /// <summary>
  /// Records a reported server alert detail: creates a new alert when none exists for
  /// the external unique key, otherwise adds to or updates the existing alert's details.
  /// </summary>
  /// <param name="model">
  /// Reported alert detail. Its external unique key is filled in as
  /// "alert type_server id" when empty, and its alert id is set by this method.
  /// </param>
  /// <returns>The id of the alert the detail now belongs to.</returns>
  public string InsertServerAlert(ServerAlertDetailModel model)
  {
      if (string.IsNullOrEmpty(model.外部唯一键))
      {
          model.外部唯一键 = model.预警类型 + "_" + model.服务器ID;
      }

      var existingAlert = dbCloudMonitor.GetServerAlertByServerIdAndAlertType(model.外部唯一键);
      if (existingAlert != null)
      {
          // An alert with this key already exists: attach the detail to it.
          model.预警ID = existingAlert.ID;
          var existingDetail = dbCloudMonitor.GetServerAlertDetailByAlertIdAndAlertNameAndAlertLevel(model.预警ID, model.预警名称, model.预警等级);
          if (existingDetail == null)
          {
              dbCloudMonitor.InsertServerAlertDetail(model);
              return model.预警ID;
          }

          // Same name and level already recorded: refresh it and add up the count.
          existingDetail.预警说明 = model.预警说明;
          existingDetail.当前值 = model.当前值;
          existingDetail.预警次数 += model.预警次数;
          existingDetail.最后修改时间 = model.最后修改时间;
          dbCloudMonitor.UpdateServerAlertDetailNumber(existingDetail);
          return model.预警ID;
      }

      // No alert for this key yet: create the alert and its first detail.
      var newAlert = new ServerAlertModel
      {
          ID = Guid.NewGuid().ToString("D"),
          服务器ID = model.服务器ID,
          预警类型 = model.预警类型,
          创建时间 = model.最后修改时间,
          项目ID = model.项目ID,
          最后上报时间 = DateTime.Now,
          外部唯一键 = model.外部唯一键
      };
      dbCloudMonitor.InsertServerAlert(newAlert);
      model.预警ID = newAlert.ID;
      dbCloudMonitor.InsertServerAlertDetail(model);

      // Send the notifications (mail, WeChat) on a thread-pool thread.
      ThreadPool.QueueUserWorkItem(new WaitCallback(SendNotice), newAlert.ID);
      return model.预警ID;
  }
  /// <summary>
  /// Thread-pool callback that notifies the configured recipients about a server alert
  /// by e-mail and by WeChat.
  /// </summary>
  /// <remarks>
  /// Recipients are collected from the headquarters alert configuration (red alerts only),
  /// from the project record and from the channel record. This method is queued through
  /// <c>ThreadPool.QueueUserWorkItem</c>, so every failure is caught and logged here
  /// instead of escaping as an unhandled exception on a pool thread.
  /// </remarks>
  /// <param name="alertlId">Alert id (a string passed as the work item state).</param>
  private void SendNotice(object alertlId)
  {
      try
      {
          // Load the alert together with its computed display fields.
          var alertModel = GetServerAlertByAlertlId((string)alertlId);
          if (alertModel == null)
          {
              Log.Warn("Cloud monitor notice skipped, alert not found: " + alertlId);
              return;
          }

          var toUsers = new List<string>();
          var ccUsers = new List<string>();
          var phoneList = new List<string>();
          var isRedAlert = alertModel.预警等级 == (int)AlertLevelEnum.红色预警;

          // Message grading: only red alerts are copied to headquarters.
          if (isRedAlert)
          {
              var config = GetCloudMonitorConfig().AlertConfig;
              if (config.邮件推送开关 == "on")
              {
                  AddSemicolonSeparated(ccUsers, config.邮箱推送账号);
              }
              if (config.微信消息开关 == "on")
              {
                  AddSemicolonSeparated(phoneList, config.微信推送帐号);
              }
          }

          // Mail and WeChat recipients configured on the project.
          var projectInfo = dbCloudMonitor.GetProInfo(alertModel.项目ID);
          if (projectInfo != null && projectInfo.Rows.Count > 0)
          {
              AddSemicolonSeparated(toUsers, projectInfo.Rows[0].GetValueByName<string>("邮件推送"));
              AddSemicolonSeparated(phoneList, projectInfo.Rows[0].GetValueByName<string>("微信推送"));
          }

          // Recipients configured on the channel.
          var channelInfo = dbCloudMonitor.GetChannelInfo(alertModel.渠道ID);
          if (channelInfo != null && channelInfo.Rows.Count > 0)
          {
              AddSemicolonSeparated(ccUsers, channelInfo.Rows[0].GetValueByName<string>("技术联系人邮箱"));
              AddSemicolonSeparated(phoneList, channelInfo.Rows[0].GetValueByName<string>("技术联系人微信"));

              // Message grading: only red alerts are copied to the channel's business contact.
              if (isRedAlert)
              {
                  AddSemicolonSeparated(ccUsers, channelInfo.Rows[0].GetValueByName<string>("商务联系人邮箱"));
                  AddSemicolonSeparated(phoneList, channelInfo.Rows[0].GetValueByName<string>("商务联系人微信"));
              }
          }

          // Resolve the collected phone numbers to WeChat open ids.
          var openIdList = dbCloudMonitor.GetUserOpenIdByPhone(phoneList);

          var 处理状态 = alertModel.处理时间 == DateTime.MinValue ? "未处理" : "已处理";
          var title = $"【云监控】{alertModel.预警类型显示}预警{处理状态}";
          var url = $"{publishingAddress}/CloudMonitor/EarlyWarningInfo?id={alertModel.ID}";
          var body = $@"渠道名称:{alertModel.渠道名称}
项目名称:{alertModel.项目名称}
服务器IP:{alertModel.服务器IP}
负责人:{alertModel.负责人}
预警类型:{alertModel.预警类型显示}
预警等级:{alertModel.预警等级显示}
异常说明:{alertModel.异常说明}
处理状态:{处理状态}";
          if (处理状态 == "已处理")
          {
              body += $@"
处理说明:{alertModel.处理说明}";
          }

          // A mail failure must not prevent the WeChat push.
          try
          {
              SendMail(title, body, url, toUsers, ccUsers);
          }
          catch (Exception mailError)
          {
              Log.Warn("Cloud monitor notice: sending mail failed: " + mailError);
          }

          Log.Info("开始准备发送微信消息:" + Strings.ObjectToJson(openIdList));
          SendWxMsg(title, url, openIdList);
      }
      catch (Exception ex)
      {
          // Last line of defence: never let an exception leave the pool thread.
          Log.Warn("Cloud monitor notice failed for alert " + alertlId + ": " + ex);
      }
  }

  /// <summary>
  /// Splits <paramref name="raw"/> on ';' and appends the pieces to <paramref name="target"/>;
  /// does nothing when <paramref name="raw"/> is null or empty.
  /// </summary>
  /// <param name="target">List that receives the pieces.</param>
  /// <param name="raw">Semicolon-separated values, or null/empty.</param>
  private static void AddSemicolonSeparated(List<string> target, string raw)
  {
      if (!string.IsNullOrEmpty(raw))
      {
          target.AddRange(raw.Split(';'));
      }
  }
  /// <summary>
  /// Sends an e-mail through the SMTP server described by the system e-mail configuration.
  /// </summary>
  /// <remarks>
  /// Nothing is sent when there is no non-empty "to" address, even if cc addresses exist.
  /// </remarks>
  /// <param name="title">Mail subject.</param>
  /// <param name="body">Mail text; a "view details" line with <paramref name="url"/> is appended.</param>
  /// <param name="url">Link to the alert details.</param>
  /// <param name="toUsers">Primary recipients; duplicates and empty entries are removed.</param>
  /// <param name="ccUsers">Copy recipients (may be null); duplicates and empty entries are removed.</param>
  private void SendMail(string title, string body, string url, List<string> toUsers, List<string> ccUsers)
  {
      if (toUsers == null)
      {
          return;
      }

      var recipients = toUsers.Distinct().Where(address => !string.IsNullOrEmpty(address)).ToArray();
      if (recipients.Length == 0)
      {
          return;
      }

      var copies = (ccUsers ?? new List<string>())
          .Distinct()
          .Where(address => !string.IsNullOrEmpty(address))
          .ToArray();

      var emailConfig = configBll.GetEmailConfig();
      var serverInfo = new QWPlatform.SystemLibrary.Email.EmailServerInfo(emailConfig.EmailServer, emailConfig.SendName, emailConfig.SendEmail, emailConfig.SendPassword, emailConfig.Port);
      var smtpClient = new QWPlatform.SystemLibrary.Email.SmtpEmail(serverInfo);

      // Build the message and send it.
      var message = new QWPlatform.SystemLibrary.Email.EmailInfo(title, body + $"\r\n\r\n查看详情:{url}", recipients, copies);
      message.FromUser(emailConfig.SendEmail, emailConfig.SendName);

      var sent = smtpClient.Send(message);
      if (sent)
      {
          return;
      }

      // Sending failed.
      Log.Warn("邮件发送失败,请检查密码或服务器配置是否正确");
  }
  /// <summary>
  /// Sends a WeChat template message to the given open ids.
  /// </summary>
  /// <param name="title">Text shown in the "first" and "keyword2" fields of the template.</param>
  /// <param name="url">Link opened from the message.</param>
  /// <param name="openIdList">Receiver open ids; duplicates and empty entries are removed. Nothing is sent when null or empty.</param>
  private void SendWxMsg(string title, string url, List<string> openIdList)
  {
      if (openIdList == null)
      {
          return;
      }

      var receivers = openIdList.Distinct().Where(openid => !string.IsNullOrEmpty(openid)).ToList();
      if (receivers.Count == 0)
      {
          return;
      }

      List<MessageDetailsDto> list = receivers.Select(openid => new MessageDetailsDto() { 接收人id = openid }).ToList();

      // The title is embedded in a hand-built JSON string: escape backslashes and
      // double quotes so a title containing them cannot break the payload.
      // Titles without those characters produce exactly the same JSON as before.
      var safeTitle = (title ?? string.Empty).Replace("\\", "\\\\").Replace("\"", "\\\"");

      NotificationDto no = new NotificationDto
      {
          style = "3",
          template_code = "OIE51OsXeECnoPxGgPTQ7acXybc7t1plgAbdlH-mMWE",
          template_value = "{\"first\":{\"value\":\"" + safeTitle + "\",\"color\":\"#173177\"},\"keyword1\":{\"value\":\"" + DateTime.Now + "\",\"color\":\"#173177\"},\"keyword2\":{\"value\":\"" + safeTitle + "\",\"color\":\"#173177\"},\"remark\":{\"value\":\"点击【查看详情】查看问题\",\"color\":\"#173177\"}}",
          url = url,
          record_items = list
      };
      Log.Info("发送微信消息:" + Strings.ObjectToJson(no));
      notice.SendWeChartTempletMessge(no);
  }
  /// <summary>
  /// Gets one server alert by alert id, with its computed display fields and,
  /// when the alert has been handled, the handling description.
  /// </summary>
  /// <param name="alertlId">Alert id.</param>
  /// <returns>The alert, or null when the data layer finds no alert for the id.</returns>
  public ServerAlertModel GetServerAlertByAlertlId(string alertlId)
  {
      var alert = dbCloudMonitor.GetServerAlertByAlertlId(alertlId);
      if (alert == null)
      {
          // Unknown id: passing a null element on to WorkServerAlert would throw.
          return null;
      }

      WorkServerAlert(new List<ServerAlertModel>() { alert });

      // A handling time other than DateTime.MinValue marks the alert as handled.
      var handled = !(alert.处理时间 == DateTime.MinValue);
      if (handled)
      {
          var processList = GetServerAlertProcessByAlertId(alert.ID);
          alert.处理说明 = processList?.FirstOrDefault(m => m.处理状态 == (int)AlertStateEnum.已处理)?.处理说明;
      }

      return alert;
  }
  /// <summary>
  /// Gets several server alerts by their alert ids, with computed display fields filled in.
  /// </summary>
  /// <param name="alertlId">Alert ids.</param>
  /// <returns>The alerts returned by the data layer after <see cref="WorkServerAlert"/> processed them.</returns>
  public List<ServerAlertModel> GetServerAlertByAlertlId(List<string> alertlId)
  {
      List<ServerAlertModel> alerts = dbCloudMonitor.GetServerAlertByAlertlId(alertlId);
      WorkServerAlert(alerts);
      return alerts;
  }
  /// <summary>
  /// Gets all server alerts, with computed display fields filled in.
  /// </summary>
  /// <param name="search">Search value forwarded unchanged to the data layer.</param>
  /// <returns>The alerts returned by the data layer after <see cref="WorkServerAlert"/> processed them.</returns>
  public List<ServerAlertModel> GetServerAlertAll(string search)
  {
      List<ServerAlertModel> alerts = dbCloudMonitor.GetServerAlertAll(search);
      WorkServerAlert(alerts);
      return alerts;
  }
  /// <summary>
  /// Gets the server alerts matching the given search conditions, with computed display fields filled in.
  /// </summary>
  /// <param name="search">Search conditions; passed to the data layer together with the alert configuration.</param>
  /// <returns>The alerts returned by the data layer after <see cref="WorkServerAlert"/> processed them.</returns>
  public List<ServerAlertModel> GetServerAlertBySearch(ServerAlertSearch search)
  {
      List<ServerAlertModel> alerts = dbCloudMonitor.GetServerAlertBySearch(search, GetCloudMonitorConfig().AlertConfig);
      WorkServerAlert(alerts);
      return alerts;
  }
  /// <summary>
  /// Fills in the computed fields of each alert (alert counts, last report time, level,
  /// level display text and the exception description) from the alert's detail records.
  /// </summary>
  /// <remarks>
  /// Detail records are fetched in batches of 100 alert ids. Alerts that have no detail
  /// record get zero counts and keep their other fields unchanged.
  /// </remarks>
  /// <param name="data">Alerts to update in place; null or empty lists are ignored.</param>
  private void WorkServerAlert(List<ServerAlertModel> data)
  {
      if (data == null || data.Count == 0)
      {
          return;
      }

      // Number of alert ids sent to the data layer per call.
      const int batchSize = 100;

      var alertIds = data.Where(alert => alert != null).Select(alert => alert.ID).ToList();
      var details = new List<ServerAlertDetailModel>();
      for (var offset = 0; offset < alertIds.Count; offset += batchSize)
      {
          var batch = alertIds.GetRange(offset, Math.Min(batchSize, alertIds.Count - offset));
          var ids = string.Join(",", batch);
          if (string.IsNullOrEmpty(ids))
          {
              continue;
          }

          var batchDetails = dbCloudMonitor.GetServerAlertDetailByAlertlId(ids);
          if (batchDetails != null)
          {
              details.AddRange(batchDetails);
          }
      }

      // Group the details once instead of rescanning the whole list for every alert.
      var detailsByAlertId = details.ToLookup(detail => detail.预警ID);

      foreach (var item in data)
      {
          if (item == null)
          {
              continue;
          }

          // Materialized once: the details are read several times below.
          var curDetails = detailsByAlertId[item.ID].ToList();

          item.预警次数 = curDetails.Sum(m => m.预警次数);
          item.橙色预警次数 = curDetails.Where(m => m.预警等级 == (int)AlertLevelEnum.橙色预警).Sum(m => m.预警次数);
          item.红色预警次数 = curDetails.Where(m => m.预警等级 == (int)AlertLevelEnum.红色预警).Sum(m => m.预警次数);

          // Most recently modified detail; null when the alert has no details at all.
          var lasterDetail = curDetails.OrderByDescending(m => m.最后修改时间).FirstOrDefault();
          if (lasterDetail == null)
          {
              continue;
          }

          item.最后上报时间 = lasterDetail.最后修改时间;
          var lasterTitle = Enum.GetName(typeof(AlertLevelEnum), lasterDetail.预警等级);
          item.预警等级 = lasterDetail.预警等级;
          item.预警等级显示 = lasterTitle;

          switch (item.预警类型)
          {
              case (int)AlertTypeEnum.硬件CPU:
              case (int)AlertTypeEnum.硬件内存:
              case (int)AlertTypeEnum.硬件磁盘空间:
                  item.异常说明 = $"{lasterTitle},{lasterDetail.预警名称}预警值{lasterDetail.预警说明},当前{lasterDetail.当前值}";
                  break;
              case (int)AlertTypeEnum.数据库连接数不足:
                  // Every member is read null-safely in case the JSON could not be parsed.
                  DbConnectInfo dbConnectInfo = Strings.JsonToModel<DbConnectInfo>(lasterDetail.预警说明 ?? "");
                  item.异常说明 = $"{dbConnectInfo?.DbName}数据库连接数已达{dbConnectInfo?.ConnectUsed},最大{dbConnectInfo?.ConnectTotal}";
                  break;
              case (int)AlertTypeEnum.数据库死锁:
                  DbLockedInfo dbLockedInfo = Strings.JsonToModel<DbLockedInfo>(lasterDetail.预警说明 ?? "");
                  item.异常说明 = $"{dbLockedInfo?.DbName}数据库出现死锁,当前锁定数为:{lasterDetail.当前值}";
                  break;
              case (int)AlertTypeEnum.服务中断:
                  // One line per alert name with the summed number of occurrences.
                  var groups = curDetails.GroupBy(m => m.预警名称).Select(m => $"{m.Key}状态异常{m.Sum(n => n.预警次数)}次");
                  item.异常说明 = string.Join("\r\n", groups);
                  break;
              case (int)AlertTypeEnum.自定义指标:
                  DbCustomAlertInfo dbCustomAlertInfo = Strings.JsonToModel<DbCustomAlertInfo>(lasterDetail.预警说明 ?? "");
                  item.异常说明 = $"数据库:{dbCustomAlertInfo?.DbName},{dbCustomAlertInfo?.CustomName}:当前值为:{lasterDetail.当前值}";
                  break;
              case (int)AlertTypeEnum.磁盘可用天数:
                  item.异常说明 = $"{lasterTitle},{lasterDetail.预警名称},当前剩余可用天数:{lasterDetail.当前值}";
                  break;
              default:
                  // Collection-interrupted, custom-service and any other type share this format.
                  item.异常说明 = lasterDetail.预警名称 + " " + lasterDetail.预警说明 + " " + lasterDetail.当前值;
                  break;
          }
      }
  }
  682. #endregion
  683. #region 服务器预警处理
  /// <summary>
  /// Records a handling action for one or more server alerts and updates the state of each alert.
  /// </summary>
  /// <param name="model">
  /// Template for the handling record. <c>预警ID</c> may contain several alert IDs separated by commas;
  /// one handling record is written per ID.
  /// </param>
  /// <returns>
  /// <c>true</c> after every listed alert has been processed; <c>false</c> when no usable alert ID was supplied.
  /// </returns>
  public bool InsertServerAlertProcess(ServerAlertProcessModel model)
  {
      // A missing model or ID list previously surfaced as a NullReferenceException on Split.
      if (model == null || string.IsNullOrWhiteSpace(model.预警ID))
      {
          return false;
      }

      // Blank segments (e.g. a trailing comma) are dropped so that no handling row is written for an empty alert ID.
      var ids = model.预警ID
          .Split(',')
          .Select(id => id.Trim())
          .Where(id => id.Length > 0)
          .ToList();
      if (ids.Count == 0)
      {
          return false;
      }

      foreach (var id in ids)
      {
          var newModel = new ServerAlertProcessModel()
          {
              ID = Guid.NewGuid().ToString(),
              预警ID = id,
              创建时间 = DateTime.Now,
              处理人 = model.处理人,
              处理说明 = model.处理说明,
              处理状态 = model.处理状态,
          };
          dbCloudMonitor.InsertServerAlertProcess(newModel);
          dbCloudMonitor.ProcessServerAlert(newModel.预警ID, newModel.处理状态, newModel.创建时间);
      }

      if (model.处理状态 == (int)AlertStateEnum.已处理)
      {
          // The notice is queued on the thread pool and only for the first alert of the batch.
          ThreadPool.QueueUserWorkItem(new WaitCallback(SendNotice), ids[0]);
      }
      return true;
  }
  /// <summary>
  /// Looks up the handling history of a server alert.
  /// </summary>
  /// <param name="alertId">ID of the alert whose handling records are requested.</param>
  /// <returns>The handling records returned by the data layer for that alert.</returns>
  public List<ServerAlertProcessModel> GetServerAlertProcessByAlertId(string alertId)
      => dbCloudMonitor.GetServerAlertProcessByAlertId(alertId);
  723. #endregion
  724. #region 项目监控处理
  /// <summary>
  /// Starts or stops monitoring for a project, creating the monitor record on first use.
  /// </summary>
  /// <param name="projectId">ID of the project to start or stop.</param>
  /// <param name="state"><c>true</c> stores monitor state 1, <c>false</c> stores monitor state 2.</param>
  /// <param name="clientId">Client ID written to the monitor record (defaults to an empty string).</param>
  /// <returns>The result of the insert or update performed by the data layer.</returns>
  public bool StartOrStopProjectMonitor(string projectId, bool state, string clientId = "")
  {
      // Invalidate the cached monitor list so the next GetProjectMonitor call reloads it.
      _cacheProjectMonitorList = null;

      var monitorState = state ? 1 : 2;
      var existing = dbCloudMonitor.GetProjectMonitorByProjectId(projectId);
      if (existing != null)
      {
          // Known project: refresh the last-monitored date, state and client.
          existing.最后监控日期 = DateTime.Now;
          existing.监控状态 = monitorState;
          existing.客户端ID = clientId;
          return dbCloudMonitor.UpdateProjectMonitor(existing);
      }

      // First time this project is monitored: first and last dates start out equal.
      var created = new ProjectMonitorModel();
      created.ID = Guid.NewGuid().ToString("D");
      created.项目ID = projectId;
      var startedAt = DateTime.Now;
      created.首次监控日期 = startedAt;
      created.最后监控日期 = created.首次监控日期;
      created.监控状态 = monitorState;
      created.客户端ID = clientId;
      return dbCloudMonitor.InsertProjectMonitor(created);
  }
  /// <summary>
  /// Returns the project monitor list, loading it from the data layer on first use and caching it afterwards.
  /// </summary>
  /// <remarks>
  /// The original note describes the result as the monitors whose state is normal; that filtering, if any,
  /// happens inside <c>dbCloudMonitor.GetProjectMonitor</c> and is not visible here.
  /// </remarks>
  /// <returns>The cached (or freshly loaded) project monitor list.</returns>
  public List<ProjectMonitorModel> GetProjectMonitor()
  {
      // Work on a local snapshot: StartOrStopProjectMonitor resets the field to null, and re-reading the
      // field after the null check could hand a null list back to callers that immediately call .Any().
      var monitors = _cacheProjectMonitorList;
      if (monitors == null)
      {
          monitors = dbCloudMonitor.GetProjectMonitor();
          _cacheProjectMonitorList = monitors;
      }
      return monitors;
  }
  /// <summary>
  /// Fetches every project monitor record, bypassing the cached list.
  /// </summary>
  /// <returns>All project monitor records returned by the data layer.</returns>
  public List<ProjectMonitorModel> GetProjectMonitorAll()
      => dbCloudMonitor.GetProjectMonitorAll();
  /// <summary>
  /// Fetches the project monitor records that match the given search criteria.
  /// </summary>
  /// <param name="search">Search criteria forwarded unchanged to the data layer.</param>
  /// <returns>The matching project monitor records.</returns>
  public List<ProjectMonitorModel> GetProjectMonitorBySearch(ServerAlertSearch search)
      => dbCloudMonitor.GetProjectMonitorBySearch(search);
  /// <summary>
  /// Fetches the project monitor records that belong to a channel.
  /// </summary>
  /// <param name="channelId">ID of the channel used as the filter.</param>
  /// <returns>The project monitor records returned by the data layer for that channel.</returns>
  public List<ProjectMonitorModel> GetProjectMonitorByChannelId(string channelId)
      => dbCloudMonitor.GetProjectMonitorByChannelId(channelId);
  792. #endregion
  793. #region 数据库管理
  /// <summary>
  /// Stores a new database record after assigning it a freshly generated ID.
  /// </summary>
  /// <param name="model">Record to insert; its <c>ID</c> is overwritten with a new GUID.</param>
  /// <returns>The result reported by the data layer.</returns>
  public bool InsertDbInfo(DbInfoModel model)
  {
      var newId = Guid.NewGuid();
      model.ID = newId.ToString("D");
      return dbCloudMonitor.InsertDbInfo(model);
  }
  /// <summary>
  /// Updates an existing database record.
  /// </summary>
  /// <param name="model">Record carrying the new values.</param>
  /// <returns>The result reported by the data layer.</returns>
  public bool UpdateDbInfo(DbInfoModel model)
      => dbCloudMonitor.UpdateDbInfo(model);
  /// <summary>
  /// Fetches the database records registered for a server.
  /// </summary>
  /// <param name="serverId">ID of the server used as the filter.</param>
  /// <returns>The database records returned by the data layer for that server.</returns>
  public List<DbInfoModel> GetDbInfoByServerId(string serverId)
      => dbCloudMonitor.GetDbInfoByServerId(serverId);
  /// <summary>
  /// Fetches a single database record by its ID.
  /// </summary>
  /// <param name="id">ID of the database record.</param>
  /// <returns>The record returned by the data layer for that ID.</returns>
  public DbInfoModel GetDbInfoById(string id)
      => dbCloudMonitor.GetDbInfoById(id);
  /// <summary>
  /// Deletes a database record by its ID.
  /// </summary>
  /// <param name="id">ID of the database record to delete.</param>
  /// <returns>The result reported by the data layer.</returns>
  public bool DeleteDbInfoById(string id)
      => dbCloudMonitor.DeleteDbInfoById(id);
  845. #endregion
  846. #region 上报指标记录
  /// <summary>
  /// Stores one uploaded-metric (push index) record.
  /// </summary>
  /// <param name="model">The push record to insert.</param>
  /// <returns>The result reported by the data layer.</returns>
  public bool InsertPushIndexDataByServerId(PushIndexDataModel model)
      => dbCloudMonitor.InsertPushIndexDataByServerId(model);
  /// <summary>
  /// Queries uploaded-metric records and wraps them, together with the total count, in a table page.
  /// </summary>
  /// <param name="search">Search criteria used for both the row query and the count query.</param>
  /// <returns>A page object whose <c>rows</c> and <c>total</c> come from the two data-layer queries.</returns>
  public PushIndexDataModelTablePage GetPushIndexData(IndexSearch search)
  {
      // Rows first, then the count, in the same order as before.
      var rows = dbCloudMonitor.GetPushIndexData(search);
      var count = dbCloudMonitor.GetPushIndexDataTotal(search);
      return new PushIndexDataModelTablePage
      {
          total = count,
          rows = rows,
      };
  }
  870. #endregion
  871. #region 服务器信息上报
  /// <summary>
  /// Handles a batch of server hardware reports (CPU, memory, disk) uploaded by a monitoring client:
  /// evaluates alerts, logs a push record per report, upserts the server's current metrics and
  /// appends a metric detail row.
  /// </summary>
  /// <param name="clientId">
  /// ID of the reporting client. Reports are ignored when no cached project monitor carries this client ID
  /// or when <c>WorkTimeCheckContinue</c> rejects the call.
  /// </param>
  /// <param name="serverInfos">One result per server; unsuccessful results are only logged as abnormal push records.</param>
  public void ReceiveServerInfo(string clientId, List<Ret<ServerInfo>> serverInfos)
  {
      // Nothing to process; avoids a NullReferenceException in the loop below.
      if (serverInfos == null) return;
      // Ignore clients that have no project monitor entry.
      if (!GetProjectMonitor().Any(m => m.客户端ID == clientId)) return;
      if (!WorkTimeCheckContinue(clientId + "ReceiveServerInfo")) return;

      foreach (var item in serverInfos)
      {
          if (!item.Success)
          {
              // Collection failed on the client: keep the error message as an abnormal push record.
              InsertPushIndexDataByServerId(new PushIndexDataModel()
              {
                  ID = Guid.NewGuid().ToString("D"),
                  服务器ID = item.Id,
                  预警ID = "",
                  类型 = (int)InfoTypeEnum.服务器硬件信息,
                  状态 = (int)PushStateTypeEnum.异常,
                  上报原始数据 = item.Msg,
                  创建时间 = item.CurrentTime,
              });
              continue;
          }

          var s = item.Data;
          ServerIndexInfoModel serverInfoModel = new ServerIndexInfoModel();
          serverInfoModel.最后修改时间 = s.CurrentTime;
          serverInfoModel.服务器ID = s.Id;
          serverInfoModel.CPU使用率 = s.CpuOccupancyRate;
          // A report with a zero total would otherwise divide by zero (exception or NaN/Infinity
          // depending on the numeric type); treat it as 0% usage instead.
          serverInfoModel.内存使用率 = s.MemoryTotal > 0 ? s.MemoryUsed / s.MemoryTotal * 100 : 0;
          serverInfoModel.磁盘使用率 = s.DiskTotal > 0 ? s.DiskUsed / s.DiskTotal * 100 : 0;

          // Evaluate CPU / memory / disk alerts.
          var alertIds = ServerInfoAlert(serverInfoModel);

          // Log the raw report together with any alert IDs it produced.
          InsertPushIndexDataByServerId(new PushIndexDataModel()
          {
              ID = Guid.NewGuid().ToString("D"),
              服务器ID = item.Id,
              预警ID = string.Join(",", alertIds),
              类型 = (int)InfoTypeEnum.服务器硬件信息,
              状态 = (int)PushStateTypeEnum.正常,
              上报原始数据 = Strings.ObjectToJson(s),
              创建时间 = item.CurrentTime,
          });

          // Resolve the metric record ID: cache first, then the database, otherwise create a new record.
          if (_cacheIndexId.TryGetValue(s.Id, out string indexId))
          {
              serverInfoModel.ID = indexId;
              dbCloudMonitor.UpdateServerInfo(serverInfoModel);
          }
          else
          {
              var model = dbCloudMonitor.GetServerInfoByServerId(s.Id);
              if (model == null)
              {
                  indexId = Guid.NewGuid().ToString("D");
                  serverInfoModel.ID = indexId;
                  dbCloudMonitor.InsertServerInfo(serverInfoModel);
              }
              else
              {
                  indexId = model.ID;
                  serverInfoModel.ID = indexId;
                  dbCloudMonitor.UpdateServerInfo(serverInfoModel);
              }
              // Indexer instead of Add: Add throws if the key was inserted in the meantime.
              _cacheIndexId[s.Id] = indexId;
          }

          // Append the detail row for this report.
          ServerIndexDetailModel detailModel = new ServerIndexDetailModel();
          detailModel.ID = Guid.NewGuid().ToString("D");
          detailModel.指标ID = indexId;
          detailModel.服务器ID = s.Id;
          detailModel.CPU使用率 = s.CpuOccupancyRate;
          detailModel.内存使用 = s.MemoryUsed;
          detailModel.内存可用 = s.MemoryTotal - s.MemoryUsed;
          detailModel.磁盘使用 = s.DiskUsed;
          detailModel.磁盘可用 = s.DiskTotal - s.DiskUsed;
          detailModel.创建时间 = s.CurrentTime;
          dbCloudMonitor.InsertServerDetail(detailModel);
      }
  }
  /// <summary>
  /// Automatically withdraws an alert once its metric is back to normal, optionally only after the
  /// metric has been normal for a configured number of consecutive reports.
  /// </summary>
  /// <param name="automaticWarning">
  /// The "back to normal" observation. Its <c>ID</c> is used both as the streak cache key and as the key
  /// passed to <c>WithdrawProcessingAlert</c>.
  /// </param>
  private void WithdrawAlert(AutomaticWarningProcessingModel automaticWarning)
  {
      var config = GetCloudMonitorConfig();
      // Duration, counted in reports: how many consecutive observations are required before acting.
      var duration = 1;
      // Frequency of the collecting job; two observations roughly this far apart count as consecutive.
      var frequency = 1;
      switch (automaticWarning.预警类型)
      {
          case (int)AlertTypeEnum.硬件CPU:
              duration = config.AlertConfig.CPU预警持续时间;
              frequency = config.CollectionConfig.服务器硬件信息执行频率;
              break;
          case (int)AlertTypeEnum.硬件内存:
              duration = config.AlertConfig.内存预警持续时间;
              frequency = config.CollectionConfig.服务器硬件信息执行频率;
              break;
          case (int)AlertTypeEnum.硬件磁盘空间:
              duration = config.AlertConfig.磁盘预警续时间;
              frequency = config.CollectionConfig.服务器硬件信息执行频率;
              break;
          case (int)AlertTypeEnum.数据库连接数不足: break;
          case (int)AlertTypeEnum.数据库死锁: break;
          case (int)AlertTypeEnum.服务中断:
              duration = config.AlertConfig.后台服务中断高危;
              frequency = config.CollectionConfig.服务运行状态执行频率;
              break;
          case (int)AlertTypeEnum.自定义指标: break;
          case (int)AlertTypeEnum.采集中断:
              duration = config.AlertConfig.采集服务中断高危;
              frequency = config.CollectionConfig.采集服务中断执行频率;
              break;
          default:
              break;
      }

      // A duration of 1 needs no streak tracking: withdraw right away.
      if (duration == 1)
      {
          WithdrawProcessingAlert(automaticWarning.ID);
          return;
      }

      // Continue the streak only if the previous observation is of the expected type and consecutive.
      if (_cacheDuration.TryGetValue(automaticWarning.ID, out var cached)
          && cached is AutomaticWarningProcessingModel previous)
      {
          var minutes = (automaticWarning.最后修改时间 - previous.最后修改时间).TotalMinutes;
          // Consecutive means the gap equals the job frequency within +/-0.2 minutes. Both bounds must
          // hold; the previous "||" accepted every gap and never reset the streak.
          if (frequency - 0.2 <= minutes && minutes <= frequency + 0.2)
          {
              automaticWarning.连续预警次数 = previous.连续预警次数 + 1;
          }
      }

      // The streak counter starts at 0 while the configured count starts at 1, hence the "- 1".
      if (automaticWarning.连续预警次数 >= duration - 1)
      {
          _cacheDuration.Remove(automaticWarning.ID);
          WithdrawProcessingAlert(automaticWarning.ID);
          return;
      }

      // Not enough consecutive observations yet: remember this one for the next report.
      _cacheDuration[automaticWarning.ID] = automaticWarning;
  }
  /// <summary>
  /// Withdraws the alert identified by an external unique key, if such an alert exists: writes an
  /// automatic handling record, updates the alert state and queues a notice.
  /// </summary>
  /// <param name="外部唯一键">External unique key used to look up the alert.</param>
  void WithdrawProcessingAlert(string 外部唯一键)
  {
      var alert = dbCloudMonitor.GetServerAlertByServerIdAndAlertType(外部唯一键);
      if (alert == null)
      {
          // No alert found for this key: nothing to withdraw.
          return;
      }

      var withdrawal = new ServerAlertProcessModel
      {
          ID = Guid.NewGuid().ToString(),
          预警ID = alert.ID,
          创建时间 = DateTime.Now,
          处理人 = "自动撤回",
          处理说明 = "自动撤回预警,状态已恢复",
          // NOTE(review): 4 is a bare handling-state code; presumably an AlertStateEnum member — confirm.
          处理状态 = 4,
      };
      dbCloudMonitor.InsertServerAlertProcess(withdrawal);
      dbCloudMonitor.ProcessServerAlert(withdrawal.预警ID, withdrawal.处理状态, withdrawal.创建时间);
      // The notice is sent from a thread-pool thread.
      ThreadPool.QueueUserWorkItem(new WaitCallback(SendNotice), alert.ID);
  }
  /// <summary>
  /// Evaluates the CPU, memory and disk usage of one server report against the configured thresholds.
  /// For each metric an orange alert is raised between the warning and the high-risk threshold, a red
  /// alert at or above the high-risk threshold, and otherwise the automatic withdrawal path is run.
  /// </summary>
  /// <param name="serverInfoModel">Current metrics of the server (usage values in percent).</param>
  /// <returns>IDs of the alerts that were actually raised; empty when none was raised.</returns>
  private List<string> ServerInfoAlert(ServerIndexInfoModel serverInfoModel)
  {
      var config = GetCloudMonitorConfig().AlertConfig;
      var alertIds = new List<string>();

      // CPU
      var cpuUsage = Math.Round(serverInfoModel.CPU使用率, 2);
      if (config.CPU使用濒危 <= cpuUsage && cpuUsage < config.CPU使用高危)
      {
          RaiseHardwareUsageAlert(serverInfoModel, (int)AlertTypeEnum.硬件CPU, (int)AlertLevelEnum.橙色预警,
              "CPU使用率", config.CPU使用濒危 + "%", cpuUsage + "%", alertIds);
      }
      else if (config.CPU使用高危 <= cpuUsage)
      {
          RaiseHardwareUsageAlert(serverInfoModel, (int)AlertTypeEnum.硬件CPU, (int)AlertLevelEnum.红色预警,
              "CPU使用率", config.CPU使用高危 + "%", cpuUsage + "%", alertIds);
      }
      else
      {
          WithdrawHardwareUsageAlert(serverInfoModel, (int)AlertTypeEnum.硬件CPU);
      }

      // Memory
      var memoryUsage = Math.Round(serverInfoModel.内存使用率, 2);
      if (config.内存使用濒危 <= memoryUsage && memoryUsage < config.内存使用高危)
      {
          RaiseHardwareUsageAlert(serverInfoModel, (int)AlertTypeEnum.硬件内存, (int)AlertLevelEnum.橙色预警,
              "内存使用率", config.内存使用濒危 + "%", memoryUsage + "%", alertIds);
      }
      else if (config.内存使用高危 <= memoryUsage)
      {
          RaiseHardwareUsageAlert(serverInfoModel, (int)AlertTypeEnum.硬件内存, (int)AlertLevelEnum.红色预警,
              "内存使用率", config.内存使用高危 + "%", memoryUsage + "%", alertIds);
      }
      else
      {
          WithdrawHardwareUsageAlert(serverInfoModel, (int)AlertTypeEnum.硬件内存);
      }

      // Disk
      var diskUsage = Math.Round(serverInfoModel.磁盘使用率, 2);
      if (config.磁盘使用濒危 <= diskUsage && diskUsage < config.磁盘使用高危)
      {
          RaiseHardwareUsageAlert(serverInfoModel, (int)AlertTypeEnum.硬件磁盘空间, (int)AlertLevelEnum.橙色预警,
              "磁盘使用率", config.磁盘使用濒危 + "%", diskUsage + "%", alertIds);
      }
      else if (config.磁盘使用高危 <= diskUsage)
      {
          RaiseHardwareUsageAlert(serverInfoModel, (int)AlertTypeEnum.硬件磁盘空间, (int)AlertLevelEnum.红色预警,
              "磁盘使用率", config.磁盘使用高危 + "%", diskUsage + "%", alertIds);
      }
      else
      {
          WithdrawHardwareUsageAlert(serverInfoModel, (int)AlertTypeEnum.硬件磁盘空间);
      }

      return alertIds;
  }

  /// <summary>
  /// Builds one hardware usage alert detail, passes it through <c>CheckDuration</c> and records the
  /// resulting alert ID when an alert was actually raised.
  /// </summary>
  /// <param name="serverInfoModel">Report supplying the server ID and timestamp.</param>
  /// <param name="alertType">Alert type code (an <c>AlertTypeEnum</c> value cast to int).</param>
  /// <param name="alertLevel">Alert level code (an <c>AlertLevelEnum</c> value cast to int).</param>
  /// <param name="alertName">Display name of the metric.</param>
  /// <param name="thresholdText">Threshold that was reached, already formatted with "%".</param>
  /// <param name="currentText">Current value, already formatted with "%".</param>
  /// <param name="alertIds">Collector that receives the alert ID when it is not empty.</param>
  private void RaiseHardwareUsageAlert(ServerIndexInfoModel serverInfoModel, int alertType, int alertLevel,
      string alertName, string thresholdText, string currentText, List<string> alertIds)
  {
      var detail = new ServerAlertDetailModel
      {
          ID = Guid.NewGuid().ToString("D"),
          预警次数 = 1,
          预警名称 = alertName,
          预警说明 = thresholdText,
          当前值 = currentText,
          预警等级 = alertLevel,
          最后修改时间 = serverInfoModel.最后修改时间,
          服务器ID = serverInfoModel.服务器ID,
          预警类型 = alertType,
      };
      // External unique key: "<alert type>_<server id>".
      detail.外部唯一键 = detail.预警类型 + "_" + detail.服务器ID;

      var alertId = CheckDuration(detail, InsertServerAlert);
      if (!string.IsNullOrEmpty(alertId))
      {
          alertIds.Add(alertId);
      }
  }

  /// <summary>
  /// Runs the automatic withdrawal path for a hardware metric that is below its warning threshold.
  /// </summary>
  /// <param name="serverInfoModel">Report supplying the server ID and timestamp.</param>
  /// <param name="alertType">Alert type code (an <c>AlertTypeEnum</c> value cast to int).</param>
  private void WithdrawHardwareUsageAlert(ServerIndexInfoModel serverInfoModel, int alertType)
  {
      var recovery = new AutomaticWarningProcessingModel
      {
          // Same "<alert type>_<server id>" key the alert itself was raised under.
          ID = alertType + "_" + serverInfoModel.服务器ID,
          预警类型 = alertType,
          预警次数 = 1,
          最后修改时间 = serverInfoModel.最后修改时间
      };
      WithdrawAlert(recovery);
  }
  /// <summary>
  /// Applies the configured "duration" rule to an alert candidate: the alert action is invoked
  /// immediately when the duration is 1, otherwise only after enough consecutive occurrences.
  /// </summary>
  /// <param name="alertModel">The alert candidate; its consecutive-alert counter is updated here.</param>
  /// <param name="action">Callback that raises the alert and returns its ID.</param>
  /// <returns>
  /// The value returned by <paramref name="action"/> when the alert is raised (null if the callback is
  /// null); an empty string when the candidate was only cached.
  /// </returns>
  private string CheckDuration(ServerAlertDetailModel alertModel, Func<ServerAlertDetailModel, string> action)
  {
      var cacheId = alertModel.预警名称 + alertModel.外部唯一键;
      var config = GetCloudMonitorConfig();
      // Duration, counted in reports: how many consecutive alerts are required before acting.
      var duration = 1;
      // Frequency of the collecting job; two alerts roughly this far apart count as consecutive.
      var frequency = 1;
      switch (alertModel.预警类型)
      {
          case (int)AlertTypeEnum.硬件CPU:
              duration = config.AlertConfig.CPU预警持续时间;
              frequency = config.CollectionConfig.服务器硬件信息执行频率;
              break;
          case (int)AlertTypeEnum.硬件内存:
              duration = config.AlertConfig.内存预警持续时间;
              frequency = config.CollectionConfig.服务器硬件信息执行频率;
              break;
          case (int)AlertTypeEnum.硬件磁盘空间:
              duration = config.AlertConfig.磁盘预警续时间;
              frequency = config.CollectionConfig.服务器硬件信息执行频率;
              break;
          case (int)AlertTypeEnum.数据库连接数不足: break;
          case (int)AlertTypeEnum.数据库死锁: break;
          case (int)AlertTypeEnum.服务中断:
              duration = config.AlertConfig.后台服务中断高危;
              frequency = config.CollectionConfig.服务运行状态执行频率;
              break;
          case (int)AlertTypeEnum.自定义指标: break;
          case (int)AlertTypeEnum.采集中断:
              duration = config.AlertConfig.采集服务中断高危;
              frequency = config.CollectionConfig.采集服务中断执行频率;
              break;
          default:
              break;
      }

      // A duration of 1 needs no streak tracking: raise the alert right away.
      if (duration == 1)
      {
          return action?.Invoke(alertModel);
      }

      // Continue the streak only if the previous alert is of the expected type and consecutive.
      if (_cacheDuration.TryGetValue(cacheId, out var cached)
          && cached is ServerAlertDetailModel previous)
      {
          var minutes = (alertModel.最后修改时间 - previous.最后修改时间).TotalMinutes;
          // Consecutive means the gap equals the job frequency within +/-0.2 minutes. Both bounds must
          // hold; the previous "||" accepted every gap and never reset the streak.
          if (frequency - 0.2 <= minutes && minutes <= frequency + 0.2)
          {
              alertModel.连续预警次数 = previous.连续预警次数 + 1;
          }
      }

      // The streak counter starts at 0 while the configured count starts at 1, hence the "- 1".
      if (alertModel.连续预警次数 >= duration - 1)
      {
          _cacheDuration.Remove(cacheId);
          return action?.Invoke(alertModel);
      }

      // Not enough consecutive alerts yet: remember this one for the next report.
      _cacheDuration[cacheId] = alertModel;
      return "";
  }
  1321. #endregion
  1322. #region 数据库连接数信息上报
  /// <summary>
  /// Handles a batch of database connection-count reports: raises an orange or red alert when the
  /// remaining connections fall to the configured thresholds and logs a push record per report.
  /// </summary>
  /// <param name="clientId">
  /// ID of the reporting client. Reports are ignored when no cached project monitor carries this client ID
  /// or when <c>WorkTimeCheckContinue</c> rejects the call.
  /// </param>
  /// <param name="dbConnectInfos">One result per database; unsuccessful results are only logged as abnormal.</param>
  public void ReceiveDbConnectInfo(string clientId, List<Ret<DbConnectInfo>> dbConnectInfos)
  {
      var clientIsMonitored = GetProjectMonitor().Any(m => m.客户端ID == clientId);
      if (!clientIsMonitored) return;
      if (!WorkTimeCheckContinue(clientId + "ReceiveDbConnectInfo")) return;

      var thresholds = GetCloudMonitorConfig().AlertConfig;
      foreach (var report in dbConnectInfos)
      {
          if (!report.Success)
          {
              // Collection failed on the client: keep the error message as an abnormal push record.
              var failure = new PushIndexDataModel
              {
                  ID = Guid.NewGuid().ToString("D"),
                  服务器ID = report.Id,
                  预警ID = "",
                  类型 = (int)InfoTypeEnum.数据库连接数,
                  状态 = (int)PushStateTypeEnum.异常,
                  上报原始数据 = report.Msg,
                  创建时间 = report.CurrentTime,
                  外部唯一键 = report.ExternalId
              };
              InsertPushIndexDataByServerId(failure);
              continue;
          }

          var info = report.Data;
          var remain = info.ConnectTotal - info.ConnectUsed;

          // Red at or below the high-risk threshold; orange above it but at or below the warning threshold.
          int? level = null;
          if (remain <= thresholds.数据库剩余连接高危)
          {
              level = (int)AlertLevelEnum.红色预警;
          }
          else if (remain <= thresholds.数据库剩余连接濒危)
          {
              level = (int)AlertLevelEnum.橙色预警;
          }

          var alertId = "";
          if (level.HasValue)
          {
              var detail = new ServerAlertDetailModel
              {
                  ID = Guid.NewGuid().ToString("D"),
                  预警次数 = 1,
                  预警名称 = "数据库连接数不足",
                  预警说明 = Strings.ObjectToJson(info),
                  当前值 = remain.ToString(),
                  预警等级 = level.Value,
                  最后修改时间 = info.CurrentTime,
                  服务器ID = info.Id,
                  预警类型 = (int)AlertTypeEnum.数据库连接数不足
              };
              detail.外部唯一键 = detail.预警类型 + "_" + detail.服务器ID;
              alertId = CheckDuration(detail, InsertServerAlert);
          }

          // Log the raw report together with the alert ID (empty when no alert was raised).
          var record = new PushIndexDataModel
          {
              ID = Guid.NewGuid().ToString("D"),
              服务器ID = report.Id,
              预警ID = alertId,
              类型 = (int)InfoTypeEnum.数据库连接数,
              状态 = (int)PushStateTypeEnum.正常,
              上报原始数据 = Strings.ObjectToJson(info),
              创建时间 = report.CurrentTime,
              外部唯一键 = report.ExternalId
          };
          InsertPushIndexDataByServerId(record);
      }
  }
  1403. #endregion
  1404. #region 数据库死锁信息上报
  /// <summary>
  /// Handles a batch of database lock reports: raises a red alert whenever the reported lock count is
  /// above zero and logs a push record per report.
  /// </summary>
  /// <param name="clientId">
  /// ID of the reporting client. Reports are ignored when no cached project monitor carries this client ID
  /// or when <c>WorkTimeCheckContinue</c> rejects the call.
  /// </param>
  /// <param name="dbLockedInfos">One result per database; unsuccessful results are only logged as abnormal.</param>
  public void ReceiveDbLockedInfo(string clientId, List<Ret<DbLockedInfo>> dbLockedInfos)
  {
      var clientIsMonitored = GetProjectMonitor().Any(m => m.客户端ID == clientId);
      if (!clientIsMonitored) return;
      if (!WorkTimeCheckContinue(clientId + "ReceiveDbLockedInfo")) return;

      foreach (var report in dbLockedInfos)
      {
          if (!report.Success)
          {
              // Collection failed on the client: keep the error message as an abnormal push record.
              var failure = new PushIndexDataModel
              {
                  ID = Guid.NewGuid().ToString("D"),
                  服务器ID = report.Id,
                  预警ID = "",
                  类型 = (int)InfoTypeEnum.数据库死锁,
                  状态 = (int)PushStateTypeEnum.异常,
                  上报原始数据 = report.Msg,
                  创建时间 = report.CurrentTime,
                  外部唯一键 = report.ExternalId
              };
              InsertPushIndexDataByServerId(failure);
              continue;
          }

          var info = report.Data;
          var alertId = "";
          var hasLocks = info.Lockused > 0;
          if (hasLocks)
          {
              var detail = new ServerAlertDetailModel
              {
                  ID = Guid.NewGuid().ToString("D"),
                  预警次数 = 1,
                  预警名称 = "数据库死锁",
                  预警说明 = Strings.ObjectToJson(info),
                  当前值 = info.Lockused.ToString(),
                  预警等级 = (int)AlertLevelEnum.红色预警,
                  最后修改时间 = info.CurrentTime,
                  服务器ID = info.Id,
                  预警类型 = (int)AlertTypeEnum.数据库死锁
              };
              detail.外部唯一键 = detail.预警类型 + "_" + detail.服务器ID;
              alertId = CheckDuration(detail, InsertServerAlert);
          }

          // Log the raw report together with the alert ID (empty when no alert was raised).
          var record = new PushIndexDataModel
          {
              ID = Guid.NewGuid().ToString("D"),
              服务器ID = report.Id,
              预警ID = alertId,
              类型 = (int)InfoTypeEnum.数据库死锁,
              状态 = (int)PushStateTypeEnum.正常,
              上报原始数据 = Strings.ObjectToJson(info),
              创建时间 = report.CurrentTime,
              外部唯一键 = report.ExternalId
          };
          InsertPushIndexDataByServerId(record);
      }
  }
  1466. #endregion
  1467. #region 服务发现信息上报
  /// <summary>
  /// Handles a batch of service-discovery reports: raises a red alert for every service whose status
  /// is not "passing" and logs a push record per report.
  /// </summary>
  /// <param name="clientId">
  /// ID of the reporting client. Reports are ignored when no cached project monitor carries this client ID
  /// or when <c>WorkTimeCheckContinue</c> rejects the call.
  /// </param>
  /// <param name="serviceWorkStateInfos">One result per server; unsuccessful results are only logged as abnormal.</param>
  public void ReceiveServiceWorkStateInfo(string clientId, List<Ret<ServiceWorkStateInfo>> serviceWorkStateInfos)
  {
      // Ignore clients that have no project monitor entry.
      if (!GetProjectMonitor().Any(m => m.客户端ID == clientId)) return;
      if (!WorkTimeCheckContinue(clientId + "ReceiveServiceWorkStateInfo")) return;

      foreach (var item in serviceWorkStateInfos)
      {
          if (!item.Success)
          {
              // Collection failed on the client: keep the error message as an abnormal push record.
              InsertPushIndexDataByServerId(new PushIndexDataModel()
              {
                  ID = Guid.NewGuid().ToString("D"),
                  服务器ID = item.Id,
                  预警ID = "",
                  类型 = (int)InfoTypeEnum.服务运行状态,
                  状态 = (int)PushStateTypeEnum.异常,
                  上报原始数据 = item.Msg,
                  创建时间 = item.CurrentTime,
              });
              continue;
          }

          var info = item.Data;
          // Every raised alert is kept; a single variable used to be overwritten on each iteration, so
          // only the last service's result (possibly an empty string) reached the push record.
          var alertIds = new List<string>();

          // A report without a service list has nothing to check; iterating a null list would throw.
          if (info?.ServiceWorkStates != null)
          {
              foreach (var state in info.ServiceWorkStates)
              {
                  if (state.Status == "passing") continue;

                  ServerAlertDetailModel model = new ServerAlertDetailModel
                  {
                      ID = Guid.NewGuid().ToString("D"),
                      预警次数 = 1,
                      预警名称 = state.ServiceName,
                      预警说明 = Strings.ObjectToJson(state),
                      当前值 = state.Status,
                      预警等级 = (int)AlertLevelEnum.红色预警,
                      最后修改时间 = info.CurrentTime,
                      服务器ID = info.Id,
                      预警类型 = (int)AlertTypeEnum.服务中断
                  };
                  model.外部唯一键 = model.预警类型 + "_" + model.服务器ID;

                  var alertId = CheckDuration(model, InsertServerAlert);
                  if (!string.IsNullOrEmpty(alertId))
                  {
                      alertIds.Add(alertId);
                  }
              }
          }

          // Log the raw report with the comma-separated alert IDs, the same format ReceiveServerInfo uses.
          InsertPushIndexDataByServerId(new PushIndexDataModel()
          {
              ID = Guid.NewGuid().ToString("D"),
              服务器ID = item.Id,
              预警ID = string.Join(",", alertIds.Distinct()),
              类型 = (int)InfoTypeEnum.服务运行状态,
              状态 = (int)PushStateTypeEnum.正常,
              上报原始数据 = Strings.ObjectToJson(info),
              创建时间 = item.CurrentTime,
          });
      }
  }
  1529. #endregion
  1530. #region 自定义预警信息上报
  /// <summary>
  /// Handles one custom-metric report: raises a red alert whenever the report carries a value and
  /// logs a push record for the report.
  /// </summary>
  /// <param name="clientId">ID of the reporting client; ignored when no cached project monitor carries it.</param>
  /// <param name="item">The report; an unsuccessful result is only logged as abnormal.</param>
  public void ReceiveDbCustomAlertInfo(string clientId, Ret<DbCustomAlertInfo> item)
  {
      var clientIsMonitored = GetProjectMonitor().Any(m => m.客户端ID == clientId);
      if (!clientIsMonitored) return;

      if (!item.Success)
      {
          // Collection failed on the client: keep the error message as an abnormal push record.
          var failure = new PushIndexDataModel
          {
              ID = Guid.NewGuid().ToString("D"),
              服务器ID = item.Id,
              预警ID = "",
              类型 = (int)InfoTypeEnum.自定义预警,
              状态 = (int)PushStateTypeEnum.异常,
              上报原始数据 = item.Msg,
              创建时间 = item.CurrentTime,
              外部唯一键 = item.ExternalId
          };
          InsertPushIndexDataByServerId(failure);
          return;
      }

      var info = item.Data;
      var alertId = "";
      if (info.Value != null)
      {
          var detail = new ServerAlertDetailModel
          {
              ID = Guid.NewGuid().ToString("D"),
              预警次数 = 1,
              预警名称 = info.CustomId,
              预警说明 = Strings.ObjectToJson(info),
              当前值 = info.Value,
              预警等级 = (int)AlertLevelEnum.红色预警,
              最后修改时间 = info.CurrentTime,
              服务器ID = info.Id,
              预警类型 = (int)AlertTypeEnum.自定义指标,
          };
          // Keyed by the custom metric ID rather than the server ID.
          detail.外部唯一键 = detail.预警类型 + "_" + info.CustomId;
          alertId = CheckDuration(detail, InsertServerAlert);
      }

      // Log the raw report together with the alert ID (empty when no alert was raised).
      var record = new PushIndexDataModel
      {
          ID = Guid.NewGuid().ToString("D"),
          服务器ID = item.Id,
          预警ID = alertId,
          类型 = (int)InfoTypeEnum.自定义预警,
          状态 = (int)PushStateTypeEnum.正常,
          上报原始数据 = Strings.ObjectToJson(info),
          创建时间 = item.CurrentTime,
          外部唯一键 = item.ExternalId
      };
      InsertPushIndexDataByServerId(record);
  }
  1589. #endregion
  1590. #region 自定义服务信息上报
  /// <summary>
  /// Handles one custom-service report: parses the reported value, raises an alert at the level the
  /// value declares, and logs a push record for the report.
  /// </summary>
  /// <param name="clientId">ID of the reporting client; ignored when no cached project monitor carries it.</param>
  /// <param name="item">The report; an unsuccessful result is only logged as abnormal.</param>
  public void ReceiveCustomServiceInfo(string clientId, Ret<CustomServiceInfo> item)
  {
      var clientIsMonitored = GetProjectMonitor().Any(m => m.客户端ID == clientId);
      if (!clientIsMonitored) return;

      // Both failure paths log the same abnormal record and differ only in the raw-data text.
      PushIndexDataModel AbnormalRecord(string rawData)
      {
          return new PushIndexDataModel
          {
              ID = Guid.NewGuid().ToString("D"),
              服务器ID = item.Id,
              预警ID = "",
              类型 = (int)InfoTypeEnum.自定义服务,
              状态 = (int)PushStateTypeEnum.异常,
              上报原始数据 = rawData,
              创建时间 = item.CurrentTime,
              外部唯一键 = item.ExternalId
          };
      }

      if (!item.Success)
      {
          InsertPushIndexDataByServerId(AbnormalRecord(item.Msg));
          return;
      }

      var info = item.Data;
      var alertId = "";
      if (info.Value != null)
      {
          try
          {
              var service = dbCloudMonitor.GetCustomServiceInfoById(info.CustomServiceId);
              var analysis = Strings.JsonToModel<CustomServiceAnalysis>(info.Value);
              // NOTE(review): a non-positive level leaves without writing any push record, unlike the
              // other Receive* handlers — confirm this is intended.
              if (analysis.预警类型 <= 0) return;

              var detail = new ServerAlertDetailModel
              {
                  ID = Guid.NewGuid().ToString("D"),
                  预警次数 = 1,
                  预警名称 = service.服务名称,
                  预警说明 = Strings.ObjectToJson(info),
                  当前值 = info.Value,
                  预警等级 = analysis.预警类型,
                  项目ID = service.项目ID,
                  最后修改时间 = info.CurrentTime,
                  预警类型 = (int)AlertTypeEnum.自定义服务,
              };
              // Keyed by the custom service ID.
              detail.外部唯一键 = detail.预警类型 + "_" + info.CustomServiceId;
              alertId = CheckDuration(detail, InsertServerAlert);
          }
          catch (Exception ex)
          {
              // Any failure while evaluating the report is logged as an abnormal record.
              InsertPushIndexDataByServerId(AbnormalRecord("处理数据异常:" + ex.Message + " 原始内容:" + item.Msg));
              return;
          }
      }

      // Log the raw report together with the alert ID (empty when no alert was raised).
      var record = new PushIndexDataModel
      {
          ID = Guid.NewGuid().ToString("D"),
          服务器ID = item.Id,
          预警ID = alertId,
          类型 = (int)InfoTypeEnum.自定义服务,
          状态 = (int)PushStateTypeEnum.正常,
          上报原始数据 = Strings.ObjectToJson(info),
          创建时间 = item.CurrentTime,
          外部唯一键 = item.ExternalId
      };
      InsertPushIndexDataByServerId(record);
  }
  1669. #endregion
  1670. #region 服务器定时任务
  /// <summary>
  /// Data cleaning job: deletes server index data and push-index data through the
  /// data-access layer and logs the value each delete call returns.
  /// Exceptions are logged and not rethrown.
  /// </summary>
  public void DataCleaning()
  {
      try
      {
          Log.Info("数据清理:开始");

          var serverIndexDeleted = dbCloudMonitor.DeleteServerIndexData();
          Log.Info($"数据清理:服务器指标明{serverIndexDeleted}条");

          var pushIndexDeleted = dbCloudMonitor.DeletePushIndexData();
          Log.Info($"数据清理:上报指标记录{pushIndexDeleted}条");

          Log.Info("数据清理:结束");
      }
      catch (Exception ex)
      {
          // Best effort: a failed cleanup is only logged.
          Log.Info("数据清理:错误:" + ex.Message);
      }
  }
  /// <summary>
  /// Scheduled job: estimates the remaining disk days for the servers of every monitored
  /// project, raises alerts where the estimate is at or below the configured thresholds,
  /// and then always runs <see cref="DataCleaning"/>.
  /// Exceptions raised by the scan are logged and not rethrown.
  /// </summary>
  public void DiskAvailabilityScanning()
  {
      try
      {
          Log.Info("磁盘可用天数:开始");
          ScanDiskAvailableDays();
          Log.Info("磁盘可用天数:结束");
      }
      catch (Exception ex)
      {
          Log.Info("磁盘可用天数:错误:" + ex.Message);
      }

      // Data cleaning. It must run whether or not there was anything to scan; an early
      // `return` inside the try block used to skip it when no project was monitored.
      DataCleaning();
  }

  /// <summary>
  /// Performs the disk scan for <see cref="DiskAvailabilityScanning"/>: for each server it
  /// compares the push record looked up for "one day ago" with the one looked up for "now",
  /// derives the free space consumed in between and, from that, the number of days the
  /// remaining free space would last.
  /// </summary>
  private void ScanDiskAvailableDays()
  {
      var nowTime = DateTime.Now;
      var lastTime = nowTime.AddDays(-1);
      var config = GetCloudMonitorConfig().AlertConfig;
      var projectList = GetProjectMonitor();
      if (!projectList.Any())
      {
          return;
      }

      var projectIds = string.Join(",", projectList.Select(m => m.项目ID).ToList());
      var serverInfoList = GetServerByItemId(projectIds);
      foreach (var project in projectList)
      {
          // Servers of this project.
          var serverInfos = serverInfoList.Where(m => m.项目ID == project.项目ID);
          var lastIndexData = dbCloudMonitor.GetPushIndexDataByServerInfo(project.项目ID, lastTime);
          var nowIndexData = dbCloudMonitor.GetPushIndexDataByServerInfo(project.项目ID, nowTime);
          foreach (var serverInfo in serverInfos)
          {
              var lastIndex = lastIndexData.FirstOrDefault(m => m.服务器ID == serverInfo.ID);
              var nowIndex = nowIndexData.FirstOrDefault(m => m.服务器ID == serverInfo.ID);

              // Both samples are required to compute a daily delta.
              if (lastIndex == null || nowIndex == null)
              {
                  continue;
              }

              if (lastIndex.状态 != (int)PushStateTypeEnum.正常 || nowIndex.状态 != (int)PushStateTypeEnum.正常)
              {
                  // One of the samples is not in the normal state; an alert could be raised here.
                  continue;
              }

              var lastInfo = Strings.JsonToModel<ServerInfo>(lastIndex.上报原始数据);
              var nowInfo = Strings.JsonToModel<ServerInfo>(nowIndex.上报原始数据);
              var oldDisk = lastInfo.DiskTotal - lastInfo.DiskUsed;
              var nowDisk = nowInfo.DiskTotal - nowInfo.DiskUsed;

              // Free space consumed between the two samples.
              var oneDayUse = oldDisk - nowDisk;

              // Usage of 10 or less is treated as "no usage" and not recorded
              // (the original note speaks of 10M - unit presumably MB, TODO confirm).
              if (!(oneDayUse > 10))
              {
                  continue;
              }

              // Estimated number of days until the remaining free space is used up.
              var availableDay = nowDisk / oneDayUse;

              // Two configured tiers: (high-risk, endangered] and (.., high-risk].
              // NOTE(review): both tiers currently raise the same red-level alert - confirm
              // whether the first tier was meant to use a lower level.
              var inEndangeredTier = config.磁盘预计可用天数高危 < availableDay && availableDay <= config.磁盘预计可用天数濒危;
              var inHighRiskTier = availableDay <= config.磁盘预计可用天数高危;
              if (inEndangeredTier || inHighRiskTier)
              {
                  ServerAlertDetailModel model = new ServerAlertDetailModel
                  {
                      ID = Guid.NewGuid().ToString("D"),
                      预警次数 = 1,
                      预警名称 = "磁盘可用天数不足",
                      预警说明 = "",
                      当前值 = availableDay.ToString(),
                      预警等级 = (int)AlertLevelEnum.红色预警,
                      最后修改时间 = DateTime.Now,
                      服务器ID = serverInfo.ID,
                      预警类型 = (int)AlertTypeEnum.磁盘可用天数
                  };
                  // The external key is "<alert type>_<server ID>".
                  model.外部唯一键 = model.预警类型 + "_" + model.服务器ID;
                  CheckDuration(model, InsertServerAlert);
              }
          }
      }
  }
  /// <summary>
  /// Scheduled job: checks, for every monitored project, whether the expected reports
  /// (hardware info, service running state, database connections, database deadlocks) are
  /// present. When every expected report of a project is missing or late, one project-level
  /// alert is raised; otherwise each individual alert is raised on its own.
  /// Exceptions are logged and not rethrown.
  /// </summary>
  public void CollectionInterruptScanning()
  {
      try
      {
          Log.Info("采集中断:开始");
          var config = GetCloudMonitorConfig().CollectionConfig;
          var projectList = GetProjectMonitor();
          if (!projectList.Any()) return;
          var projectIds = string.Join(",", projectList.Select(m => m.项目ID).ToList());
          var serverInfoList = GetServerByItemId(projectIds);
          foreach (var project in projectList)
          {
              var list = new List<ServerAlertDetailModel>();
              var indexData = dbCloudMonitor.GetPushIndexDataByProjectId(project.项目ID, config.采集服务中断执行频率);

              // Servers of this project, materialized once because the list is used several times below.
              var serverInfos = serverInfoList.Where(m => m.项目ID == project.项目ID).ToList();
              list.AddRange(HandleServerInfo(serverInfos, indexData.Where(m => m.类型 == (int)InfoTypeEnum.服务器硬件信息)));

              // Service-discovery servers: installed-services list contains "7".
              var serviceDiscoverys = serverInfos.Where(m => m.安装服务?.Split(',')?.Contains("7") == true).ToList();
              list.AddRange(HandleServiceDiscovery(serviceDiscoverys, indexData.Where(m => m.类型 == (int)InfoTypeEnum.服务运行状态)));

              // Database servers: installed-services list contains "9".
              var dbServers = serverInfos.Where(m => m.安装服务?.Split(',')?.Contains("9") == true).ToList();
              list.AddRange(HandleDbConnect(dbServers, indexData.Where(m => m.类型 == (int)InfoTypeEnum.数据库连接数)));
              list.AddRange(HandleDbLocked(dbServers, indexData.Where(m => m.类型 == (int)InfoTypeEnum.数据库死锁)));

              // Number of checks performed: one per server, one per service-discovery server,
              // and two per database (connection count + deadlock).
              var total = serverInfos.Count + serviceDiscoverys.Count + (dbServers.Sum(m => m.数据库.Count) * 2);

              // Alerts that mean "no timely data", i.e. everything except the "状态异常" ones.
              var interrupted = list.Count(m => m.预警说明 != "状态异常");

              // Every check failed: the whole project is interrupted. `total > 0` prevents a
              // project without any server from trivially matching (0 == 0).
              if (total > 0 && total == interrupted)
              {
                  CheckDuration(new ServerAlertDetailModel()
                  {
                      ID = Guid.NewGuid().ToString("D"),
                      预警次数 = 1,
                      预警名称 = "前置机中断",
                      预警说明 = "未能查询到上报数据",
                      当前值 = "",
                      预警等级 = (int)AlertLevelEnum.红色预警,
                      最后修改时间 = DateTime.Now,
                      服务器ID = "",
                      预警类型 = (int)AlertTypeEnum.采集中断,
                      项目ID = project.项目ID,
                      外部唯一键 = (int)AlertTypeEnum.采集中断 + "_" + project.项目ID
                  }, InsertServerAlert);
              }
              else
              {
                  foreach (var item in list)
                  {
                      CheckDuration(item, InsertServerAlert);
                  }
              }
          }
          Log.Info("采集中断:结束");
      }
      catch (Exception ex)
      {
          Log.Info("采集中断:错误:" + ex.Message);
      }
  }
  /// <summary>
  /// Builds collection-interrupt alerts for the hardware-info reports of the given servers.
  /// </summary>
  /// <param name="data">Servers to check.</param>
  /// <param name="indexData">Push records to search for each server's latest report.</param>
  /// <returns>
  /// One alert for each server whose latest report is missing, older than the configured
  /// frequency (plus tolerance), or in the abnormal state; an empty list when none applies.
  /// </returns>
  private List<ServerAlertDetailModel> HandleServerInfo(List<ServerInfoModel> data, IEnumerable<PushIndexDataModel> indexData)
  {
      var config = GetCloudMonitorConfig().CollectionConfig;
      var frequency = config.服务器硬件信息执行频率;
      var list = new List<ServerAlertDetailModel>();
      foreach (var serverInfo in data)
      {
          // The three alert variants differ only in description and current value.
          ServerAlertDetailModel BuildAlert(string description, string currentValue)
          {
              return new ServerAlertDetailModel()
              {
                  ID = Guid.NewGuid().ToString("D"),
                  预警次数 = 1,
                  预警名称 = "服务器硬件信息中断",
                  预警说明 = description,
                  当前值 = currentValue,
                  预警等级 = (int)AlertLevelEnum.红色预警,
                  最后修改时间 = DateTime.Now,
                  服务器ID = serverInfo.ID,
                  预警类型 = (int)AlertTypeEnum.采集中断,
                  外部唯一键 = (int)AlertTypeEnum.采集中断 + "_" + (int)InfoTypeEnum.服务器硬件信息 + "_" + serverInfo.ID
              };
          }

          // Latest record of this server.
          var lastIndex = indexData.Where(m => m.服务器ID == serverInfo.ID)
              .OrderByDescending(m => m.创建时间).FirstOrDefault();

          // No record at all: the collection is interrupted.
          if (lastIndex == null)
          {
              list.Add(BuildAlert("未能查询到上报数据", ""));
              continue;
          }

          var timeSpan = DateTime.Now - lastIndex.创建时间;
          var minutes = timeSpan.TotalMinutes;

          // The report is on time when its age does not exceed the frequency plus a
          // 0.2-minute tolerance. The previous test
          // (frequency - 0.2 <= minutes || minutes <= frequency + 0.2) was true for every
          // value, which made the "late" branch below unreachable.
          if (minutes <= frequency + 0.2)
          {
              // Reported in time; now check whether the report itself is valid.
              if (lastIndex.状态 == (int)PushStateTypeEnum.异常)
              {
                  list.Add(BuildAlert("状态异常", $"异常说明:{lastIndex.上报原始数据}"));
              }
          }
          else
          {
              // No report arrived within the expected period.
              list.Add(BuildAlert("预定时间未能成功上报数据", $"上次上报时间:{lastIndex.创建时间:yyyy-MM-dd HH:mm:ss}"));
          }
      }
      return list;
  }
  /// <summary>
  /// Builds collection-interrupt alerts for the service-running-state reports of the given servers.
  /// </summary>
  /// <param name="data">Servers to check.</param>
  /// <param name="indexData">Push records to search for each server's latest report.</param>
  /// <returns>
  /// One alert for each server whose latest report is missing, older than the configured
  /// frequency (plus tolerance), or in the abnormal state; an empty list when none applies.
  /// </returns>
  private List<ServerAlertDetailModel> HandleServiceDiscovery(List<ServerInfoModel> data, IEnumerable<PushIndexDataModel> indexData)
  {
      var config = GetCloudMonitorConfig().CollectionConfig;
      var frequency = config.服务运行状态执行频率;
      var list = new List<ServerAlertDetailModel>();
      foreach (var serverInfo in data)
      {
          // The three alert variants differ only in description and current value.
          ServerAlertDetailModel BuildAlert(string description, string currentValue)
          {
              return new ServerAlertDetailModel()
              {
                  ID = Guid.NewGuid().ToString("D"),
                  预警次数 = 1,
                  预警名称 = "服务运行状态中断",
                  预警说明 = description,
                  当前值 = currentValue,
                  预警等级 = (int)AlertLevelEnum.红色预警,
                  最后修改时间 = DateTime.Now,
                  服务器ID = serverInfo.ID,
                  预警类型 = (int)AlertTypeEnum.采集中断,
                  外部唯一键 = (int)AlertTypeEnum.采集中断 + "_" + (int)InfoTypeEnum.服务运行状态 + "_" + serverInfo.ID
              };
          }

          // Latest record of this server.
          var lastIndex = indexData.Where(m => m.服务器ID == serverInfo.ID)
              .OrderByDescending(m => m.创建时间).FirstOrDefault();

          // No record at all: the collection is interrupted.
          if (lastIndex == null)
          {
              list.Add(BuildAlert("未能查询到上报数据", ""));
              continue;
          }

          var timeSpan = DateTime.Now - lastIndex.创建时间;
          var minutes = timeSpan.TotalMinutes;

          // The report is on time when its age does not exceed the frequency plus a
          // 0.2-minute tolerance. The previous test
          // (frequency - 0.2 <= minutes || minutes <= frequency + 0.2) was true for every
          // value, which made the "late" branch below unreachable.
          if (minutes <= frequency + 0.2)
          {
              // Reported in time; now check whether the report itself is valid.
              if (lastIndex.状态 == (int)PushStateTypeEnum.异常)
              {
                  list.Add(BuildAlert("状态异常", $"异常说明:{lastIndex.上报原始数据}"));
              }
          }
          else
          {
              // No report arrived within the expected period.
              list.Add(BuildAlert("预定时间未能成功上报数据", $"上次上报时间:{lastIndex.创建时间:yyyy-MM-dd HH:mm:ss}"));
          }
      }
      return list;
  }
  /// <summary>
  /// Builds collection-interrupt alerts for the database-connection-count reports of every
  /// database on the given servers.
  /// </summary>
  /// <param name="data">Database servers to check; each server's database list is iterated.</param>
  /// <param name="indexData">Push records to search; a record belongs to a database when its external key equals the database ID.</param>
  /// <returns>
  /// One alert for each database whose latest report is missing, older than the configured
  /// frequency (plus tolerance), or in the abnormal state; an empty list when none applies.
  /// </returns>
  private List<ServerAlertDetailModel> HandleDbConnect(List<ServerInfoModel> data, IEnumerable<PushIndexDataModel> indexData)
  {
      var config = GetCloudMonitorConfig().CollectionConfig;
      var frequency = config.数据库连接数执行频率;
      var list = new List<ServerAlertDetailModel>();
      foreach (var serverInfo in data)
      {
          foreach (var dbInfo in serverInfo.数据库)
          {
              // The three alert variants differ only in description and current value.
              // The key has no separator between the info type and the database ID; it is
              // kept exactly as before so previously stored keys still match.
              ServerAlertDetailModel BuildAlert(string description, string currentValue)
              {
                  return new ServerAlertDetailModel()
                  {
                      ID = Guid.NewGuid().ToString("D"),
                      预警次数 = 1,
                      预警名称 = "数据库连接数中断",
                      预警说明 = description,
                      当前值 = currentValue,
                      预警等级 = (int)AlertLevelEnum.红色预警,
                      最后修改时间 = DateTime.Now,
                      服务器ID = serverInfo.ID,
                      预警类型 = (int)AlertTypeEnum.采集中断,
                      外部唯一键 = (int)AlertTypeEnum.采集中断 + "_" + (int)InfoTypeEnum.数据库连接数 + dbInfo.ID + "_" + serverInfo.ID
                  };
              }

              // Latest record of this database on this server.
              var lastIndex = indexData.Where(m => m.服务器ID == serverInfo.ID)
                  .Where(m => m.外部唯一键 == dbInfo.ID)
                  .OrderByDescending(m => m.创建时间).FirstOrDefault();

              // No record at all: the collection is interrupted.
              if (lastIndex == null)
              {
                  list.Add(BuildAlert("未能查询到上报数据", ""));
                  continue;
              }

              var timeSpan = DateTime.Now - lastIndex.创建时间;
              var minutes = timeSpan.TotalMinutes;

              // The report is on time when its age does not exceed the frequency plus a
              // 0.2-minute tolerance. The previous test
              // (frequency - 0.2 <= minutes || minutes <= frequency + 0.2) was true for every
              // value, which made the "late" branch below unreachable.
              if (minutes <= frequency + 0.2)
              {
                  // Reported in time; now check whether the report itself is valid.
                  if (lastIndex.状态 == (int)PushStateTypeEnum.异常)
                  {
                      list.Add(BuildAlert("状态异常", $"异常说明:{lastIndex.上报原始数据}"));
                  }
              }
              else
              {
                  // No report arrived within the expected period.
                  list.Add(BuildAlert("预定时间未能成功上报数据", $"上次上报时间:{lastIndex.创建时间:yyyy-MM-dd HH:mm:ss}"));
              }
          }
      }
      return list;
  }
  /// <summary>
  /// Builds collection-interrupt alerts for the database-deadlock reports of every database
  /// on the given servers.
  /// </summary>
  /// <param name="data">Database servers to check; each server's database list is iterated.</param>
  /// <param name="indexData">Push records to search; a record belongs to a database when its external key equals the database ID.</param>
  /// <returns>
  /// One alert for each database whose latest report is missing, older than the configured
  /// frequency (plus tolerance), or in the abnormal state; an empty list when none applies.
  /// </returns>
  private List<ServerAlertDetailModel> HandleDbLocked(List<ServerInfoModel> data, IEnumerable<PushIndexDataModel> indexData)
  {
      var config = GetCloudMonitorConfig().CollectionConfig;
      var frequency = config.数据库死锁执行频率;
      var list = new List<ServerAlertDetailModel>();
      foreach (var serverInfo in data)
      {
          foreach (var dbInfo in serverInfo.数据库)
          {
              // The three alert variants differ only in description and current value.
              // The key has no separator between the info type and the database ID; it is
              // kept exactly as before so previously stored keys still match.
              ServerAlertDetailModel BuildAlert(string description, string currentValue)
              {
                  return new ServerAlertDetailModel()
                  {
                      ID = Guid.NewGuid().ToString("D"),
                      预警次数 = 1,
                      预警名称 = "数据库死锁中断",
                      预警说明 = description,
                      当前值 = currentValue,
                      预警等级 = (int)AlertLevelEnum.红色预警,
                      最后修改时间 = DateTime.Now,
                      服务器ID = serverInfo.ID,
                      预警类型 = (int)AlertTypeEnum.采集中断,
                      外部唯一键 = (int)AlertTypeEnum.采集中断 + "_" + (int)InfoTypeEnum.数据库死锁 + dbInfo.ID + "_" + serverInfo.ID
                  };
              }

              // Latest record of this database on this server.
              var lastIndex = indexData.Where(m => m.服务器ID == serverInfo.ID)
                  .Where(m => m.外部唯一键 == dbInfo.ID)
                  .OrderByDescending(m => m.创建时间).FirstOrDefault();

              // No record at all: the collection is interrupted.
              if (lastIndex == null)
              {
                  list.Add(BuildAlert("未能查询到上报数据", ""));
                  continue;
              }

              var timeSpan = DateTime.Now - lastIndex.创建时间;
              var minutes = timeSpan.TotalMinutes;

              // The report is on time when its age does not exceed the frequency plus a
              // 0.2-minute tolerance. The previous test
              // (frequency - 0.2 <= minutes || minutes <= frequency + 0.2) was true for every
              // value, which made the "late" branch below unreachable.
              if (minutes <= frequency + 0.2)
              {
                  // Reported in time; now check whether the report itself is valid.
                  if (lastIndex.状态 == (int)PushStateTypeEnum.异常)
                  {
                      list.Add(BuildAlert("状态异常", $"异常说明:{lastIndex.上报原始数据}"));
                  }
              }
              else
              {
                  // No report arrived within the expected period.
                  list.Add(BuildAlert("预定时间未能成功上报数据", $"上次上报时间:{lastIndex.创建时间:yyyy-MM-dd HH:mm:ss}"));
              }
          }
      }
      return list;
  }
  2155. #endregion
  2156. #region 工作时间
  /// <summary>
  /// Length of one throttling cycle: while <see cref="IsWorkTime"/> is true, only every
  /// 15th call of <see cref="WorkTimeCheckContinue"/> for a given ID returns true.
  /// NOTE(review): the original comment called this the collection frequency for
  /// non-working hours, but the code applies it when IsWorkTime() is true - confirm.
  /// </summary>
  private const int workFrequency = 15;

  /// <summary>
  /// Per-ID call counters used by <see cref="WorkTimeCheckContinue"/>.
  /// NOTE(review): a plain static Dictionary with no synchronization - confirm callers do
  /// not invoke the check concurrently.
  /// </summary>
  private static Dictionary<string, int> _cacheWorkTime = new Dictionary<string, int>();

  /// <summary>
  /// Decides whether processing for the given ID should continue, throttling calls made
  /// while <see cref="IsWorkTime"/> is true.
  /// </summary>
  /// <param name="id">Key under which the call counter is kept.</param>
  /// <returns>
  /// Always true when <see cref="IsWorkTime"/> is false; otherwise true on every
  /// <see cref="workFrequency"/>-th call for this ID and false on the calls in between.
  /// </returns>
  private bool WorkTimeCheckContinue(string id)
  {
      // Outside the configured window there is no throttling.
      if (!IsWorkTime())
      {
          return true;
      }

      // First call for this ID: start counting.
      if (!_cacheWorkTime.TryGetValue(id, out var count))
      {
          _cacheWorkTime[id] = 1;
          return false;
      }

      count++;
      if (count >= workFrequency)
      {
          // Cycle complete: let this call through and start over.
          _cacheWorkTime[id] = 0;
          return true;
      }

      // Store the incremented counter. `count` is only a copy of the dictionary value;
      // without this write the counter stayed at 1 and the method returned false forever.
      _cacheWorkTime[id] = count;
      return false;
  }
  /// <summary>
  /// Tells whether the current local time of day lies inside the window configured by the
  /// alert settings' start and end times (both bounds inclusive).
  /// </summary>
  /// <returns>
  /// True when the current time of day is inside the window. A window whose start is later
  /// than its end is treated as crossing midnight (for example 22:00 to 06:00).
  /// </returns>
  private bool IsWorkTime()
  {
      var config = GetCloudMonitorConfig();
      AlertConfig alertConfig = config.AlertConfig;

      // Time of day of the current local time.
      var currentTime = DateTime.Now.TimeOfDay;

      // The configured bounds are strings; TimeSpan.Parse throws when they are malformed.
      var startTime = TimeSpan.Parse(alertConfig.工作开始时间);
      var endTime = TimeSpan.Parse(alertConfig.工作结束时间);

      if (startTime <= endTime)
      {
          // Ordinary window inside a single day.
          return currentTime >= startTime && currentTime <= endTime;
      }

      // The window wraps past midnight: it covers [start, 24:00) and [00:00, end].
      // Previously such a configuration could never match.
      return currentTime >= startTime || currentTime <= endTime;
  }
  2209. #endregion
  2210. }
  2211. }
  2212. ;