// predict_edb.go
  1. package models
  2. import (
  3. "encoding/json"
  4. "errors"
  5. "eta/eta_index_lib/utils"
  6. "fmt"
  7. "github.com/beego/beego/v2/client/orm"
  8. "github.com/shopspring/decimal"
  9. "github.com/yidane/formula"
  10. "strings"
  11. "time"
  12. )
  13. // CalculateRule 预测指标 规则 计算
  14. type CalculateRule struct {
  15. EdbInfoId int `description:"指标id"`
  16. ConfigId int `description:"配置id"`
  17. TrendsCalculateMappingList []*PredictEdbConfCalculateMapping
  18. EdbInfoList []*EdbInfo
  19. EdbInfoIdBytes []string
  20. Formula string
  21. RuleType int `description:"预测规则,1:最新,2:固定值,3:同比,4:同差,5:环比,6:环差,7:N期移动均值,8:N期段线性外推值,9:动态环差"`
  22. EndDate string `description:"截止日期"`
  23. EdbInfoIdArr []EdbInfoFromTag `description:"指标信息"`
  24. EmptyType int `description:"空值处理类型(0查找前后35天,1不计算,2前值填充,3后值填充,4等于0)"`
  25. MaxEmptyType int `description:"MAX、MIN公式空值处理类型(1、等于0;2、跳过空值)"`
  26. }
  27. // RefreshCalculateByRuleBy9 刷新计算
  28. func RefreshCalculateByRuleBy9(rule CalculateRule) (resultDataList []*EdbInfoSearchData, err error) {
  29. o := orm.NewOrm()
  30. to, err := o.Begin()
  31. if err != nil {
  32. return
  33. }
  34. defer func() {
  35. if err != nil {
  36. to.Rollback()
  37. } else {
  38. err = to.Commit()
  39. }
  40. }()
  41. resultDataList, err = CalculateByRuleBy9(to, rule)
  42. return
  43. }
  44. // CalculateByRuleBy9 动态环差规则计算入库
  45. func CalculateByRuleBy9(to orm.TxOrmer, rule CalculateRule) (resultDataList []*EdbInfoSearchData, err error) {
  46. realSaveDataMap := make(map[string]map[int]float64)
  47. saveDataMap := make(map[string]map[int]float64)
  48. // 最小的结束日期 , 最晚的数据开始日期
  49. var minLatestDate, maxStartDate time.Time
  50. dateList := make([]string, 0) // 第一个指标的日期数据
  51. formulaStr := strings.ToUpper(rule.Formula)
  52. // 获取关联指标数据
  53. for edbInfoIndex, v := range rule.EdbInfoList {
  54. dataList, tmpErr := GetPredictEdbDataListAll(v, 1)
  55. if tmpErr != nil {
  56. err = tmpErr
  57. return
  58. }
  59. //lenData := len(dataList)
  60. for _, dv := range dataList {
  61. // 现有实际数据
  62. if val, ok := realSaveDataMap[dv.DataTime]; ok {
  63. if _, ok := val[v.EdbInfoId]; !ok {
  64. val[v.EdbInfoId] = dv.Value
  65. }
  66. } else {
  67. temp := make(map[int]float64)
  68. temp[v.EdbInfoId] = dv.Value
  69. realSaveDataMap[dv.DataTime] = temp
  70. }
  71. // 待处理的数据
  72. if val, ok := saveDataMap[dv.DataTime]; ok {
  73. if _, ok := val[v.EdbInfoId]; !ok {
  74. val[v.EdbInfoId] = dv.Value
  75. }
  76. } else {
  77. temp := make(map[int]float64)
  78. temp[v.EdbInfoId] = dv.Value
  79. saveDataMap[dv.DataTime] = temp
  80. }
  81. // 以第一个指标的日期作为基准日期
  82. if edbInfoIndex == 0 {
  83. dateList = append(dateList, dv.DataTime)
  84. tmpDate, _ := time.ParseInLocation(utils.FormatDate, dv.DataTime, time.Local)
  85. if minLatestDate.IsZero() || tmpDate.After(minLatestDate) {
  86. minLatestDate = tmpDate
  87. }
  88. if maxStartDate.IsZero() || tmpDate.Before(maxStartDate) {
  89. maxStartDate = tmpDate
  90. }
  91. }
  92. }
  93. /*if lenData > 0 {
  94. tmpLatestDate, _ := time.ParseInLocation(utils.FormatDate, dataList[lenData-1].DataTime, time.Local)
  95. if minLatestDate.IsZero() || minLatestDate.After(tmpLatestDate) {
  96. minLatestDate = tmpLatestDate
  97. }
  98. tmpStartDate, _ := time.ParseInLocation(utils.FormatDate, dataList[0].DataTime, time.Local)
  99. if maxStartDate.IsZero() || maxStartDate.Before(tmpStartDate) {
  100. maxStartDate = tmpStartDate
  101. }
  102. }*/
  103. }
  104. // todo 数据处理,将日期内不全的数据做填补
  105. HandleDateSaveDataMap(dateList, maxStartDate, minLatestDate, realSaveDataMap, saveDataMap, rule.EdbInfoList, rule.EmptyType)
  106. // 添加数据
  107. addDataList := make([]*PredictEdbRuleData, 0)
  108. // 计算规则
  109. formulaDateSlice, formulaDateMap, err := utils.HandleFormulaJson(formulaStr, minLatestDate)
  110. if err != nil {
  111. return
  112. }
  113. //获取指标所有数据
  114. dataList := make([]*PredictEdbRuleData, 0)
  115. sql := `SELECT * FROM predict_edb_rule_data WHERE config_id = ?`
  116. _, err = to.Raw(sql, rule.ConfigId).QueryRows(&dataList)
  117. if err != nil {
  118. return
  119. }
  120. dataMap := make(map[string]*PredictEdbRuleData)
  121. for _, v := range dataList {
  122. dataMap[v.DataTime] = v
  123. }
  124. existDataMap := make(map[string]string)
  125. removeDateList := make([]string, 0) //需要移除的日期
  126. // 判断是否特殊处理max和min函数
  127. maxDealFlag := false
  128. if rule.EmptyType == 4 && rule.MaxEmptyType == 2 {
  129. maxDealFlag = true
  130. }
  131. for sk, sv := range saveDataMap {
  132. // 当空值处理类型选择了不计算时,只要有一个指标在某个日期没有值(即空值),则计算指标在该日期没有值
  133. if rule.EmptyType == 1 {
  134. if len(sv) != len(rule.EdbInfoList) {
  135. continue
  136. }
  137. }
  138. //fmt.Println(sk, sv)
  139. // 根据时间范围,选择对应的公式
  140. formulaMap := make(map[string]string)
  141. formulaStr = ""
  142. for _, fv := range formulaDateSlice {
  143. if sk < fv {
  144. if f, ok := formulaDateMap[fv]; ok {
  145. formulaStr = f
  146. formulaMap = utils.CheckFormula(formulaStr)
  147. }
  148. break
  149. }
  150. }
  151. if formulaStr == "" {
  152. continue
  153. }
  154. svMax := make(map[int]float64)
  155. if maxDealFlag {
  156. // 特殊处理max和min函数,如果原本的值为空,则选择空值参与运算
  157. if svMaxData, ok := realSaveDataMap[sk]; ok {
  158. svMax = svMaxData
  159. }
  160. }
  161. formulaStr = strings.ToUpper(formulaStr)
  162. //fmt.Println(sk, sv)
  163. formulaFormStr := ReplaceFormula(rule.EdbInfoList, sv, svMax, formulaMap, formulaStr, rule.EdbInfoIdBytes, maxDealFlag)
  164. //计算公式异常,那么就移除该指标
  165. if formulaFormStr == "" {
  166. removeDateList = append(removeDateList, sk)
  167. continue
  168. }
  169. //utils.FileLog.Info(fmt.Sprintf("formulaFormStr:%s", formulaFormStr))
  170. expression := formula.NewExpression(formulaFormStr)
  171. calResult, tmpErr := expression.Evaluate()
  172. if tmpErr != nil {
  173. // 分母为0的报错
  174. if strings.Contains(tmpErr.Error(), "divide by zero") {
  175. removeDateList = append(removeDateList, sk)
  176. continue
  177. }
  178. err = errors.New("计算失败:Err:" + tmpErr.Error() + ";formulaStr:" + formulaFormStr)
  179. //fmt.Println(err)
  180. return
  181. }
  182. calVal, tmpErr := calResult.Float64()
  183. if tmpErr != nil {
  184. err = errors.New("计算失败:获取计算值失败 Err:" + tmpErr.Error() + ";formulaStr:" + formulaFormStr)
  185. //fmt.Println(err)
  186. return
  187. }
  188. nanCheck := fmt.Sprintf("%0.f", calVal)
  189. if nanCheck == "NaN" || nanCheck == "+Inf" || nanCheck == "-Inf" {
  190. removeDateList = append(removeDateList, sk)
  191. continue
  192. }
  193. saveValue := decimal.NewFromFloat(calVal).RoundCeil(4).String() //utils.SubFloatToString(calVal, 4)
  194. existPredictEdbRuleData, ok := dataMap[sk]
  195. if !ok {
  196. dataTime, _ := time.ParseInLocation(utils.FormatDate, sk, time.Local)
  197. timestamp := dataTime.UnixNano() / 1e6
  198. if _, existOk := existDataMap[sk]; !existOk {
  199. tmpPredictEdbRuleData := &PredictEdbRuleData{
  200. //PredictEdbRuleDataId: 0,
  201. EdbInfoId: rule.EdbInfoId,
  202. ConfigId: rule.ConfigId,
  203. DataTime: sk,
  204. Value: saveValue,
  205. CreateTime: time.Now(),
  206. ModifyTime: time.Now(),
  207. DataTimestamp: timestamp,
  208. }
  209. addDataList = append(addDataList, tmpPredictEdbRuleData)
  210. }
  211. existDataMap[sk] = sk
  212. } else {
  213. existValDecimal, tmpErr := decimal.NewFromString(existPredictEdbRuleData.Value)
  214. if tmpErr != nil {
  215. err = tmpErr
  216. return
  217. }
  218. existStr := existValDecimal.String()
  219. if existStr != saveValue {
  220. existPredictEdbRuleData.Value = saveValue
  221. existPredictEdbRuleData.ModifyTime = time.Now()
  222. _, err = to.Update(existPredictEdbRuleData, "Value", "ModifyTime")
  223. if err != nil {
  224. return
  225. }
  226. }
  227. }
  228. // 计算出来的结果集
  229. resultDataList = append(resultDataList, &EdbInfoSearchData{
  230. //EdbDataId: 0,
  231. DataTime: sk,
  232. Value: calVal,
  233. })
  234. }
  235. // 添加计算出来的值入库
  236. lenAddDataList := len(addDataList)
  237. if lenAddDataList > 0 {
  238. _, err = to.InsertMulti(lenAddDataList, addDataList)
  239. if err != nil {
  240. return
  241. }
  242. }
  243. //删除多余的值
  244. lenRemoveDateList := len(removeDateList)
  245. if lenRemoveDateList > 0 {
  246. //如果拼接指标变更了,那么需要删除所有的指标数据
  247. sql := ` DELETE FROM predict_edb_rule_data WHERE config_id = ? and data_time in (` + utils.GetOrmInReplace(lenRemoveDateList) + `) `
  248. _, err = to.Raw(sql, rule.ConfigId, removeDateList).Exec()
  249. if err != nil {
  250. err = fmt.Errorf("删除计算失败的预测规则计算指标数据失败,Err:" + err.Error())
  251. return
  252. }
  253. }
  254. return
  255. }
  256. // RefreshCalculateByRuleByLineNh 刷新动态结果计算(线性拟合)
  257. func RefreshCalculateByRuleByLineNh(predictEdbInfo EdbInfo, predictEdbConfAndDataList []*PredictEdbConfAndData, rule PredictEdbConf) (err error, errMsg string) {
  258. o := orm.NewOrm()
  259. to, err := o.Begin()
  260. if err != nil {
  261. return
  262. }
  263. defer func() {
  264. if err != nil {
  265. to.Rollback()
  266. } else {
  267. err = to.Commit()
  268. }
  269. }()
  270. err, errMsg = CalculateByRuleByRuleLineNh(to, predictEdbInfo, predictEdbConfAndDataList, rule)
  271. return
  272. }
  273. // CalculateByRuleByRuleLineNh 一元线性拟合规则计算入库
  274. func CalculateByRuleByRuleLineNh(to orm.TxOrmer, predictEdbInfo EdbInfo, predictEdbConfAndDataList []*PredictEdbConfAndData, rule PredictEdbConf) (err error, errMsg string) {
  275. var secondDataList []*EdbInfoSearchData
  276. predictEdbInfoId := predictEdbInfo.EdbInfoId // 预测指标id
  277. // 规则
  278. var ruleConf RuleLineNhConf
  279. tmpErr := json.Unmarshal([]byte(rule.Value), &ruleConf)
  280. if tmpErr != nil {
  281. errMsg = `季节性配置信息异常`
  282. err = errors.New("季节性配置信息异常:" + tmpErr.Error())
  283. return
  284. }
  285. // 获取自身指标的数据
  286. {
  287. // 来源指标
  288. var sourceEdbInfoItem *EdbInfo
  289. sql := ` SELECT * FROM edb_info WHERE edb_info_id=? `
  290. err = to.Raw(sql, rule.SourceEdbInfoId).QueryRow(&sourceEdbInfoItem)
  291. if err != nil {
  292. return
  293. }
  294. predictEdbInfo.EdbInfoId = 0
  295. secondDataList, err, _ = GetPredictDataListByPredictEdbConfList(&predictEdbInfo, sourceEdbInfoItem, predictEdbConfAndDataList, 1, ``)
  296. if err != nil {
  297. return
  298. }
  299. }
  300. lenSecondData := len(secondDataList)
  301. if lenSecondData <= 0 {
  302. return
  303. }
  304. newNhccDataMap, err, errMsg := getCalculateNhccData(secondDataList, ruleConf)
  305. if err != nil {
  306. return
  307. }
  308. //将最后计算出来的结果数据处理(新增入库、编辑日期的值、删除日期)
  309. {
  310. // 获取需要预测的日期
  311. startDateStr := secondDataList[lenSecondData-1].DataTime
  312. startDate, _ := time.ParseInLocation(utils.FormatDate, startDateStr, time.Local)
  313. //endDate, _ := time.ParseInLocation(utils.FormatDate, ruleConf.EndDate, time.Local)
  314. endDate := rule.EndDate
  315. dayList := getPredictEdbDayList(startDate, endDate, predictEdbInfo.Frequency, predictEdbInfo.DataDateType)
  316. if len(dayList) <= 0 { // 如果未来没有日期的话,那么就退出当前循环,进入下一个循环
  317. return
  318. }
  319. //获取该配置的所有数据
  320. dataList := make([]*PredictEdbRuleData, 0)
  321. sql := `SELECT * FROM predict_edb_rule_data WHERE config_id = ?`
  322. _, err = to.Raw(sql, rule.ConfigId).QueryRows(&dataList)
  323. if err != nil {
  324. return
  325. }
  326. dataMap := make(map[string]*PredictEdbRuleData)
  327. for _, v := range dataList {
  328. dataMap[v.DataTime] = v
  329. }
  330. //需要移除的日期
  331. removeDateList := make([]string, 0)
  332. // 已经操作过的日期
  333. existDataMap := make(map[string]string)
  334. // 添加数据
  335. addDataList := make([]*PredictEdbRuleData, 0)
  336. for _, currentDate := range dayList {
  337. // 动态拟合残差值数据
  338. currentDateStr := currentDate.Format(utils.FormatDate)
  339. val, ok := newNhccDataMap[currentDateStr]
  340. // 找不到数据,那么就移除该日期的数据
  341. if !ok {
  342. removeDateList = append(removeDateList, currentDateStr)
  343. continue
  344. }
  345. saveValue := decimal.NewFromFloat(val).RoundCeil(4).String() //utils.SubFloatToString(calVal, 4)
  346. existPredictEdbRuleData, ok := dataMap[currentDateStr]
  347. if !ok {
  348. timestamp := currentDate.UnixNano() / 1e6
  349. if _, existOk := existDataMap[currentDateStr]; !existOk {
  350. tmpPredictEdbRuleData := &PredictEdbRuleData{
  351. //PredictEdbRuleDataId: 0,
  352. EdbInfoId: predictEdbInfoId,
  353. ConfigId: rule.ConfigId,
  354. DataTime: currentDateStr,
  355. Value: saveValue,
  356. CreateTime: time.Now(),
  357. ModifyTime: time.Now(),
  358. DataTimestamp: timestamp,
  359. }
  360. addDataList = append(addDataList, tmpPredictEdbRuleData)
  361. }
  362. existDataMap[currentDateStr] = currentDateStr
  363. } else {
  364. existValDecimal, tmpErr := decimal.NewFromString(existPredictEdbRuleData.Value)
  365. if tmpErr != nil {
  366. err = tmpErr
  367. return
  368. }
  369. existStr := existValDecimal.String()
  370. if existStr != saveValue {
  371. existPredictEdbRuleData.Value = saveValue
  372. existPredictEdbRuleData.ModifyTime = time.Now()
  373. _, err = to.Update(existPredictEdbRuleData, "Value", "ModifyTime")
  374. if err != nil {
  375. return
  376. }
  377. }
  378. }
  379. }
  380. // 添加计算出来的值入库
  381. lenAddDataList := len(addDataList)
  382. if lenAddDataList > 0 {
  383. _, err = to.InsertMulti(lenAddDataList, addDataList)
  384. if err != nil {
  385. return
  386. }
  387. }
  388. //删除多余的值
  389. lenRemoveDateList := len(removeDateList)
  390. if lenRemoveDateList > 0 {
  391. //如果拼接指标变更了,那么需要删除所有的指标数据
  392. sql := ` DELETE FROM predict_edb_rule_data WHERE config_id = ? and data_time in (` + utils.GetOrmInReplace(lenRemoveDateList) + `) `
  393. _, err = to.Raw(sql, rule.ConfigId, removeDateList).Exec()
  394. if err != nil {
  395. err = fmt.Errorf("删除计算失败的预测规则计算指标数据失败,Err:" + err.Error())
  396. return
  397. }
  398. }
  399. }
  400. return
  401. }