edb_data_calculate_percentile.go 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488
  1. package models
  2. import (
  3. "encoding/json"
  4. "errors"
  5. "eta/eta_index_lib/utils"
  6. "fmt"
  7. "github.com/beego/beego/v2/client/orm"
  8. "github.com/shopspring/decimal"
  9. "reflect"
  10. "strconv"
  11. "strings"
  12. "time"
  13. )
  14. // Percentile 百分位
  15. type Percentile struct {
  16. }
  17. // Add 添加
  18. func (obj Percentile) Add(params AddCalculateBatchParams) (edbInfo *EdbInfo, err error, errMsg string) {
  19. req := params.Req
  20. fromEdbInfo := params.FromEdbInfo
  21. edbCode := params.EdbCode
  22. o := orm.NewOrm()
  23. to, err := o.Begin()
  24. if err != nil {
  25. return
  26. }
  27. defer func() {
  28. if err != nil {
  29. _ = to.Rollback()
  30. fmt.Println(reflect.TypeOf(obj).Name(), ";Add,Err:"+err.Error())
  31. } else {
  32. _ = to.Commit()
  33. }
  34. }()
  35. edbInfo = new(EdbInfo)
  36. edbInfo.Source = obj.GetSource()
  37. edbInfo.SourceName = obj.GetSourceName()
  38. edbInfo.EdbCode = edbCode
  39. edbInfo.EdbName = req.EdbName
  40. edbInfo.EdbNameSource = req.EdbName
  41. edbInfo.Frequency = req.Frequency
  42. edbInfo.Unit = req.Unit
  43. edbInfo.ClassifyId = req.ClassifyId
  44. edbInfo.SysUserId = params.SysUserId
  45. edbInfo.SysUserRealName = params.SysUserRealName
  46. edbInfo.CreateTime = time.Now()
  47. edbInfo.ModifyTime = time.Now()
  48. edbInfo.UniqueCode = params.UniqueCode
  49. edbInfo.CalculateFormula = req.Formula
  50. edbInfo.EdbNameEn = req.EdbName
  51. edbInfo.UnitEn = req.Unit
  52. edbInfo.EdbType = obj.GetEdbType()
  53. newEdbInfoId, tmpErr := to.Insert(edbInfo)
  54. if tmpErr != nil {
  55. err = tmpErr
  56. return
  57. }
  58. edbInfo.EdbInfoId = int(newEdbInfoId)
  59. //关联关系
  60. {
  61. calculateMappingItem := new(EdbInfoCalculateMapping)
  62. calculateMappingItem.CreateTime = time.Now()
  63. calculateMappingItem.ModifyTime = time.Now()
  64. calculateMappingItem.Sort = 1
  65. calculateMappingItem.EdbCode = edbCode
  66. calculateMappingItem.EdbInfoId = edbInfo.EdbInfoId
  67. calculateMappingItem.FromEdbInfoId = fromEdbInfo.EdbInfoId
  68. calculateMappingItem.FromEdbCode = fromEdbInfo.EdbCode
  69. calculateMappingItem.FromEdbName = fromEdbInfo.EdbName
  70. calculateMappingItem.FromSource = fromEdbInfo.Source
  71. calculateMappingItem.FromSourceName = fromEdbInfo.SourceName
  72. calculateMappingItem.FromTag = ""
  73. calculateMappingItem.Source = edbInfo.Source
  74. calculateMappingItem.SourceName = edbInfo.SourceName
  75. calculateMappingItem.FromSubSource = fromEdbInfo.SubSource
  76. _, err = to.Insert(calculateMappingItem)
  77. if err != nil {
  78. return
  79. }
  80. }
  81. //计算数据
  82. err, errMsg = obj.refresh(to, edbInfo, fromEdbInfo, edbInfo.EdbCode)
  83. return
  84. }
  85. // Edit 编辑
  86. func (obj Percentile) Edit(params EditCalculateBatchParams) (err error, errMsg string) {
  87. req := params.Req
  88. edbInfo := params.EdbInfo
  89. fromEdbInfo := params.FromEdbInfo
  90. o := orm.NewOrm()
  91. to, err := o.Begin()
  92. if err != nil {
  93. return
  94. }
  95. defer func() {
  96. if err != nil {
  97. _ = to.Rollback()
  98. fmt.Println(reflect.TypeOf(obj).Name(), ";Edit,Err:"+err.Error())
  99. } else {
  100. _ = to.Commit()
  101. }
  102. }()
  103. tableName := GetEdbDataTableName(edbInfo.Source, edbInfo.SubSource)
  104. oldEdbInfo := *edbInfo
  105. //修改指标信息
  106. edbInfo.EdbName = req.EdbName
  107. edbInfo.EdbNameSource = req.EdbName
  108. edbInfo.Frequency = req.Frequency
  109. edbInfo.Unit = req.Unit
  110. edbInfo.ClassifyId = req.ClassifyId
  111. edbInfo.CalculateFormula = req.Formula
  112. edbInfo.EdbNameEn = req.EdbNameEn
  113. edbInfo.UnitEn = req.UnitEn
  114. edbInfo.ModifyTime = time.Now()
  115. _, err = to.Update(edbInfo, "EdbName", "EdbNameSource", "Frequency", "Unit", "ClassifyId", "CalculateFormula", "ModifyTime", "EdbNameEn", "UnitEn")
  116. if err != nil {
  117. return
  118. }
  119. var existCondition string
  120. var existPars []interface{}
  121. existCondition += " AND edb_info_id=? AND from_edb_info_id=? "
  122. existPars = append(existPars, edbInfo.EdbInfoId, req.FromEdbInfoId)
  123. //判断计算指标是否被更换
  124. count, err := GetEdbInfoCalculateCountByCondition(existCondition, existPars)
  125. if err != nil {
  126. err = errors.New("判断指标是否改变失败,Err:" + err.Error())
  127. return
  128. }
  129. if count > 0 { // 指标未被替换,无需处理逻辑
  130. // 如果相关配置更改了,那么重新计算
  131. if oldEdbInfo.CalculateFormula != edbInfo.CalculateFormula {
  132. err, errMsg = obj.refresh(to, edbInfo, fromEdbInfo, edbInfo.EdbCode)
  133. }
  134. return
  135. }
  136. //删除,计算指标关联的,基础指标的关联关系
  137. sql := ` DELETE FROM edb_info_calculate_mapping WHERE edb_info_id = ? `
  138. _, err = to.Raw(sql, edbInfo.EdbInfoId).Exec()
  139. if err != nil {
  140. return
  141. }
  142. //清空原有数据
  143. sql = ` DELETE FROM ` + tableName + ` WHERE edb_info_id = ? `
  144. _, err = to.Raw(sql, edbInfo.EdbInfoId).Exec()
  145. if err != nil {
  146. return
  147. }
  148. //关联关系
  149. {
  150. calculateMappingItem := &EdbInfoCalculateMapping{
  151. EdbInfoCalculateMappingId: 0,
  152. EdbInfoId: edbInfo.EdbInfoId,
  153. Source: obj.GetSource(),
  154. SourceName: obj.GetSourceName(),
  155. EdbCode: edbInfo.EdbCode,
  156. FromEdbInfoId: fromEdbInfo.EdbInfoId,
  157. FromEdbCode: fromEdbInfo.EdbCode,
  158. FromEdbName: fromEdbInfo.EdbName,
  159. FromSource: fromEdbInfo.Source,
  160. FromSourceName: fromEdbInfo.SourceName,
  161. FromTag: "",
  162. Sort: 1,
  163. CreateTime: time.Now(),
  164. ModifyTime: time.Now(),
  165. FromSubSource: fromEdbInfo.SubSource,
  166. }
  167. _, err = to.Insert(calculateMappingItem)
  168. if err != nil {
  169. return
  170. }
  171. }
  172. //计算数据
  173. err, errMsg = obj.refresh(to, edbInfo, fromEdbInfo, edbInfo.EdbCode)
  174. return
  175. }
  176. // Refresh 刷新
  177. func (obj Percentile) Refresh(params RefreshParams) (err error, errMsg string) {
  178. calculateMapping, err := GetEdbInfoCalculateMappingDetail(params.EdbInfo.EdbInfoId)
  179. if err != nil {
  180. errMsg = "GetEdbInfoCalculateLjzzyDetail Err:" + err.Error()
  181. return
  182. }
  183. fromEdbInfo, err := GetEdbInfoById(calculateMapping.FromEdbInfoId)
  184. if err != nil {
  185. errMsg = "GetEdbInfoById Err:" + err.Error()
  186. return
  187. }
  188. o := orm.NewOrm()
  189. to, err := o.Begin()
  190. if err != nil {
  191. return
  192. }
  193. defer func() {
  194. if err != nil {
  195. _ = to.Rollback()
  196. fmt.Println(reflect.TypeOf(obj).Name(), ";Refresh,Err:"+err.Error())
  197. } else {
  198. _ = to.Commit()
  199. }
  200. }()
  201. // 计算数据
  202. err, errMsg = obj.refresh(to, params.EdbInfo, fromEdbInfo, params.EdbInfo.EdbCode)
  203. return
  204. }
  205. // GetSource 获取来源编码id
  206. func (obj Percentile) GetSource() int {
  207. return utils.DATA_SOURCE_CALCULATE_PERCENTILE
  208. }
  209. // GetSourceName 获取来源名称
  210. func (obj Percentile) GetSourceName() string {
  211. return utils.DATA_SOURCE_NAME_CALCULATE_PERCENTILE
  212. }
  213. // GetEdbType 获取指标类型
  214. func (obj Percentile) GetEdbType() int {
  215. return utils.CALCULATE_EDB_TYPE
  216. }
  217. // PercentileConfig 百分位的配置
  218. type PercentileConfig struct {
  219. CalculateValue int `description:"时间长度期数"`
  220. CalculateUnit string `description:"时间长度频度"`
  221. PercentType int `description:"百分位:0-数据区间(兼容历史数据); 1-数据个数;"`
  222. }
  223. // refresh 刷新
  224. func (obj Percentile) refresh(to orm.TxOrmer, edbInfo, fromEdbInfo *EdbInfo, edbCode string) (err error, errMsg string) {
  225. edbInfoId := edbInfo.EdbInfoId
  226. dataTableName := GetEdbDataTableName(edbInfo.Source, edbInfo.SubSource)
  227. edbInfoIdStr := strconv.Itoa(edbInfoId)
  228. var percentileConfig PercentileConfig
  229. err = json.Unmarshal([]byte(edbInfo.CalculateFormula), &percentileConfig)
  230. if err != nil {
  231. return
  232. }
  233. // 获取百分位的指标数据
  234. fromDataList, err, errMsg := obj.getPercentileData(fromEdbInfo, percentileConfig.CalculateValue, percentileConfig.CalculateUnit, percentileConfig.PercentType)
  235. if err != nil {
  236. return
  237. }
  238. //获取指标所有数据
  239. existDataList := make([]*EdbData, 0)
  240. sql := `SELECT * FROM %s WHERE edb_info_id=? `
  241. sql = fmt.Sprintf(sql, dataTableName)
  242. _, err = to.Raw(sql, edbInfoId).QueryRows(&existDataList)
  243. if err != nil {
  244. return
  245. }
  246. existDataMap := make(map[string]string)
  247. removeDataTimeMap := make(map[string]int) //需要移除的日期数据
  248. for _, v := range existDataList {
  249. existDataMap[v.DataTime] = v.Value
  250. removeDataTimeMap[v.DataTime] = 1
  251. }
  252. needAddDateMap := make(map[time.Time]int)
  253. addSql := ` INSERT INTO ` + dataTableName + `(edb_info_id,edb_code,data_time,value,create_time,modify_time,data_timestamp) values `
  254. var isAdd bool
  255. for _, tmpData := range fromDataList {
  256. currDateStr := tmpData.DataTime
  257. currTime, tmpErr := time.ParseInLocation(utils.FormatDate, currDateStr, time.Local)
  258. if tmpErr != nil {
  259. err = tmpErr
  260. return
  261. }
  262. // 当前的实际值
  263. saveValue := decimal.NewFromFloat(tmpData.Value).Round(4).String()
  264. existVal, ok := existDataMap[currDateStr]
  265. // 如果库中已经存在该数据的话,那么就进行值的变更操作
  266. if ok {
  267. //校验待删除日期数据里面是否存在该元素,如果存在的话,那么移除该日期
  268. delete(removeDataTimeMap, currDateStr)
  269. if existVal != saveValue {
  270. sql := ` UPDATE %s SET value=?,modify_time=NOW() WHERE edb_info_id=? AND data_time=? `
  271. sql = fmt.Sprintf(sql, dataTableName)
  272. _, err = to.Raw(sql, saveValue, edbInfoId, currDateStr).Exec()
  273. if err != nil {
  274. return
  275. }
  276. }
  277. continue
  278. }
  279. // 库中不存在该日期的数据
  280. timestamp := currTime.UnixNano() / 1e6
  281. timeStr := fmt.Sprintf("%d", timestamp)
  282. if _, existOk := needAddDateMap[currTime]; !existOk {
  283. addSql += GetAddSql(edbInfoIdStr, edbCode, currDateStr, timeStr, saveValue)
  284. isAdd = true
  285. }
  286. needAddDateMap[currTime] = 1
  287. }
  288. //删除已经不存在的指标数据(由于该指标当日的数据删除了)
  289. {
  290. removeDateList := make([]string, 0)
  291. for dateTime := range removeDataTimeMap {
  292. removeDateList = append(removeDateList, dateTime)
  293. }
  294. removeNum := len(removeDateList)
  295. if removeNum > 0 {
  296. sql := fmt.Sprintf(` DELETE FROM %s WHERE edb_info_id = ? and data_time in (`+utils.GetOrmInReplace(removeNum)+`) `, dataTableName)
  297. _, err = to.Raw(sql, edbInfo.EdbInfoId, removeDateList).Exec()
  298. if err != nil {
  299. fmt.Println(reflect.TypeOf(obj).Name(), " add data ;delete Err", err.Error())
  300. err = fmt.Errorf("删除不存在的指标数据失败,Err:" + err.Error())
  301. return
  302. }
  303. }
  304. }
  305. if isAdd {
  306. addSql = strings.TrimRight(addSql, ",")
  307. _, err = to.Raw(addSql).Exec()
  308. if err != nil {
  309. fmt.Println(reflect.TypeOf(obj).Name(), " add data Err", err.Error())
  310. return
  311. }
  312. }
  313. return
  314. }
  315. func (obj Percentile) calculate(edbInfoId int, date, edbInfoIdStr, edbCode, dataTableName, addSql string, val float64, dataMap, existDataMap map[string]string, to orm.TxOrmer) (newSql string, isAdd bool, err error) {
  316. newSql = addSql
  317. saveValue := utils.SubFloatToString(val, 4)
  318. //判断数据是否存在
  319. if existVal, ok := dataMap[date]; !ok {
  320. dataTime, _ := time.ParseInLocation(utils.FormatDate, date, time.Local)
  321. timestamp := dataTime.UnixNano() / 1e6
  322. timeStr := fmt.Sprintf("%d", timestamp)
  323. if _, existOk := existDataMap[date]; !existOk {
  324. newSql += GetAddSql(edbInfoIdStr, edbCode, date, timeStr, saveValue)
  325. isAdd = true
  326. }
  327. existDataMap[date] = date
  328. } else {
  329. if existVal != saveValue {
  330. sql := ` UPDATE %s SET value=?,modify_time=NOW() WHERE edb_info_id=? AND data_time=? `
  331. sql = fmt.Sprintf(sql, dataTableName)
  332. _, err = to.Raw(sql, saveValue, edbInfoId, date).Exec()
  333. }
  334. }
  335. return
  336. }
  337. // GetPercentileData 获取百分位图表的指标数据
  338. func (obj Percentile) getPercentileData(fromEdbInfo *EdbInfo, calculateValue int, calculateUnit string, percentType int) (newDataList []EdbInfoSearchData, err error, errMsg string) {
  339. // 获取时间基准指标在时间区间内的值
  340. dataList := make([]*EdbInfoSearchData, 0)
  341. switch fromEdbInfo.EdbInfoType {
  342. case 0:
  343. //获取来源指标的数据
  344. dataList, err = GetEdbDataListAll(fromEdbInfo.Source, fromEdbInfo.SubSource, FindEdbDataListAllCond{
  345. EdbInfoId: fromEdbInfo.EdbInfoId,
  346. }, 1)
  347. case 1:
  348. dataList, err = GetPredictEdbDataListAllByStartDate(fromEdbInfo, 1, "")
  349. default:
  350. err = errors.New(fmt.Sprint("获取失败,指标base类型异常", fromEdbInfo.EdbInfoType))
  351. return
  352. }
  353. moveUnitDays, ok := utils.FrequencyDaysMap[calculateUnit]
  354. if !ok {
  355. errMsg = `错误的周期`
  356. err = errors.New(errMsg)
  357. return
  358. }
  359. calculateDay := calculateValue * moveUnitDays
  360. // 指标对应的所有数据
  361. newDataList = make([]EdbInfoSearchData, 0)
  362. dataMap := make(map[time.Time]float64, 0)
  363. for _, tmpData := range dataList {
  364. currDateTime, _ := time.ParseInLocation(utils.FormatDate, tmpData.DataTime, time.Local)
  365. dataMap[currDateTime] = tmpData.Value
  366. }
  367. //百分位:对所选指标滚动地取对应时间长度的数据值,取最大值Max,最小值Min,计算Max-Min,百分位=(现值-Min)/(Max-Min),Max=Min时不予计算。
  368. if percentType == utils.PercentCalculateTypeRange {
  369. for i, tmpData := range dataList {
  370. currDateTime, _ := time.ParseInLocation(utils.FormatDate, tmpData.DataTime, time.Local)
  371. maxVal := tmpData.Value
  372. minVal := tmpData.Value
  373. for k := 0; k < calculateDay; k++ {
  374. preVal, ok2 := dataMap[currDateTime.AddDate(0, 0, -k)]
  375. if ok2 {
  376. if preVal > maxVal {
  377. maxVal = preVal
  378. }
  379. if preVal < minVal {
  380. minVal = preVal
  381. }
  382. }
  383. }
  384. if maxVal == minVal {
  385. continue
  386. }
  387. tmpV := (tmpData.Value - minVal) / (maxVal - minVal) * 100
  388. tmpV, _ = decimal.NewFromFloat(tmpV).Round(4).Float64()
  389. //百分位=(现值-Min)/(Max-Min)
  390. newDataList = append(newDataList, EdbInfoSearchData{
  391. EdbDataId: i,
  392. DataTime: dataList[i].DataTime,
  393. Value: tmpV,
  394. })
  395. }
  396. }
  397. // 百分位数据个数算法
  398. // 数据区间第一个和最后一个数据点的时间和数据分别为(T1,S1)(T2,S2); N=T1到T2指标数据个数, n=小于等于S2的数据个数
  399. // 个数百分位=(n-1)/(N-1)
  400. maxDay := len(dataList) // 往前找数据的边界
  401. if percentType == utils.PercentCalculateTypeNum {
  402. for i, d := range dataList {
  403. // T2为当前日期
  404. s2 := decimal.NewFromFloat(d.Value)
  405. t2, _ := time.ParseInLocation(utils.FormatDate, d.DataTime, time.Local)
  406. // 计算N和n
  407. var bigN, tinyN int
  408. for k := 0; k < maxDay; k++ {
  409. // 往前找(时间长度)个有数据的, N理论上只有最前面几个日期<calculateDay, 后面的N=calculateDay
  410. if bigN >= calculateDay {
  411. break
  412. }
  413. preVal, preOk := dataMap[t2.AddDate(0, 0, -k)]
  414. if !preOk {
  415. continue
  416. }
  417. bigN += 1
  418. if decimal.NewFromFloat(preVal).LessThanOrEqual(s2) {
  419. tinyN += 1
  420. }
  421. }
  422. // N<=1时说明计算无效
  423. if bigN <= 1 {
  424. continue
  425. }
  426. numerator := decimal.NewFromInt(int64(tinyN - 1))
  427. denominator := decimal.NewFromInt(int64(bigN - 1))
  428. // 因为是百分位所以这里是要*100, 跟之前的算法保持同步
  429. percentVal, _ := numerator.Div(denominator).Mul(decimal.NewFromFloat(100)).Round(4).Float64()
  430. // 写进数组并判断指标最大最小值
  431. newDataList = append(newDataList, EdbInfoSearchData{
  432. EdbDataId: i,
  433. DataTime: dataList[i].DataTime,
  434. Value: percentVal,
  435. })
  436. }
  437. }
  438. return
  439. }