random.go 3.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129
  1. package main
  2. import (
  3. "bytes"
  4. "encoding/json"
  5. "fmt"
  6. "github.com/emqx/kuiper/common"
  7. "github.com/emqx/kuiper/xstream/api"
  8. "math/rand"
  9. "time"
  10. )
  // dedupStateKey is the key under which the deduplication history is read from
  // and written to the stream context state.
  const dedupStateKey = "input"
  // randomSourceConfig holds the properties of the random source as decoded from
  // the user supplied property map.
  type randomSourceConfig struct {
  	// Interval is the period between two generated tuples, in milliseconds.
  	Interval int `json:"interval"`
  	// Seed is the exclusive upper bound of the random offset that is added to
  	// every pattern value.
  	Seed int `json:"seed"`
  	// Pattern maps each output field name to the base value of that field.
  	Pattern map[string]interface{} `json:"pattern"`
  	// Deduplicate is how many recent tuples the source traces for
  	// deduplication. If 0, deduplication is disabled; if negative, the history
  	// is kept for the whole life time of the source.
  	Deduplicate int `json:"deduplicate"`
  }
  19. //Emit data randomly with only a string field
  20. type randomSource struct {
  21. conf *randomSourceConfig
  22. list [][]byte
  23. }
  24. func (s *randomSource) Configure(topic string, props map[string]interface{}) error {
  25. cfg := &randomSourceConfig{}
  26. err := common.MapToStruct(props, cfg)
  27. if err != nil {
  28. return fmt.Errorf("read properties %v fail with error: %v", props, err)
  29. }
  30. if cfg.Interval <= 0 {
  31. return fmt.Errorf("source `random` property `interval` must be a positive integer but got %d", cfg.Interval)
  32. }
  33. if cfg.Pattern == nil {
  34. return fmt.Errorf("source `random` property `pattern` is required")
  35. }
  36. if cfg.Interval <= 0 {
  37. return fmt.Errorf("source `random` property `seed` must be a positive integer but got %d", cfg.Seed)
  38. }
  39. s.conf = cfg
  40. return nil
  41. }
  42. func (s *randomSource) Open(ctx api.StreamContext, consumer chan<- api.SourceTuple, errCh chan<- error) {
  43. logger := ctx.GetLogger()
  44. logger.Debugf("open random source with deduplicate %d", s.conf.Deduplicate)
  45. if s.conf.Deduplicate != 0 {
  46. list, err := ctx.GetState(dedupStateKey)
  47. if err != nil {
  48. errCh <- err
  49. return
  50. }
  51. if list == nil {
  52. list = make([][]byte, 0)
  53. } else {
  54. if l, ok := list.([][]byte); ok {
  55. logger.Debugf("restore list %v", l)
  56. s.list = l
  57. } else {
  58. s.list = make([][]byte, 0)
  59. logger.Warnf("random source gets invalid state, ignore it")
  60. }
  61. }
  62. }
  63. t := time.NewTicker(time.Duration(s.conf.Interval) * time.Millisecond)
  64. defer t.Stop()
  65. for {
  66. select {
  67. case <-t.C:
  68. next := randomize(s.conf.Pattern, s.conf.Seed)
  69. if s.conf.Deduplicate != 0 && s.isDup(ctx, next) {
  70. logger.Debugf("find duplicate")
  71. continue
  72. }
  73. logger.Debugf("Send out data %v", next)
  74. consumer <- api.NewDefaultSourceTuple(next, nil)
  75. case <-ctx.Done():
  76. return
  77. }
  78. }
  79. }
  80. func randomize(p map[string]interface{}, seed int) map[string]interface{} {
  81. r := make(map[string]interface{})
  82. for k, v := range p {
  83. //TODO other data types
  84. vi, err := common.ToInt(v)
  85. if err != nil {
  86. break
  87. }
  88. r[k] = vi + rand.Intn(seed)
  89. }
  90. return r
  91. }
  92. func (s *randomSource) isDup(ctx api.StreamContext, next map[string]interface{}) bool {
  93. logger := ctx.GetLogger()
  94. ns, err := json.Marshal(next)
  95. if err != nil {
  96. logger.Warnf("invalid input data %v", next)
  97. return true
  98. }
  99. for _, ps := range s.list {
  100. if bytes.Compare(ns, ps) == 0 {
  101. logger.Debugf("got duplicate %s", ns)
  102. return true
  103. }
  104. }
  105. logger.Debugf("no duplicate %s", ns)
  106. if s.conf.Deduplicate > 0 && len(s.list) >= s.conf.Deduplicate {
  107. s.list = s.list[1:]
  108. }
  109. s.list = append(s.list, ns)
  110. ctx.PutState(dedupStateKey, s.list)
  111. return false
  112. }
  113. func (s *randomSource) Close(_ api.StreamContext) error {
  114. return nil
  115. }
  116. func Random() api.Source {
  117. return &randomSource{}
  118. }