123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129 |
- package main
- import (
- "bytes"
- "encoding/json"
- "fmt"
- "github.com/emqx/kuiper/common"
- "github.com/emqx/kuiper/xstream/api"
- "math/rand"
- "time"
- )
// dedupStateKey is the key under which the deduplication history is read
// from and written to the stream context state.
const (
	dedupStateKey = "input"
)
// randomSourceConfig holds the properties accepted by the random source.
type randomSourceConfig struct {
	// Interval is the period between two emissions, in milliseconds.
	Interval int `json:"interval"`
	// Seed is the exclusive upper bound of the random offset added to each
	// pattern value.
	Seed int `json:"seed"`
	// Pattern maps each output field name to its base value.
	Pattern map[string]interface{} `json:"pattern"`
	// Deduplicate is the number of most recent tuples remembered for
	// deduplication. Zero disables deduplication; a negative value keeps the
	// history for the whole lifetime of the source.
	Deduplicate int `json:"deduplicate"`
}
- //Emit data randomly with only a string field
- type randomSource struct {
- conf *randomSourceConfig
- list [][]byte
- }
- func (s *randomSource) Configure(topic string, props map[string]interface{}) error {
- cfg := &randomSourceConfig{}
- err := common.MapToStruct(props, cfg)
- if err != nil {
- return fmt.Errorf("read properties %v fail with error: %v", props, err)
- }
- if cfg.Interval <= 0 {
- return fmt.Errorf("source `random` property `interval` must be a positive integer but got %d", cfg.Interval)
- }
- if cfg.Pattern == nil {
- return fmt.Errorf("source `random` property `pattern` is required")
- }
- if cfg.Interval <= 0 {
- return fmt.Errorf("source `random` property `seed` must be a positive integer but got %d", cfg.Seed)
- }
- s.conf = cfg
- return nil
- }
- func (s *randomSource) Open(ctx api.StreamContext, consumer chan<- api.SourceTuple, errCh chan<- error) {
- logger := ctx.GetLogger()
- logger.Debugf("open random source with deduplicate %d", s.conf.Deduplicate)
- if s.conf.Deduplicate != 0 {
- list, err := ctx.GetState(dedupStateKey)
- if err != nil {
- errCh <- err
- return
- }
- if list == nil {
- list = make([][]byte, 0)
- } else {
- if l, ok := list.([][]byte); ok {
- logger.Debugf("restore list %v", l)
- s.list = l
- } else {
- s.list = make([][]byte, 0)
- logger.Warnf("random source gets invalid state, ignore it")
- }
- }
- }
- t := time.NewTicker(time.Duration(s.conf.Interval) * time.Millisecond)
- defer t.Stop()
- for {
- select {
- case <-t.C:
- next := randomize(s.conf.Pattern, s.conf.Seed)
- if s.conf.Deduplicate != 0 && s.isDup(ctx, next) {
- logger.Debugf("find duplicate")
- continue
- }
- logger.Debugf("Send out data %v", next)
- consumer <- api.NewDefaultSourceTuple(next, nil)
- case <-ctx.Done():
- return
- }
- }
- }
- func randomize(p map[string]interface{}, seed int) map[string]interface{} {
- r := make(map[string]interface{})
- for k, v := range p {
- //TODO other data types
- vi, err := common.ToInt(v)
- if err != nil {
- break
- }
- r[k] = vi + rand.Intn(seed)
- }
- return r
- }
- func (s *randomSource) isDup(ctx api.StreamContext, next map[string]interface{}) bool {
- logger := ctx.GetLogger()
- ns, err := json.Marshal(next)
- if err != nil {
- logger.Warnf("invalid input data %v", next)
- return true
- }
- for _, ps := range s.list {
- if bytes.Compare(ns, ps) == 0 {
- logger.Debugf("got duplicate %s", ns)
- return true
- }
- }
- logger.Debugf("no duplicate %s", ns)
- if s.conf.Deduplicate > 0 && len(s.list) >= s.conf.Deduplicate {
- s.list = s.list[1:]
- }
- s.list = append(s.list, ns)
- ctx.PutState(dedupStateKey, s.list)
- return false
- }
- func (s *randomSource) Close(_ api.StreamContext) error {
- return nil
- }
- func Random() api.Source {
- return &randomSource{}
- }
|