123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383 |
- package nodes
- import (
- "bytes"
- "encoding/json"
- "fmt"
- "github.com/emqx/kuiper/common"
- "github.com/emqx/kuiper/common/templates"
- "github.com/emqx/kuiper/plugins"
- "github.com/emqx/kuiper/xstream/api"
- "github.com/emqx/kuiper/xstream/sinks"
- "sync"
- "text/template"
- "time"
- )
- type SinkNode struct {
- *defaultSinkNode
- //static
- sinkType string
- mutex sync.RWMutex
- //configs (also static for sinks)
- options map[string]interface{}
- isMock bool
- //states varies after restart
- sinks []api.Sink
- tch chan struct{} //channel to trigger cache saved, will be trigger by checkpoint only
- }
- func NewSinkNode(name string, sinkType string, props map[string]interface{}) *SinkNode {
- bufferLength := 1024
- if c, ok := props["bufferLength"]; ok {
- if t, err := common.ToInt(c); err != nil || t <= 0 {
- //invalid property bufferLength
- } else {
- bufferLength = t
- }
- }
- return &SinkNode{
- defaultSinkNode: &defaultSinkNode{
- input: make(chan interface{}, bufferLength),
- defaultNode: &defaultNode{
- name: name,
- concurrency: 1,
- ctx: nil,
- },
- },
- sinkType: sinkType,
- options: props,
- }
- }
- //Only for mock source, do not use it in production
- func NewSinkNodeWithSink(name string, sink api.Sink, props map[string]interface{}) *SinkNode {
- return &SinkNode{
- defaultSinkNode: &defaultSinkNode{
- input: make(chan interface{}, 1024),
- defaultNode: &defaultNode{
- name: name,
- concurrency: 1,
- ctx: nil,
- },
- },
- sinks: []api.Sink{sink},
- options: props,
- isMock: true,
- }
- }
- func (m *SinkNode) Open(ctx api.StreamContext, result chan<- error) {
- m.ctx = ctx
- logger := ctx.GetLogger()
- logger.Debugf("open sink node %s", m.name)
- if m.qos >= api.AtLeastOnce {
- m.tch = make(chan struct{})
- }
- go func() {
- if c, ok := m.options["concurrency"]; ok {
- if t, err := common.ToInt(c); err != nil || t <= 0 {
- logger.Warnf("invalid type for concurrency property, should be positive integer but found %t", c)
- } else {
- m.concurrency = t
- }
- }
- runAsync := false
- if c, ok := m.options["runAsync"]; ok {
- if t, ok := c.(bool); !ok {
- logger.Warnf("invalid type for runAsync property, should be bool but found %t", c)
- } else {
- runAsync = t
- }
- }
- retryInterval := 1000
- if c, ok := m.options["retryInterval"]; ok {
- if t, err := common.ToInt(c); err != nil || t < 0 {
- logger.Warnf("invalid type for retryInterval property, should be positive integer but found %t", c)
- } else {
- retryInterval = t
- }
- }
- cacheLength := 1024
- if c, ok := m.options["cacheLength"]; ok {
- if t, err := common.ToInt(c); err != nil || t < 0 {
- logger.Warnf("invalid type for cacheLength property, should be positive integer but found %t", c)
- } else {
- cacheLength = t
- }
- }
- cacheSaveInterval := 1000
- if c, ok := m.options["cacheSaveInterval"]; ok {
- if t, err := common.ToInt(c); err != nil || t < 0 {
- logger.Warnf("invalid type for cacheSaveInterval property, should be positive integer but found %t", c)
- } else {
- cacheSaveInterval = t
- }
- }
- omitIfEmpty := false
- if c, ok := m.options["omitIfEmpty"]; ok {
- if t, ok := c.(bool); !ok {
- logger.Warnf("invalid type for omitIfEmpty property, should be a bool value 'true/false'.", c)
- } else {
- omitIfEmpty = t
- }
- }
- sendSingle := false
- if c, ok := m.options["sendSingle"]; ok {
- if t, ok := c.(bool); !ok {
- logger.Warnf("invalid type for sendSingle property, should be a bool value 'true/false'.", c)
- } else {
- sendSingle = t
- }
- }
- var tp *template.Template = nil
- if c, ok := m.options["dataTemplate"]; ok {
- if t, ok := c.(string); !ok {
- logger.Warnf("invalid type for dateTemplate property, should be a string value.", c)
- } else {
- funcMap := template.FuncMap{
- "json": templates.JsonMarshal,
- "base64": templates.Base64Encode,
- "add": templates.Add,
- }
- temp, err := template.New("sink").Funcs(funcMap).Parse(t)
- if err != nil {
- msg := fmt.Sprintf("property dataTemplate %v is invalid: %v", t, err)
- result <- fmt.Errorf(msg)
- logger.Warnf(msg)
- return
- } else {
- tp = temp
- }
- }
- }
- m.reset()
- logger.Infof("open sink node %d instances", m.concurrency)
- for i := 0; i < m.concurrency; i++ { // workers
- go func(instance int) {
- var sink api.Sink
- var err error
- if !m.isMock {
- sink, err = getSink(m.sinkType, m.options)
- if err != nil {
- m.drainError(result, err, ctx, logger)
- return
- }
- m.mutex.Lock()
- m.sinks = append(m.sinks, sink)
- m.mutex.Unlock()
- if err := sink.Open(ctx); err != nil {
- m.drainError(result, err, ctx, logger)
- return
- }
- } else {
- sink = m.sinks[instance]
- }
- stats, err := NewStatManager("sink", ctx)
- if err != nil {
- m.drainError(result, err, ctx, logger)
- return
- }
- m.mutex.Lock()
- m.statManagers = append(m.statManagers, stats)
- m.mutex.Unlock()
- var cache *Cache
- if m.qos >= api.AtLeastOnce {
- cache = NewCheckpointbasedCache(m.input, cacheLength, m.tch, result, ctx)
- } else {
- cache = NewTimebasedCache(m.input, cacheLength, cacheSaveInterval, result, ctx)
- }
- for {
- select {
- case data := <-cache.Out:
- if newdata, processed := m.preprocess(data.data); processed {
- break
- } else {
- data.data = newdata
- }
- stats.SetBufferLength(int64(cache.Length()))
- if runAsync {
- go doCollect(sink, data, stats, retryInterval, omitIfEmpty, sendSingle, tp, cache.Complete, ctx)
- } else {
- doCollect(sink, data, stats, retryInterval, omitIfEmpty, sendSingle, tp, cache.Complete, ctx)
- }
- case <-ctx.Done():
- logger.Infof("sink node %s instance %d done", m.name, instance)
- if err := sink.Close(ctx); err != nil {
- logger.Warnf("close sink node %s instance %d fails: %v", m.name, instance, err)
- }
- return
- }
- }
- }(i)
- }
- }()
- }
- func (m *SinkNode) reset() {
- if !m.isMock {
- m.sinks = nil
- }
- m.statManagers = nil
- }
// extractInput decodes v as a JSON array of objects.
// It returns a nil slice and a descriptive error when v cannot be decoded.
func extractInput(v []byte) ([]map[string]interface{}, error) {
	var records []map[string]interface{}
	err := json.Unmarshal(v, &records)
	if err == nil {
		return records, nil
	}
	return nil, fmt.Errorf("fail to decode the input %s as json: %v", v, err)
}
- func doCollect(sink api.Sink, item *CacheTuple, stats StatManager, retryInterval int, omitIfEmpty bool, sendSingle bool, tp *template.Template, signalCh chan<- int, ctx api.StreamContext) {
- stats.IncTotalRecordsIn()
- stats.ProcessTimeStart()
- defer stats.ProcessTimeEnd()
- logger := ctx.GetLogger()
- var outdatas [][]byte
- switch val := item.data.(type) {
- case []byte:
- if omitIfEmpty && string(val) == "[{}]" {
- return
- }
- var (
- err error
- j []map[string]interface{}
- )
- if sendSingle || tp != nil {
- j, err = extractInput(val)
- if err != nil {
- stats.IncTotalExceptions()
- logger.Warnf("sink node %s instance %d publish %s error: %v", ctx.GetOpId(), ctx.GetInstanceId(), val, err)
- return
- }
- logger.Debugf("receive %d records", len(j))
- }
- if !sendSingle {
- if tp != nil {
- var output bytes.Buffer
- err := tp.Execute(&output, j)
- if err != nil {
- logger.Warnf("sink node %s instance %d publish %s decode template error: %v", ctx.GetOpId(), ctx.GetInstanceId(), val, err)
- stats.IncTotalExceptions()
- return
- }
- outdatas = append(outdatas, output.Bytes())
- } else {
- outdatas = [][]byte{val}
- }
- } else {
- for _, r := range j {
- var output bytes.Buffer
- err := tp.Execute(&output, r)
- if err != nil {
- logger.Warnf("sink node %s instance %d publish %s decode template error: %v", ctx.GetOpId(), ctx.GetInstanceId(), val, err)
- stats.IncTotalExceptions()
- return
- }
- outdatas = append(outdatas, output.Bytes())
- }
- }
- case error:
- outdatas = [][]byte{[]byte(fmt.Sprintf(`[{"error":"%s"}]`, val.Error()))}
- default:
- outdatas = [][]byte{[]byte(fmt.Sprintf(`[{"error":"result is not a string but found %#v"}]`, val))}
- }
- for _, outdata := range outdatas {
- outerloop:
- for {
- select {
- case <-ctx.Done():
- logger.Infof("sink node %s instance %d stops data resending", ctx.GetOpId(), ctx.GetInstanceId())
- return
- default:
- if err := sink.Collect(ctx, outdata); err != nil {
- stats.IncTotalExceptions()
- logger.Warnf("sink node %s instance %d publish %s error: %v", ctx.GetOpId(), ctx.GetInstanceId(), outdata, err)
- if retryInterval > 0 {
- time.Sleep(time.Duration(retryInterval) * time.Millisecond)
- logger.Debugf("try again")
- } else {
- break outerloop
- }
- } else {
- logger.Debugf("success")
- stats.IncTotalRecordsOut()
- signalCh <- item.index
- break outerloop
- }
- }
- }
- }
- }
- func doGetSink(name string, action map[string]interface{}) (api.Sink, error) {
- var (
- s api.Sink
- err error
- )
- switch name {
- case "log":
- s = sinks.NewLogSink()
- case "logToMemory":
- s = sinks.NewLogSinkToMemory()
- case "mqtt":
- s = &sinks.MQTTSink{}
- case "rest":
- s = &sinks.RestSink{}
- case "nop":
- s = &sinks.NopSink{}
- default:
- s, err = plugins.GetSink(name)
- if err != nil {
- return nil, err
- }
- }
- err = s.Configure(action)
- if err != nil {
- return nil, err
- }
- return s, nil
- }
- //Override defaultNode
- func (m *SinkNode) AddOutput(_ chan<- interface{}, name string) error {
- return fmt.Errorf("fail to add output %s, sink %s cannot add output", name, m.name)
- }
- //Override defaultNode
- func (m *SinkNode) Broadcast(_ interface{}) error {
- return fmt.Errorf("sink %s cannot add broadcast", m.name)
- }
- func (m *SinkNode) drainError(errCh chan<- error, err error, ctx api.StreamContext, logger api.Logger) {
- go func() {
- select {
- case errCh <- err:
- ctx.GetLogger().Errorf("error in sink %s", err)
- case <-ctx.Done():
- m.close(ctx, logger)
- }
- }()
- }
- func (m *SinkNode) close(ctx api.StreamContext, logger api.Logger) {
- for _, s := range m.sinks {
- if err := s.Close(ctx); err != nil {
- logger.Warnf("close sink fails: %v", err)
- }
- }
- if m.tch != nil {
- close(m.tch)
- m.tch = nil
- }
- }
- // Only called when checkpoint enabled
- func (m *SinkNode) SaveCache() {
- m.tch <- struct{}{}
- }
|