sink_node.go 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459
  1. package node
  2. import (
  3. "bytes"
  4. "encoding/json"
  5. "fmt"
  6. "github.com/emqx/kuiper/internal/conf"
  7. "github.com/emqx/kuiper/internal/plugin"
  8. ct "github.com/emqx/kuiper/internal/template"
  9. "github.com/emqx/kuiper/internal/topo/sink"
  10. "github.com/emqx/kuiper/pkg/api"
  11. "github.com/emqx/kuiper/pkg/cast"
  12. "sync"
  13. "text/template"
  14. "time"
  15. )
  16. type SinkNode struct {
  17. *defaultSinkNode
  18. //static
  19. sinkType string
  20. mutex sync.RWMutex
  21. //configs (also static for sinks)
  22. options map[string]interface{}
  23. isMock bool
  24. //states varies after restart
  25. sinks []api.Sink
  26. tch chan struct{} //channel to trigger cache saved, will be trigger by checkpoint only
  27. }
  28. func NewSinkNode(name string, sinkType string, props map[string]interface{}) *SinkNode {
  29. bufferLength := 1024
  30. if c, ok := props["bufferLength"]; ok {
  31. if t, err := cast.ToInt(c, cast.STRICT); err != nil || t <= 0 {
  32. //invalid property bufferLength
  33. } else {
  34. bufferLength = t
  35. }
  36. }
  37. return &SinkNode{
  38. defaultSinkNode: &defaultSinkNode{
  39. input: make(chan interface{}, bufferLength),
  40. defaultNode: &defaultNode{
  41. name: name,
  42. concurrency: 1,
  43. ctx: nil,
  44. },
  45. },
  46. sinkType: sinkType,
  47. options: props,
  48. }
  49. }
  50. //Only for mock source, do not use it in production
  51. func NewSinkNodeWithSink(name string, sink api.Sink, props map[string]interface{}) *SinkNode {
  52. return &SinkNode{
  53. defaultSinkNode: &defaultSinkNode{
  54. input: make(chan interface{}, 1024),
  55. defaultNode: &defaultNode{
  56. name: name,
  57. concurrency: 1,
  58. ctx: nil,
  59. },
  60. },
  61. sinks: []api.Sink{sink},
  62. options: props,
  63. isMock: true,
  64. }
  65. }
  66. func (m *SinkNode) Open(ctx api.StreamContext, result chan<- error) {
  67. m.ctx = ctx
  68. logger := ctx.GetLogger()
  69. logger.Debugf("open sink node %s", m.name)
  70. if m.qos >= api.AtLeastOnce {
  71. m.tch = make(chan struct{})
  72. }
  73. go func() {
  74. if c, ok := m.options["concurrency"]; ok {
  75. if t, err := cast.ToInt(c, cast.STRICT); err != nil || t <= 0 {
  76. logger.Warnf("invalid type for concurrency property, should be positive integer but found %t", c)
  77. } else {
  78. m.concurrency = t
  79. }
  80. }
  81. runAsync := false
  82. if c, ok := m.options["runAsync"]; ok {
  83. if t, ok := c.(bool); !ok {
  84. logger.Warnf("invalid type for runAsync property, should be bool but found %t", c)
  85. } else {
  86. runAsync = t
  87. }
  88. }
  89. retryInterval := 1000
  90. if c, ok := m.options["retryInterval"]; ok {
  91. if t, err := cast.ToInt(c, cast.STRICT); err != nil || t < 0 {
  92. logger.Warnf("invalid type for retryInterval property, should be positive integer but found %t", c)
  93. } else {
  94. retryInterval = t
  95. }
  96. }
  97. retryCount := 3
  98. if c, ok := m.options["retryCount"]; ok {
  99. if t, err := cast.ToInt(c, cast.STRICT); err != nil || t < 0 {
  100. logger.Warnf("invalid type for retryCount property, should be positive integer but found %t", c)
  101. } else {
  102. retryCount = t
  103. }
  104. }
  105. cacheLength := 1024
  106. if c, ok := m.options["cacheLength"]; ok {
  107. if t, err := cast.ToInt(c, cast.STRICT); err != nil || t < 0 {
  108. logger.Warnf("invalid type for cacheLength property, should be positive integer but found %t", c)
  109. } else {
  110. cacheLength = t
  111. }
  112. }
  113. cacheSaveInterval := 1000
  114. if c, ok := m.options["cacheSaveInterval"]; ok {
  115. if t, err := cast.ToInt(c, cast.STRICT); err != nil || t < 0 {
  116. logger.Warnf("invalid type for cacheSaveInterval property, should be positive integer but found %t", c)
  117. } else {
  118. cacheSaveInterval = t
  119. }
  120. }
  121. omitIfEmpty := false
  122. if c, ok := m.options["omitIfEmpty"]; ok {
  123. if t, ok := c.(bool); !ok {
  124. logger.Warnf("invalid type for omitIfEmpty property, should be a bool value 'true/false'.", c)
  125. } else {
  126. omitIfEmpty = t
  127. }
  128. }
  129. sendSingle := false
  130. if c, ok := m.options["sendSingle"]; ok {
  131. if t, ok := c.(bool); !ok {
  132. logger.Warnf("invalid type for sendSingle property, should be a bool value 'true/false'.", c)
  133. } else {
  134. sendSingle = t
  135. }
  136. }
  137. var tp *template.Template = nil
  138. if c, ok := m.options["dataTemplate"]; ok {
  139. if t, ok := c.(string); !ok {
  140. logger.Warnf("invalid type for dateTemplate property, should be a string value.", c)
  141. } else {
  142. temp, err := template.New("sink").Funcs(ct.FuncMap).Parse(t)
  143. if err != nil {
  144. msg := fmt.Sprintf("property dataTemplate %v is invalid: %v", t, err)
  145. logger.Warnf(msg)
  146. result <- fmt.Errorf(msg)
  147. return
  148. } else {
  149. tp = temp
  150. }
  151. }
  152. }
  153. m.reset()
  154. logger.Infof("open sink node %d instances", m.concurrency)
  155. for i := 0; i < m.concurrency; i++ { // workers
  156. go func(instance int) {
  157. var sink api.Sink
  158. var err error
  159. if !m.isMock {
  160. logger.Debugf("Trying to get sink for rule %s with options %v\n", ctx.GetRuleId(), m.options)
  161. sink, err = getSink(m.sinkType, m.options)
  162. if err != nil {
  163. m.drainError(result, err, ctx, logger)
  164. return
  165. }
  166. logger.Debugf("Successfully get the sink %s", m.sinkType)
  167. m.mutex.Lock()
  168. m.sinks = append(m.sinks, sink)
  169. m.mutex.Unlock()
  170. logger.Debugf("Now is to open sink for rule %s.\n", ctx.GetRuleId())
  171. if err := sink.Open(ctx); err != nil {
  172. m.drainError(result, err, ctx, logger)
  173. return
  174. }
  175. logger.Debugf("Successfully open sink for rule %s.\n", ctx.GetRuleId())
  176. } else {
  177. sink = m.sinks[instance]
  178. }
  179. stats, err := NewStatManager("sink", ctx)
  180. if err != nil {
  181. m.drainError(result, err, ctx, logger)
  182. return
  183. }
  184. m.mutex.Lock()
  185. m.statManagers = append(m.statManagers, stats)
  186. m.mutex.Unlock()
  187. if conf.Config.Sink.DisableCache {
  188. for {
  189. select {
  190. case data := <-m.input:
  191. if newdata, processed := m.preprocess(data); processed {
  192. break
  193. } else {
  194. data = newdata
  195. }
  196. stats.SetBufferLength(int64(len(m.input)))
  197. if runAsync {
  198. go doCollect(sink, data, stats, omitIfEmpty, sendSingle, tp, ctx)
  199. } else {
  200. doCollect(sink, data, stats, omitIfEmpty, sendSingle, tp, ctx)
  201. }
  202. case <-ctx.Done():
  203. logger.Infof("sink node %s instance %d done", m.name, instance)
  204. if err := sink.Close(ctx); err != nil {
  205. logger.Warnf("close sink node %s instance %d fails: %v", m.name, instance, err)
  206. }
  207. return
  208. case <-m.tch:
  209. logger.Debugf("rule %s sink receive checkpoint, do nothing", ctx.GetRuleId())
  210. }
  211. }
  212. } else {
  213. logger.Infof("Creating sink cache")
  214. var cache *Cache
  215. if m.qos >= api.AtLeastOnce {
  216. cache = NewCheckpointbasedCache(m.input, cacheLength, m.tch, result, ctx)
  217. } else {
  218. cache = NewTimebasedCache(m.input, cacheLength, cacheSaveInterval, result, ctx)
  219. }
  220. for {
  221. select {
  222. case data := <-cache.Out:
  223. if newdata, processed := m.preprocess(data.data); processed {
  224. break
  225. } else {
  226. data.data = newdata
  227. }
  228. stats.SetBufferLength(int64(len(m.input)))
  229. if runAsync {
  230. go doCollectCacheTuple(sink, data, stats, retryInterval, retryCount, omitIfEmpty, sendSingle, tp, cache.Complete, ctx)
  231. } else {
  232. doCollectCacheTuple(sink, data, stats, retryInterval, retryCount, omitIfEmpty, sendSingle, tp, cache.Complete, ctx)
  233. }
  234. case <-ctx.Done():
  235. logger.Infof("sink node %s instance %d done", m.name, instance)
  236. if err := sink.Close(ctx); err != nil {
  237. logger.Warnf("close sink node %s instance %d fails: %v", m.name, instance, err)
  238. }
  239. return
  240. }
  241. }
  242. }
  243. }(i)
  244. }
  245. }()
  246. }
  247. func (m *SinkNode) reset() {
  248. if !m.isMock {
  249. m.sinks = nil
  250. }
  251. m.statManagers = nil
  252. }
  // extractInput decodes v as a JSON array of objects.
  // It returns an error quoting the raw input when v is not such an array.
  func extractInput(v []byte) ([]map[string]interface{}, error) {
  	var records []map[string]interface{}
  	err := json.Unmarshal(v, &records)
  	if err != nil {
  		return nil, fmt.Errorf("fail to decode the input %s as json: %v", v, err)
  	}
  	return records, nil
  }
  260. func doCollect(sink api.Sink, item interface{}, stats StatManager, omitIfEmpty bool, sendSingle bool, tp *template.Template, ctx api.StreamContext) {
  261. stats.IncTotalRecordsIn()
  262. stats.ProcessTimeStart()
  263. defer stats.ProcessTimeEnd()
  264. logger := ctx.GetLogger()
  265. outdatas := getOutData(stats, ctx, item, omitIfEmpty, sendSingle, tp)
  266. for _, outdata := range outdatas {
  267. if err := sink.Collect(ctx, outdata); err != nil {
  268. stats.IncTotalExceptions()
  269. logger.Warnf("sink node %s instance %d publish %s error: %v", ctx.GetOpId(), ctx.GetInstanceId(), outdata, err)
  270. } else {
  271. stats.IncTotalRecordsOut()
  272. }
  273. }
  274. }
  275. func getOutData(stats StatManager, ctx api.StreamContext, item interface{}, omitIfEmpty bool, sendSingle bool, tp *template.Template) [][]byte {
  276. logger := ctx.GetLogger()
  277. var outdatas [][]byte
  278. switch val := item.(type) {
  279. case []byte:
  280. if omitIfEmpty && string(val) == "[{}]" {
  281. return nil
  282. }
  283. var (
  284. err error
  285. j []map[string]interface{}
  286. )
  287. if sendSingle || tp != nil {
  288. j, err = extractInput(val)
  289. if err != nil {
  290. logger.Warnf("sink node %s instance %d publish %s error: %v", ctx.GetOpId(), ctx.GetInstanceId(), val, err)
  291. stats.IncTotalExceptions()
  292. return nil
  293. }
  294. logger.Debugf("receive %d records", len(j))
  295. }
  296. if !sendSingle {
  297. if tp != nil {
  298. var output bytes.Buffer
  299. err := tp.Execute(&output, j)
  300. if err != nil {
  301. logger.Warnf("sink node %s instance %d publish %s decode template error: %v", ctx.GetOpId(), ctx.GetInstanceId(), val, err)
  302. stats.IncTotalExceptions()
  303. return nil
  304. }
  305. outdatas = append(outdatas, output.Bytes())
  306. } else {
  307. outdatas = [][]byte{val}
  308. }
  309. } else {
  310. for _, r := range j {
  311. if tp != nil {
  312. var output bytes.Buffer
  313. err := tp.Execute(&output, r)
  314. if err != nil {
  315. logger.Warnf("sink node %s instance %d publish %s decode template error: %v", ctx.GetOpId(), ctx.GetInstanceId(), val, err)
  316. stats.IncTotalExceptions()
  317. return nil
  318. }
  319. outdatas = append(outdatas, output.Bytes())
  320. } else {
  321. if ot, e := json.Marshal(r); e != nil {
  322. logger.Warnf("sink node %s instance %d publish %s marshal error: %v", ctx.GetOpId(), ctx.GetInstanceId(), r, e)
  323. stats.IncTotalExceptions()
  324. return nil
  325. } else {
  326. outdatas = append(outdatas, ot)
  327. }
  328. }
  329. }
  330. }
  331. case error:
  332. outdatas = [][]byte{[]byte(fmt.Sprintf(`[{"error":"%s"}]`, val.Error()))}
  333. default:
  334. outdatas = [][]byte{[]byte(fmt.Sprintf(`[{"error":"result is not a string but found %#v"}]`, val))}
  335. }
  336. return outdatas
  337. }
  338. func doCollectCacheTuple(sink api.Sink, item *CacheTuple, stats StatManager, retryInterval, retryCount int, omitIfEmpty bool, sendSingle bool, tp *template.Template, signalCh chan<- int, ctx api.StreamContext) {
  339. stats.IncTotalRecordsIn()
  340. stats.ProcessTimeStart()
  341. defer stats.ProcessTimeEnd()
  342. logger := ctx.GetLogger()
  343. outdatas := getOutData(stats, ctx, item.data, omitIfEmpty, sendSingle, tp)
  344. for _, outdata := range outdatas {
  345. outerloop:
  346. for {
  347. select {
  348. case <-ctx.Done():
  349. logger.Infof("sink node %s instance %d stops data resending", ctx.GetOpId(), ctx.GetInstanceId())
  350. return
  351. default:
  352. if err := sink.Collect(ctx, outdata); err != nil {
  353. stats.IncTotalExceptions()
  354. logger.Warnf("sink node %s instance %d publish %s error: %v", ctx.GetOpId(), ctx.GetInstanceId(), outdata, err)
  355. if retryInterval > 0 && retryCount > 0 {
  356. retryCount--
  357. time.Sleep(time.Duration(retryInterval) * time.Millisecond)
  358. logger.Debugf("try again")
  359. } else {
  360. break outerloop
  361. }
  362. } else {
  363. logger.Debugf("success")
  364. stats.IncTotalRecordsOut()
  365. select {
  366. case signalCh <- item.index:
  367. default:
  368. logger.Warnf("sink cache missing response for %d", item.index)
  369. }
  370. break outerloop
  371. }
  372. }
  373. }
  374. }
  375. }
  376. func doGetSink(name string, action map[string]interface{}) (api.Sink, error) {
  377. var (
  378. s api.Sink
  379. err error
  380. )
  381. switch name {
  382. case "log":
  383. s = sink.NewLogSink()
  384. case "logToMemory":
  385. s = sink.NewLogSinkToMemory()
  386. case "mqtt":
  387. s = &sink.MQTTSink{}
  388. case "rest":
  389. s = &sink.RestSink{}
  390. case "nop":
  391. s = &sink.NopSink{}
  392. default:
  393. s, err = plugin.GetSink(name)
  394. if err != nil {
  395. return nil, err
  396. }
  397. }
  398. err = s.Configure(action)
  399. if err != nil {
  400. return nil, err
  401. }
  402. return s, nil
  403. }
  404. //Override defaultNode
  405. func (m *SinkNode) AddOutput(_ chan<- interface{}, name string) error {
  406. return fmt.Errorf("fail to add output %s, sink %s cannot add output", name, m.name)
  407. }
  408. //Override defaultNode
  409. func (m *SinkNode) Broadcast(_ interface{}) error {
  410. return fmt.Errorf("sink %s cannot add broadcast", m.name)
  411. }
  412. func (m *SinkNode) drainError(errCh chan<- error, err error, ctx api.StreamContext, logger api.Logger) {
  413. go func() {
  414. select {
  415. case errCh <- err:
  416. ctx.GetLogger().Errorf("error in sink %s", err)
  417. case <-ctx.Done():
  418. m.close(ctx, logger)
  419. }
  420. }()
  421. }
  422. func (m *SinkNode) close(ctx api.StreamContext, logger api.Logger) {
  423. for _, s := range m.sinks {
  424. if err := s.Close(ctx); err != nil {
  425. logger.Warnf("close sink fails: %v", err)
  426. }
  427. }
  428. if m.tch != nil {
  429. close(m.tch)
  430. m.tch = nil
  431. }
  432. }
  433. // Only called when checkpoint enabled
  434. func (m *SinkNode) SaveCache() {
  435. m.tch <- struct{}{}
  436. }