sink_node.go 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473
  1. // Copyright 2021 EMQ Technologies Co., Ltd.
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. package node
  15. import (
  16. "bytes"
  17. "encoding/json"
  18. "fmt"
  19. "github.com/lf-edge/ekuiper/internal/conf"
  20. "github.com/lf-edge/ekuiper/internal/plugin"
  21. ct "github.com/lf-edge/ekuiper/internal/template"
  22. "github.com/lf-edge/ekuiper/internal/topo/sink"
  23. "github.com/lf-edge/ekuiper/pkg/api"
  24. "github.com/lf-edge/ekuiper/pkg/cast"
  25. "sync"
  26. "text/template"
  27. "time"
  28. )
  29. type SinkNode struct {
  30. *defaultSinkNode
  31. //static
  32. sinkType string
  33. mutex sync.RWMutex
  34. //configs (also static for sinks)
  35. options map[string]interface{}
  36. isMock bool
  37. //states varies after restart
  38. sinks []api.Sink
  39. tch chan struct{} //channel to trigger cache saved, will be trigger by checkpoint only
  40. }
  41. func NewSinkNode(name string, sinkType string, props map[string]interface{}) *SinkNode {
  42. bufferLength := 1024
  43. if c, ok := props["bufferLength"]; ok {
  44. if t, err := cast.ToInt(c, cast.STRICT); err != nil || t <= 0 {
  45. //invalid property bufferLength
  46. } else {
  47. bufferLength = t
  48. }
  49. }
  50. return &SinkNode{
  51. defaultSinkNode: &defaultSinkNode{
  52. input: make(chan interface{}, bufferLength),
  53. defaultNode: &defaultNode{
  54. name: name,
  55. concurrency: 1,
  56. ctx: nil,
  57. },
  58. },
  59. sinkType: sinkType,
  60. options: props,
  61. }
  62. }
  63. //Only for mock source, do not use it in production
  64. func NewSinkNodeWithSink(name string, sink api.Sink, props map[string]interface{}) *SinkNode {
  65. return &SinkNode{
  66. defaultSinkNode: &defaultSinkNode{
  67. input: make(chan interface{}, 1024),
  68. defaultNode: &defaultNode{
  69. name: name,
  70. concurrency: 1,
  71. ctx: nil,
  72. },
  73. },
  74. sinks: []api.Sink{sink},
  75. options: props,
  76. isMock: true,
  77. }
  78. }
  79. func (m *SinkNode) Open(ctx api.StreamContext, result chan<- error) {
  80. m.ctx = ctx
  81. logger := ctx.GetLogger()
  82. logger.Debugf("open sink node %s", m.name)
  83. if m.qos >= api.AtLeastOnce {
  84. m.tch = make(chan struct{})
  85. }
  86. go func() {
  87. if c, ok := m.options["concurrency"]; ok {
  88. if t, err := cast.ToInt(c, cast.STRICT); err != nil || t <= 0 {
  89. logger.Warnf("invalid type for concurrency property, should be positive integer but found %t", c)
  90. } else {
  91. m.concurrency = t
  92. }
  93. }
  94. runAsync := false
  95. if c, ok := m.options["runAsync"]; ok {
  96. if t, ok := c.(bool); !ok {
  97. logger.Warnf("invalid type for runAsync property, should be bool but found %t", c)
  98. } else {
  99. runAsync = t
  100. }
  101. }
  102. retryInterval := 1000
  103. if c, ok := m.options["retryInterval"]; ok {
  104. if t, err := cast.ToInt(c, cast.STRICT); err != nil || t < 0 {
  105. logger.Warnf("invalid type for retryInterval property, should be positive integer but found %t", c)
  106. } else {
  107. retryInterval = t
  108. }
  109. }
  110. retryCount := 3
  111. if c, ok := m.options["retryCount"]; ok {
  112. if t, err := cast.ToInt(c, cast.STRICT); err != nil || t < 0 {
  113. logger.Warnf("invalid type for retryCount property, should be positive integer but found %t", c)
  114. } else {
  115. retryCount = t
  116. }
  117. }
  118. cacheLength := 1024
  119. if c, ok := m.options["cacheLength"]; ok {
  120. if t, err := cast.ToInt(c, cast.STRICT); err != nil || t < 0 {
  121. logger.Warnf("invalid type for cacheLength property, should be positive integer but found %t", c)
  122. } else {
  123. cacheLength = t
  124. }
  125. }
  126. cacheSaveInterval := 1000
  127. if c, ok := m.options["cacheSaveInterval"]; ok {
  128. if t, err := cast.ToInt(c, cast.STRICT); err != nil || t < 0 {
  129. logger.Warnf("invalid type for cacheSaveInterval property, should be positive integer but found %t", c)
  130. } else {
  131. cacheSaveInterval = t
  132. }
  133. }
  134. omitIfEmpty := false
  135. if c, ok := m.options["omitIfEmpty"]; ok {
  136. if t, ok := c.(bool); !ok {
  137. logger.Warnf("invalid type for omitIfEmpty property, should be a bool value 'true/false'.", c)
  138. } else {
  139. omitIfEmpty = t
  140. }
  141. }
  142. sendSingle := false
  143. if c, ok := m.options["sendSingle"]; ok {
  144. if t, ok := c.(bool); !ok {
  145. logger.Warnf("invalid type for sendSingle property, should be a bool value 'true/false'.", c)
  146. } else {
  147. sendSingle = t
  148. }
  149. }
  150. var tp *template.Template = nil
  151. if c, ok := m.options["dataTemplate"]; ok {
  152. if t, ok := c.(string); !ok {
  153. logger.Warnf("invalid type for dateTemplate property, should be a string value.", c)
  154. } else {
  155. temp, err := template.New("sink").Funcs(ct.FuncMap).Parse(t)
  156. if err != nil {
  157. msg := fmt.Sprintf("property dataTemplate %v is invalid: %v", t, err)
  158. logger.Warnf(msg)
  159. result <- fmt.Errorf(msg)
  160. return
  161. } else {
  162. tp = temp
  163. }
  164. }
  165. }
  166. m.reset()
  167. logger.Infof("open sink node %d instances", m.concurrency)
  168. for i := 0; i < m.concurrency; i++ { // workers
  169. go func(instance int) {
  170. var sink api.Sink
  171. var err error
  172. if !m.isMock {
  173. logger.Debugf("Trying to get sink for rule %s with options %v\n", ctx.GetRuleId(), m.options)
  174. sink, err = getSink(m.sinkType, m.options)
  175. if err != nil {
  176. m.drainError(result, err, ctx, logger)
  177. return
  178. }
  179. logger.Debugf("Successfully get the sink %s", m.sinkType)
  180. m.mutex.Lock()
  181. m.sinks = append(m.sinks, sink)
  182. m.mutex.Unlock()
  183. logger.Debugf("Now is to open sink for rule %s.\n", ctx.GetRuleId())
  184. if err := sink.Open(ctx); err != nil {
  185. m.drainError(result, err, ctx, logger)
  186. return
  187. }
  188. logger.Debugf("Successfully open sink for rule %s.\n", ctx.GetRuleId())
  189. } else {
  190. sink = m.sinks[instance]
  191. }
  192. stats, err := NewStatManager("sink", ctx)
  193. if err != nil {
  194. m.drainError(result, err, ctx, logger)
  195. return
  196. }
  197. m.mutex.Lock()
  198. m.statManagers = append(m.statManagers, stats)
  199. m.mutex.Unlock()
  200. if conf.Config.Sink.DisableCache {
  201. for {
  202. select {
  203. case data := <-m.input:
  204. if newdata, processed := m.preprocess(data); processed {
  205. break
  206. } else {
  207. data = newdata
  208. }
  209. stats.SetBufferLength(int64(len(m.input)))
  210. if runAsync {
  211. go doCollect(sink, data, stats, omitIfEmpty, sendSingle, tp, ctx)
  212. } else {
  213. doCollect(sink, data, stats, omitIfEmpty, sendSingle, tp, ctx)
  214. }
  215. case <-ctx.Done():
  216. logger.Infof("sink node %s instance %d done", m.name, instance)
  217. if err := sink.Close(ctx); err != nil {
  218. logger.Warnf("close sink node %s instance %d fails: %v", m.name, instance, err)
  219. }
  220. return
  221. case <-m.tch:
  222. logger.Debugf("rule %s sink receive checkpoint, do nothing", ctx.GetRuleId())
  223. }
  224. }
  225. } else {
  226. logger.Infof("Creating sink cache")
  227. var cache *Cache
  228. if m.qos >= api.AtLeastOnce {
  229. cache = NewCheckpointbasedCache(m.input, cacheLength, m.tch, result, ctx)
  230. } else {
  231. cache = NewTimebasedCache(m.input, cacheLength, cacheSaveInterval, result, ctx)
  232. }
  233. for {
  234. select {
  235. case data := <-cache.Out:
  236. if newdata, processed := m.preprocess(data.data); processed {
  237. break
  238. } else {
  239. data.data = newdata
  240. }
  241. stats.SetBufferLength(int64(len(m.input)))
  242. if runAsync {
  243. go doCollectCacheTuple(sink, data, stats, retryInterval, retryCount, omitIfEmpty, sendSingle, tp, cache.Complete, ctx)
  244. } else {
  245. doCollectCacheTuple(sink, data, stats, retryInterval, retryCount, omitIfEmpty, sendSingle, tp, cache.Complete, ctx)
  246. }
  247. case <-ctx.Done():
  248. logger.Infof("sink node %s instance %d done", m.name, instance)
  249. if err := sink.Close(ctx); err != nil {
  250. logger.Warnf("close sink node %s instance %d fails: %v", m.name, instance, err)
  251. }
  252. return
  253. }
  254. }
  255. }
  256. }(i)
  257. }
  258. }()
  259. }
  260. func (m *SinkNode) reset() {
  261. if !m.isMock {
  262. m.sinks = nil
  263. }
  264. m.statManagers = nil
  265. }
  266. func extractInput(v []byte) ([]map[string]interface{}, error) {
  267. var j []map[string]interface{}
  268. if err := json.Unmarshal(v, &j); err != nil {
  269. return nil, fmt.Errorf("fail to decode the input %s as json: %v", v, err)
  270. }
  271. return j, nil
  272. }
  273. func doCollect(sink api.Sink, item interface{}, stats StatManager, omitIfEmpty bool, sendSingle bool, tp *template.Template, ctx api.StreamContext) {
  274. stats.IncTotalRecordsIn()
  275. stats.ProcessTimeStart()
  276. defer stats.ProcessTimeEnd()
  277. logger := ctx.GetLogger()
  278. outdatas := getOutData(stats, ctx, item, omitIfEmpty, sendSingle, tp)
  279. for _, outdata := range outdatas {
  280. if err := sink.Collect(ctx, outdata); err != nil {
  281. stats.IncTotalExceptions()
  282. logger.Warnf("sink node %s instance %d publish %s error: %v", ctx.GetOpId(), ctx.GetInstanceId(), outdata, err)
  283. } else {
  284. stats.IncTotalRecordsOut()
  285. }
  286. }
  287. }
  288. func getOutData(stats StatManager, ctx api.StreamContext, item interface{}, omitIfEmpty bool, sendSingle bool, tp *template.Template) [][]byte {
  289. logger := ctx.GetLogger()
  290. var outdatas [][]byte
  291. switch val := item.(type) {
  292. case []byte:
  293. if omitIfEmpty && string(val) == "[{}]" {
  294. return nil
  295. }
  296. var (
  297. err error
  298. j []map[string]interface{}
  299. )
  300. if sendSingle || tp != nil {
  301. j, err = extractInput(val)
  302. if err != nil {
  303. logger.Warnf("sink node %s instance %d publish %s error: %v", ctx.GetOpId(), ctx.GetInstanceId(), val, err)
  304. stats.IncTotalExceptions()
  305. return nil
  306. }
  307. logger.Debugf("receive %d records", len(j))
  308. }
  309. if !sendSingle {
  310. if tp != nil {
  311. var output bytes.Buffer
  312. err := tp.Execute(&output, j)
  313. if err != nil {
  314. logger.Warnf("sink node %s instance %d publish %s decode template error: %v", ctx.GetOpId(), ctx.GetInstanceId(), val, err)
  315. stats.IncTotalExceptions()
  316. return nil
  317. }
  318. outdatas = append(outdatas, output.Bytes())
  319. } else {
  320. outdatas = [][]byte{val}
  321. }
  322. } else {
  323. for _, r := range j {
  324. if tp != nil {
  325. var output bytes.Buffer
  326. err := tp.Execute(&output, r)
  327. if err != nil {
  328. logger.Warnf("sink node %s instance %d publish %s decode template error: %v", ctx.GetOpId(), ctx.GetInstanceId(), val, err)
  329. stats.IncTotalExceptions()
  330. return nil
  331. }
  332. outdatas = append(outdatas, output.Bytes())
  333. } else {
  334. if ot, e := json.Marshal(r); e != nil {
  335. logger.Warnf("sink node %s instance %d publish %s marshal error: %v", ctx.GetOpId(), ctx.GetInstanceId(), r, e)
  336. stats.IncTotalExceptions()
  337. return nil
  338. } else {
  339. outdatas = append(outdatas, ot)
  340. }
  341. }
  342. }
  343. }
  344. case error:
  345. outdatas = [][]byte{[]byte(fmt.Sprintf(`[{"error":"%s"}]`, val.Error()))}
  346. default:
  347. outdatas = [][]byte{[]byte(fmt.Sprintf(`[{"error":"result is not a string but found %#v"}]`, val))}
  348. }
  349. return outdatas
  350. }
  351. func doCollectCacheTuple(sink api.Sink, item *CacheTuple, stats StatManager, retryInterval, retryCount int, omitIfEmpty bool, sendSingle bool, tp *template.Template, signalCh chan<- int, ctx api.StreamContext) {
  352. stats.IncTotalRecordsIn()
  353. stats.ProcessTimeStart()
  354. defer stats.ProcessTimeEnd()
  355. logger := ctx.GetLogger()
  356. outdatas := getOutData(stats, ctx, item.data, omitIfEmpty, sendSingle, tp)
  357. for _, outdata := range outdatas {
  358. outerloop:
  359. for {
  360. select {
  361. case <-ctx.Done():
  362. logger.Infof("sink node %s instance %d stops data resending", ctx.GetOpId(), ctx.GetInstanceId())
  363. return
  364. default:
  365. if err := sink.Collect(ctx, outdata); err != nil {
  366. stats.IncTotalExceptions()
  367. logger.Warnf("sink node %s instance %d publish %s error: %v", ctx.GetOpId(), ctx.GetInstanceId(), outdata, err)
  368. if retryInterval > 0 && retryCount > 0 {
  369. retryCount--
  370. time.Sleep(time.Duration(retryInterval) * time.Millisecond)
  371. logger.Debugf("try again")
  372. } else {
  373. break outerloop
  374. }
  375. } else {
  376. logger.Debugf("success")
  377. stats.IncTotalRecordsOut()
  378. select {
  379. case signalCh <- item.index:
  380. default:
  381. logger.Warnf("sink cache missing response for %d", item.index)
  382. }
  383. break outerloop
  384. }
  385. }
  386. }
  387. }
  388. }
  389. func doGetSink(name string, action map[string]interface{}) (api.Sink, error) {
  390. var (
  391. s api.Sink
  392. err error
  393. )
  394. switch name {
  395. case "log":
  396. s = sink.NewLogSink()
  397. case "logToMemory":
  398. s = sink.NewLogSinkToMemory()
  399. case "mqtt":
  400. s = &sink.MQTTSink{}
  401. case "rest":
  402. s = &sink.RestSink{}
  403. case "nop":
  404. s = &sink.NopSink{}
  405. default:
  406. s, err = plugin.GetSink(name)
  407. if err != nil {
  408. return nil, err
  409. }
  410. }
  411. err = s.Configure(action)
  412. if err != nil {
  413. return nil, err
  414. }
  415. return s, nil
  416. }
  417. //Override defaultNode
  418. func (m *SinkNode) AddOutput(_ chan<- interface{}, name string) error {
  419. return fmt.Errorf("fail to add output %s, sink %s cannot add output", name, m.name)
  420. }
  421. //Override defaultNode
  422. func (m *SinkNode) Broadcast(_ interface{}) error {
  423. return fmt.Errorf("sink %s cannot add broadcast", m.name)
  424. }
  425. func (m *SinkNode) drainError(errCh chan<- error, err error, ctx api.StreamContext, logger api.Logger) {
  426. go func() {
  427. select {
  428. case errCh <- err:
  429. ctx.GetLogger().Errorf("error in sink %s", err)
  430. case <-ctx.Done():
  431. m.close(ctx, logger)
  432. }
  433. }()
  434. }
  435. func (m *SinkNode) close(ctx api.StreamContext, logger api.Logger) {
  436. for _, s := range m.sinks {
  437. if err := s.Close(ctx); err != nil {
  438. logger.Warnf("close sink fails: %v", err)
  439. }
  440. }
  441. if m.tch != nil {
  442. close(m.tch)
  443. m.tch = nil
  444. }
  445. }
  446. // Only called when checkpoint enabled
  447. func (m *SinkNode) SaveCache() {
  448. m.tch <- struct{}{}
  449. }