123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213 |
- package nodes
- import (
- "github.com/emqx/kuiper/common"
- "github.com/emqx/kuiper/plugins"
- "github.com/emqx/kuiper/xsql"
- "github.com/emqx/kuiper/xstream/api"
- "github.com/emqx/kuiper/xstream/extensions"
- "sync"
- )
- type SourceNode struct {
- *defaultNode
- streamType xsql.StreamType
- sourceType string
- options map[string]string
- isMock bool
- mutex sync.RWMutex
- sources []api.Source
- }
- func NewSourceNode(name string, st xsql.StreamType, options map[string]string) *SourceNode {
- t, ok := options["TYPE"]
- if !ok {
- if st == xsql.TypeStream {
- t = "mqtt"
- } else if st == xsql.TypeTable {
- t = "file"
- }
- }
- return &SourceNode{
- sourceType: t,
- defaultNode: &defaultNode{
- name: name,
- outputs: make(map[string]chan<- interface{}),
- concurrency: 1,
- },
- options: options,
- }
- }
- const OFFSET_KEY = "$$offset"
- //Only for mock source, do not use it in production
- func NewSourceNodeWithSource(name string, source api.Source, options map[string]string) *SourceNode {
- return &SourceNode{
- sources: []api.Source{source},
- defaultNode: &defaultNode{
- name: name,
- outputs: make(map[string]chan<- interface{}),
- concurrency: 1,
- },
- options: options,
- isMock: true,
- }
- }
- func (m *SourceNode) Open(ctx api.StreamContext, errCh chan<- error) {
- m.ctx = ctx
- logger := ctx.GetLogger()
- logger.Infof("open source node %s with option %v", m.name, m.options)
- go func() {
- props := getSourceConf(ctx, m.sourceType, m.options)
- if c, ok := props["concurrency"]; ok {
- if t, err := common.ToInt(c, common.STRICT); err != nil || t <= 0 {
- logger.Warnf("invalid type for concurrency property, should be positive integer but found %t", c)
- } else {
- m.concurrency = t
- }
- }
- bl := 102400
- if c, ok := props["bufferLength"]; ok {
- if t, err := common.ToInt(c, common.STRICT); err != nil || t <= 0 {
- logger.Warnf("invalid type for bufferLength property, should be positive integer but found %t", c)
- } else {
- bl = t
- }
- }
- m.reset()
- logger.Infof("open source node %d instances", m.concurrency)
- for i := 0; i < m.concurrency; i++ { // workers
- go func(instance int) {
- //Do open source instances
- var source api.Source
- var err error
- if !m.isMock {
- source, err = getSource(m.sourceType)
- if err != nil {
- m.drainError(errCh, err, ctx, logger)
- return
- }
- err = source.Configure(m.options["DATASOURCE"], props)
- if err != nil {
- m.drainError(errCh, err, ctx, logger)
- return
- }
- m.mutex.Lock()
- m.sources = append(m.sources, source)
- m.mutex.Unlock()
- } else {
- logger.Debugf("get source instance %d from %d sources", instance, len(m.sources))
- source = m.sources[instance]
- }
- stats, err := NewStatManager("source", ctx)
- if err != nil {
- m.drainError(errCh, err, ctx, logger)
- return
- }
- m.mutex.Lock()
- m.statManagers = append(m.statManagers, stats)
- m.mutex.Unlock()
- if rw, ok := source.(api.Rewindable); ok {
- if offset, err := ctx.GetState(OFFSET_KEY); err != nil {
- m.drainError(errCh, err, ctx, logger)
- } else if offset != nil {
- logger.Infof("Source rewind from %v", offset)
- err = rw.Rewind(offset)
- if err != nil {
- m.drainError(errCh, err, ctx, logger)
- }
- }
- }
- buffer := NewDynamicChannelBuffer()
- buffer.SetLimit(bl)
- sourceErrCh := make(chan error)
- go source.Open(ctx.WithInstance(instance), buffer.In, sourceErrCh)
- logger.Infof("Start source %s instance %d successfully", m.name, instance)
- for {
- select {
- case <-ctx.Done():
- logger.Infof("source %s done", m.name)
- m.close(ctx, logger)
- buffer.Close()
- return
- case err := <-sourceErrCh:
- m.drainError(errCh, err, ctx, logger)
- return
- case data := <-buffer.Out:
- stats.IncTotalRecordsIn()
- stats.ProcessTimeStart()
- tuple := &xsql.Tuple{Emitter: m.name, Message: data.Message(), Timestamp: common.GetNowInMilli(), Metadata: data.Meta()}
- stats.ProcessTimeEnd()
- logger.Debugf("source node %s is sending tuple %+v of timestamp %d", m.name, tuple, tuple.Timestamp)
- //blocking
- m.Broadcast(tuple)
- stats.IncTotalRecordsOut()
- stats.SetBufferLength(int64(buffer.GetLength()))
- if rw, ok := source.(api.Rewindable); ok {
- if offset, err := rw.GetOffset(); err != nil {
- m.drainError(errCh, err, ctx, logger)
- } else {
- err = ctx.PutState(OFFSET_KEY, offset)
- if err != nil {
- m.drainError(errCh, err, ctx, logger)
- }
- logger.Debugf("Source save offset %v", offset)
- }
- }
- logger.Debugf("source node %s has consumed tuple of timestamp %d", m.name, tuple.Timestamp)
- }
- }
- }(i)
- }
- }()
- }
- func (m *SourceNode) reset() {
- if !m.isMock {
- m.sources = nil
- }
- m.statManagers = nil
- }
- func doGetSource(t string) (api.Source, error) {
- var (
- s api.Source
- err error
- )
- switch t {
- case "mqtt":
- s = &extensions.MQTTSource{}
- case "httppull":
- s = &extensions.HTTPPullSource{}
- case "file":
- s = &extensions.FileSource{}
- default:
- s, err = plugins.GetSource(t)
- if err != nil {
- return nil, err
- }
- }
- return s, nil
- }
- func (m *SourceNode) drainError(errCh chan<- error, err error, ctx api.StreamContext, logger api.Logger) {
- select {
- case errCh <- err:
- case <-ctx.Done():
- m.close(ctx, logger)
- }
- return
- }
- func (m *SourceNode) close(ctx api.StreamContext, logger api.Logger) {
- for _, s := range m.sources {
- if err := s.Close(ctx); err != nil {
- logger.Warnf("close source fails: %v", err)
- }
- }
- }
|