table_processor.go 3.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103
  1. // Copyright 2021 EMQ Technologies Co., Ltd.
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. package operator
  15. import (
  16. "fmt"
  17. "github.com/lf-edge/ekuiper/internal/xsql"
  18. "github.com/lf-edge/ekuiper/pkg/api"
  19. "github.com/lf-edge/ekuiper/pkg/ast"
  20. )
  21. type TableProcessor struct {
  22. //Pruned stream fields. Could be streamField(with data type info) or string
  23. defaultFieldProcessor
  24. isSchemaless bool
  25. isBatchInput bool // whether the inputs are batched, such as file which sends multiple messages at a batch. If batch input, only fires when EOF is received. This is mutual exclusive with retainSize.
  26. retainSize int // how many(maximum) messages to be retained for each output
  27. emitterName string
  28. // States
  29. output xsql.WindowTuples // current batched message collection
  30. batchEmitted bool // if batch input, this is the signal for whether the last batch has emitted. If true, reinitialize.
  31. }
  32. func NewTableProcessor(isSchemaless bool, name string, fields []interface{}, options *ast.Options) (*TableProcessor, error) {
  33. p := &TableProcessor{emitterName: name, batchEmitted: true, retainSize: 1, isSchemaless: isSchemaless}
  34. p.defaultFieldProcessor = defaultFieldProcessor{
  35. streamFields: fields, isBinary: false, timestampFormat: options.TIMESTAMP_FORMAT,
  36. strictValidation: options.STRICT_VALIDATION,
  37. }
  38. if options.RETAIN_SIZE > 0 {
  39. p.retainSize = options.RETAIN_SIZE
  40. p.isBatchInput = false
  41. } else if isBatch(options.TYPE) {
  42. p.isBatchInput = true
  43. p.retainSize = 0
  44. }
  45. return p, nil
  46. }
  47. /*
  48. * input: *xsql.Tuple or BatchCount
  49. * output: WindowTuples
  50. */
  51. func (p *TableProcessor) Apply(ctx api.StreamContext, data interface{}, fv *xsql.FunctionValuer, _ *xsql.AggregateFunctionValuer) interface{} {
  52. logger := ctx.GetLogger()
  53. tuple, ok := data.(*xsql.Tuple)
  54. if !ok {
  55. return fmt.Errorf("expect *xsql.Tuple data type")
  56. }
  57. logger.Debugf("preprocessor receive %v", tuple)
  58. if p.batchEmitted {
  59. p.output = xsql.WindowTuples{
  60. Emitter: p.emitterName,
  61. Tuples: make([]xsql.Tuple, 0),
  62. }
  63. p.batchEmitted = false
  64. }
  65. if tuple.Message != nil {
  66. if !p.isSchemaless && p.streamFields != nil {
  67. result, err := p.processField(tuple, nil)
  68. if err != nil {
  69. return fmt.Errorf("error in preprocessor: %s", err)
  70. }
  71. tuple.Message = result
  72. }
  73. var newTuples []xsql.Tuple
  74. for i, ot := range p.output.Tuples {
  75. if p.retainSize > 0 && len(p.output.Tuples) == p.retainSize && i == 0 {
  76. continue
  77. }
  78. newTuples = append(newTuples, ot)
  79. }
  80. newTuples = append(newTuples, *tuple)
  81. p.output = xsql.WindowTuples{
  82. Emitter: p.emitterName,
  83. Tuples: newTuples,
  84. }
  85. if !p.isBatchInput {
  86. return p.output
  87. }
  88. } else if p.isBatchInput { // EOF
  89. p.batchEmitted = true
  90. return p.output
  91. }
  92. return nil
  93. }
  94. func isBatch(t string) bool {
  95. return t == "file" || t == ""
  96. }