barrier_handler.go 5.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180
  1. package checkpoints
  2. import "github.com/emqx/kuiper/xstream/api"
  3. type BarrierHandler interface {
  4. Process(data *BufferOrEvent, ctx api.StreamContext) bool //If data is barrier return true, else return false
  5. SetOutput(chan<- *BufferOrEvent) //It is using for block a channel
  6. }
  7. //For qos 1, simple track barriers
  8. type BarrierTracker struct {
  9. responder Responder
  10. inputCount int
  11. pendingCheckpoints map[int64]int
  12. }
  13. func NewBarrierTracker(responder Responder, inputCount int) *BarrierTracker {
  14. return &BarrierTracker{
  15. responder: responder,
  16. inputCount: inputCount,
  17. pendingCheckpoints: make(map[int64]int),
  18. }
  19. }
  20. func (h *BarrierTracker) Process(data *BufferOrEvent, ctx api.StreamContext) bool {
  21. d := data.Data
  22. if b, ok := d.(*Barrier); ok {
  23. h.processBarrier(b, ctx)
  24. return true
  25. }
  26. return false
  27. }
  28. func (h *BarrierTracker) SetOutput(_ chan<- *BufferOrEvent) {
  29. //do nothing, does not need it
  30. }
  31. func (h *BarrierTracker) processBarrier(b *Barrier, ctx api.StreamContext) {
  32. logger := ctx.GetLogger()
  33. if h.inputCount == 1 {
  34. err := h.responder.TriggerCheckpoint(b.CheckpointId)
  35. if err != nil {
  36. logger.Errorf("trigger checkpoint for %s err: %s", h.responder.GetName(), err)
  37. }
  38. return
  39. }
  40. if c, ok := h.pendingCheckpoints[b.CheckpointId]; ok {
  41. c += 1
  42. if c == h.inputCount {
  43. err := h.responder.TriggerCheckpoint(b.CheckpointId)
  44. if err != nil {
  45. logger.Errorf("trigger checkpoint for %s err: %s", h.responder.GetName(), err)
  46. return
  47. }
  48. delete(h.pendingCheckpoints, b.CheckpointId)
  49. for cid := range h.pendingCheckpoints {
  50. if cid < b.CheckpointId {
  51. delete(h.pendingCheckpoints, cid)
  52. }
  53. }
  54. } else {
  55. h.pendingCheckpoints[b.CheckpointId] = c
  56. }
  57. } else {
  58. h.pendingCheckpoints[b.CheckpointId] = 1
  59. }
  60. }
  61. //For qos 2, block an input until all barriers are received
  62. type BarrierAligner struct {
  63. responder Responder
  64. inputCount int
  65. currentCheckpointId int64
  66. output chan<- *BufferOrEvent
  67. blockedChannels map[string]bool
  68. buffer []*BufferOrEvent
  69. }
  70. func NewBarrierAligner(responder Responder, inputCount int) *BarrierAligner {
  71. ba := &BarrierAligner{
  72. responder: responder,
  73. inputCount: inputCount,
  74. blockedChannels: make(map[string]bool),
  75. }
  76. return ba
  77. }
  78. func (h *BarrierAligner) Process(data *BufferOrEvent, ctx api.StreamContext) bool {
  79. switch d := data.Data.(type) {
  80. case *Barrier:
  81. h.processBarrier(d, ctx)
  82. return true
  83. default:
  84. //If blocking, save to buffer
  85. if h.inputCount > 1 && len(h.blockedChannels) > 0 {
  86. if _, ok := h.blockedChannels[data.Channel]; ok {
  87. h.buffer = append(h.buffer, data)
  88. return true
  89. }
  90. }
  91. }
  92. return false
  93. }
  94. func (h *BarrierAligner) processBarrier(b *Barrier, ctx api.StreamContext) {
  95. logger := ctx.GetLogger()
  96. logger.Debugf("Aligner process barrier %+v", b)
  97. if h.inputCount == 1 {
  98. if b.CheckpointId > h.currentCheckpointId {
  99. h.currentCheckpointId = b.CheckpointId
  100. err := h.responder.TriggerCheckpoint(b.CheckpointId)
  101. if err != nil {
  102. logger.Errorf("trigger checkpoint for %s err: %s", h.responder.GetName(), err)
  103. }
  104. }
  105. return
  106. }
  107. if len(h.blockedChannels) > 0 {
  108. if b.CheckpointId == h.currentCheckpointId {
  109. h.onBarrier(b.OpId, ctx)
  110. } else if b.CheckpointId > h.currentCheckpointId {
  111. logger.Infof("Received checkpoint barrier for checkpoint %d before complete current checkpoint %d. Skipping current checkpoint.", b.CheckpointId, h.currentCheckpointId)
  112. //TODO Abort checkpoint
  113. h.releaseBlocksAndResetBarriers()
  114. h.beginNewAlignment(b, ctx)
  115. } else {
  116. return
  117. }
  118. } else if b.CheckpointId > h.currentCheckpointId {
  119. logger.Debugf("Aligner process new alignment", b)
  120. h.beginNewAlignment(b, ctx)
  121. } else {
  122. return
  123. }
  124. if len(h.blockedChannels) == h.inputCount {
  125. logger.Debugf("Received all barriers, triggering checkpoint %d", b.CheckpointId)
  126. err := h.responder.TriggerCheckpoint(b.CheckpointId)
  127. if err != nil {
  128. logger.Errorf("trigger checkpoint for %s err: %s", h.responder.GetName(), err)
  129. return
  130. }
  131. h.releaseBlocksAndResetBarriers()
  132. // clean up all the buffer
  133. var temp []*BufferOrEvent
  134. for _, d := range h.buffer {
  135. temp = append(temp, d)
  136. }
  137. go func() {
  138. for _, d := range temp {
  139. h.output <- d
  140. }
  141. }()
  142. h.buffer = make([]*BufferOrEvent, 0)
  143. }
  144. }
  145. func (h *BarrierAligner) onBarrier(name string, ctx api.StreamContext) {
  146. logger := ctx.GetLogger()
  147. if _, ok := h.blockedChannels[name]; !ok {
  148. h.blockedChannels[name] = true
  149. logger.Debugf("Received barrier from channel %s", name)
  150. }
  151. }
  152. func (h *BarrierAligner) SetOutput(output chan<- *BufferOrEvent) {
  153. h.output = output
  154. }
  155. func (h *BarrierAligner) releaseBlocksAndResetBarriers() {
  156. h.blockedChannels = make(map[string]bool)
  157. }
  158. func (h *BarrierAligner) beginNewAlignment(barrier *Barrier, ctx api.StreamContext) {
  159. logger := ctx.GetLogger()
  160. h.currentCheckpointId = barrier.CheckpointId
  161. h.onBarrier(barrier.OpId, ctx)
  162. logger.Debugf("Starting stream alignment for checkpoint %d", barrier.CheckpointId)
  163. }