xsql_processor.go 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434
  1. package processors
  2. import (
  3. "bytes"
  4. "encoding/json"
  5. "engine/common"
  6. "engine/xsql"
  7. "engine/xsql/plans"
  8. "engine/xstream"
  9. "engine/xstream/extensions"
  10. "engine/xstream/operators"
  11. "engine/xstream/sinks"
  12. "fmt"
  13. "github.com/dgraph-io/badger"
  14. "path"
  15. "strings"
  16. )
// log is the package-level logger, aliased from common.Log so the
// processors in this file can call it directly.
var log = common.Log
  18. type StreamProcessor struct {
  19. statement string
  20. badgerDir string
  21. }
  22. //@params s : the sql string of create stream statement
  23. //@params d : the directory of the badger DB to save the stream info
  24. func NewStreamProcessor(s, d string) *StreamProcessor {
  25. processor := &StreamProcessor{
  26. statement: s,
  27. badgerDir: d,
  28. }
  29. return processor
  30. }
  31. func (p *StreamProcessor) Exec() (result []string, err error) {
  32. parser := xsql.NewParser(strings.NewReader(p.statement))
  33. stmt, err := xsql.Language.Parse(parser)
  34. if err != nil {
  35. return
  36. }
  37. db, err := common.DbOpen(p.badgerDir)
  38. if err != nil {
  39. return
  40. }
  41. defer common.DbClose(db)
  42. switch s := stmt.(type) {
  43. case *xsql.StreamStmt:
  44. var r string
  45. r, err = p.execCreateStream(s, db)
  46. result = append(result, r)
  47. case *xsql.ShowStreamsStatement:
  48. result, err = p.execShowStream(s, db)
  49. case *xsql.DescribeStreamStatement:
  50. var r string
  51. r, err = p.execDescribeStream(s, db)
  52. result = append(result, r)
  53. case *xsql.ExplainStreamStatement:
  54. var r string
  55. r, err = p.execExplainStream(s, db)
  56. result = append(result, r)
  57. case *xsql.DropStreamStatement:
  58. var r string
  59. r, err = p.execDropStream(s, db)
  60. result = append(result, r)
  61. }
  62. return
  63. }
  64. func (p *StreamProcessor) execCreateStream(stmt *xsql.StreamStmt, db *badger.DB) (string, error) {
  65. err := common.DbSet(db, string(stmt.Name), p.statement)
  66. if err != nil {
  67. return "", err
  68. }else{
  69. return fmt.Sprintf("stream %s created", stmt.Name), nil
  70. }
  71. }
  72. func (p *StreamProcessor) execShowStream(stmt *xsql.ShowStreamsStatement, db *badger.DB) ([]string,error) {
  73. keys, err := common.DbKeys(db)
  74. if len(keys) == 0 {
  75. keys = append(keys, "no stream definition found")
  76. }
  77. return keys, err
  78. }
  79. func (p *StreamProcessor) execDescribeStream(stmt *xsql.DescribeStreamStatement, db *badger.DB) (string,error) {
  80. s, err := common.DbGet(db, string(stmt.Name))
  81. if err != nil {
  82. return "", fmt.Errorf("stream %s not found", stmt.Name)
  83. }
  84. parser := xsql.NewParser(strings.NewReader(s))
  85. stream, err := xsql.Language.Parse(parser)
  86. streamStmt, ok := stream.(*xsql.StreamStmt)
  87. if !ok{
  88. return "", fmt.Errorf("error resolving the stream %s, the data in db may be corrupted", stmt.Name)
  89. }
  90. var buff bytes.Buffer
  91. buff.WriteString("Fields\n--------------------------------------------------------------------------------\n")
  92. for _, f := range streamStmt.StreamFields {
  93. buff.WriteString(f.Name + "\t")
  94. xsql.PrintFieldType(f.FieldType, &buff)
  95. buff.WriteString("\n")
  96. }
  97. buff.WriteString("\n")
  98. common.PrintMap(streamStmt.Options, &buff)
  99. return buff.String(), err
  100. }
  101. func (p *StreamProcessor) execExplainStream(stmt *xsql.ExplainStreamStatement, db *badger.DB) (string,error) {
  102. _, err := common.DbGet(db, string(stmt.Name))
  103. if err != nil{
  104. return "", fmt.Errorf("stream %s not found", stmt.Name)
  105. }
  106. return "TO BE SUPPORTED", nil
  107. }
  108. func (p *StreamProcessor) execDropStream(stmt *xsql.DropStreamStatement, db *badger.DB) (string, error) {
  109. err := common.DbDelete(db, string(stmt.Name))
  110. if err != nil {
  111. return "", err
  112. }else{
  113. return fmt.Sprintf("stream %s dropped", stmt.Name), nil
  114. }
  115. }
  116. func GetStream(db *badger.DB, name string) (stmt *xsql.StreamStmt, err error){
  117. s, err := common.DbGet(db, name)
  118. if err != nil {
  119. return
  120. }
  121. parser := xsql.NewParser(strings.NewReader(s))
  122. stream, err := xsql.Language.Parse(parser)
  123. stmt, ok := stream.(*xsql.StreamStmt)
  124. if !ok{
  125. err = fmt.Errorf("error resolving the stream %s, the data in db may be corrupted", name)
  126. }
  127. return
  128. }
  129. type RuleProcessor struct {
  130. badgerDir string
  131. }
  132. func NewRuleProcessor(d string) *RuleProcessor {
  133. processor := &RuleProcessor{
  134. badgerDir: d,
  135. }
  136. return processor
  137. }
  138. func (p *RuleProcessor) ExecCreate(name, ruleJson string) (*xstream.Rule, error) {
  139. rule, err := p.getRuleByJson(name, ruleJson)
  140. if err != nil {
  141. return nil, err
  142. }
  143. db, err := common.DbOpen(path.Join(p.badgerDir, "rule"))
  144. if err != nil {
  145. return nil, err
  146. }
  147. err = common.DbSet(db, string(name), ruleJson)
  148. if err != nil {
  149. common.DbClose(db)
  150. return nil, err
  151. }else{
  152. log.Infof("rule %s created", name)
  153. common.DbClose(db)
  154. }
  155. return rule, nil
  156. }
  157. func (p *RuleProcessor) GetRuleByName(name string) (*xstream.Rule, error) {
  158. db, err := common.DbOpen(path.Join(p.badgerDir, "rule"))
  159. if err != nil {
  160. return nil, err
  161. }
  162. defer common.DbClose(db)
  163. s, err := common.DbGet(db, string(name))
  164. if err != nil {
  165. return nil, fmt.Errorf("rule %s not found", name)
  166. }
  167. return p.getRuleByJson(name, s)
  168. }
  169. func (p *RuleProcessor) getRuleByJson(name, ruleJson string) (*xstream.Rule, error) {
  170. var rule xstream.Rule
  171. if err := json.Unmarshal([]byte(ruleJson), &rule); err != nil {
  172. return nil, fmt.Errorf("parse rule %s error : %s", ruleJson, err)
  173. }
  174. rule.Id = name
  175. //validation
  176. if name == ""{
  177. return nil, fmt.Errorf("missing rule id")
  178. }
  179. if rule.Sql == ""{
  180. return nil, fmt.Errorf("missing rule sql")
  181. }
  182. if rule.Actions == nil || len(rule.Actions) == 0{
  183. return nil, fmt.Errorf("missing rule actions")
  184. }
  185. return &rule, nil
  186. }
  187. func (p *RuleProcessor) ExecInitRule(rule *xstream.Rule) (*xstream.TopologyNew, error) {
  188. if tp, inputs, err := p.createTopo(rule); err != nil {
  189. return nil, err
  190. }else{
  191. for _, m := range rule.Actions {
  192. for name, action := range m {
  193. switch name {
  194. case "log":
  195. log.Printf("Create log sink with %s", action)
  196. tp.AddSink(inputs, sinks.NewLogSink("sink_log", rule.Id))
  197. case "mqtt":
  198. log.Printf("Create mqtt sink with %s", action)
  199. if ms, err := sinks.NewMqttSink("mqtt_log", rule.Id, action); err != nil{
  200. return nil, err
  201. }else{
  202. tp.AddSink(inputs, ms)
  203. }
  204. default:
  205. return nil, fmt.Errorf("unsupported action: %s", name)
  206. }
  207. }
  208. }
  209. return tp, nil
  210. }
  211. }
  212. func (p *RuleProcessor) ExecQuery(ruleid, sql string) (*xstream.TopologyNew, error) {
  213. if tp, inputs, err := p.createTopo(&xstream.Rule{Id: ruleid, Sql: sql}); err != nil {
  214. return nil, err
  215. } else {
  216. tp.AddSink(inputs, sinks.NewLogSinkToMemory("sink_log", ruleid))
  217. go func() {
  218. select {
  219. case err := <-tp.Open():
  220. log.Println(err)
  221. tp.Cancel()
  222. }
  223. }()
  224. return tp, nil
  225. }
  226. }
  227. func (p *RuleProcessor) ExecDesc(name string) (string, error) {
  228. db, err := common.DbOpen(path.Join(p.badgerDir, "rule"))
  229. if err != nil {
  230. return "", err
  231. }
  232. defer common.DbClose(db)
  233. s, err := common.DbGet(db, string(name))
  234. if err != nil {
  235. return "", fmt.Errorf("rule %s not found", name)
  236. }
  237. dst := &bytes.Buffer{}
  238. if err := json.Indent(dst, []byte(s), "", " "); err != nil {
  239. return "", err
  240. }
  241. return fmt.Sprintln(dst.String()), nil
  242. }
  243. func (p *RuleProcessor) ExecShow() (string, error) {
  244. keys, err := p.GetAllRules()
  245. if err != nil{
  246. return "", err
  247. }
  248. if len(keys) == 0 {
  249. keys = append(keys, "no rule definition found")
  250. }
  251. var result string
  252. for _, c := range keys{
  253. result = result + fmt.Sprintln(c)
  254. }
  255. return result, nil
  256. }
  257. func (p *RuleProcessor) GetAllRules() ([]string, error) {
  258. db, err := common.DbOpen(path.Join(p.badgerDir, "rule"))
  259. if err != nil {
  260. return nil, err
  261. }
  262. defer common.DbClose(db)
  263. return common.DbKeys(db)
  264. }
  265. func (p *RuleProcessor) ExecDrop(name string) (string, error) {
  266. db, err := common.DbOpen(path.Join(p.badgerDir, "rule"))
  267. if err != nil {
  268. return "", err
  269. }
  270. defer common.DbClose(db)
  271. err = common.DbDelete(db, string(name))
  272. if err != nil {
  273. return "", err
  274. }else{
  275. return fmt.Sprintf("rule %s dropped", name), nil
  276. }
  277. }
// createTopo builds the topology for rule by delegating to
// createTopoWithSources with nil sources, which makes that function
// create the sources itself from the stored stream definitions.
func (p *RuleProcessor) createTopo(rule *xstream.Rule) (*xstream.TopologyNew, []xstream.Emitter, error) {
	return p.createTopoWithSources(rule, nil)
}
  281. //For test to mock source
  282. func (p *RuleProcessor) createTopoWithSources(rule *xstream.Rule, sources []xstream.Source) (*xstream.TopologyNew, []xstream.Emitter, error){
  283. name := rule.Id
  284. sql := rule.Sql
  285. var isEventTime bool
  286. var lateTol int64
  287. if iet, ok := rule.Options["isEventTime"]; ok{
  288. isEventTime, ok = iet.(bool)
  289. if !ok{
  290. return nil, nil, fmt.Errorf("invalid rule option isEventTime %v, bool type required", iet)
  291. }
  292. }
  293. if isEventTime {
  294. if l, ok := rule.Options["lateTolerance"]; ok{
  295. if fl, ok := l.(float64); ok{
  296. lateTol = int64(fl)
  297. }else{
  298. return nil, nil, fmt.Errorf("invalid rule option lateTolerance %v, int type required", l)
  299. }
  300. }
  301. }
  302. shouldCreateSource := sources == nil
  303. parser := xsql.NewParser(strings.NewReader(sql))
  304. if stmt, err := xsql.Language.Parse(parser); err != nil{
  305. return nil, nil, fmt.Errorf("parse sql %s error: %s", sql , err)
  306. }else {
  307. if selectStmt, ok := stmt.(*xsql.SelectStatement); !ok {
  308. return nil, nil, fmt.Errorf("sql %s is not a select statement", sql)
  309. } else {
  310. tp := xstream.NewWithName(name)
  311. var inputs []xstream.Emitter
  312. streamsFromStmt := xsql.GetStreams(selectStmt)
  313. if !shouldCreateSource && len(streamsFromStmt) != len(sources){
  314. return nil, nil, fmt.Errorf("invalid parameter sources or streams, the length cannot match the statement, expect %d sources", len(streamsFromStmt))
  315. }
  316. db, err := common.DbOpen(path.Join(p.badgerDir, "stream"))
  317. if err != nil {
  318. return nil, nil, err
  319. }
  320. defer common.DbClose(db)
  321. for i, s := range streamsFromStmt {
  322. streamStmt, err := GetStream(db, s)
  323. if err != nil {
  324. return nil, nil, err
  325. }
  326. pp, err := plans.NewPreprocessor(streamStmt, isEventTime)
  327. if err != nil{
  328. return nil, nil, err
  329. }
  330. if shouldCreateSource{
  331. mqs, err := extensions.NewWithName(string(streamStmt.Name), streamStmt.Options["DATASOURCE"], streamStmt.Options["CONF_KEY"])
  332. if err != nil {
  333. return nil, nil, err
  334. }
  335. tp.AddSrc(mqs)
  336. preprocessorOp := xstream.Transform(pp, "preprocessor_"+s)
  337. tp.AddOperator([]xstream.Emitter{mqs}, preprocessorOp)
  338. inputs = append(inputs, preprocessorOp)
  339. }else{
  340. tp.AddSrc(sources[i])
  341. preprocessorOp := xstream.Transform(pp, "preprocessor_"+s)
  342. tp.AddOperator([]xstream.Emitter{sources[i]}, preprocessorOp)
  343. inputs = append(inputs, preprocessorOp)
  344. }
  345. }
  346. dimensions := selectStmt.Dimensions
  347. var w *xsql.Window
  348. if dimensions != nil {
  349. w = dimensions.GetWindow()
  350. if w != nil {
  351. wop, err := operators.NewWindowOp("window", w, isEventTime, lateTol, streamsFromStmt)
  352. if err != nil {
  353. return nil, nil, err
  354. }
  355. tp.AddOperator(inputs, wop)
  356. inputs = []xstream.Emitter{wop}
  357. }
  358. }
  359. if w != nil && selectStmt.Joins != nil {
  360. joinOp := xstream.Transform(&plans.JoinPlan{Joins: selectStmt.Joins, From: selectStmt.Sources[0].(*xsql.Table)}, "join")
  361. //TODO concurrency setting by command
  362. //joinOp.SetConcurrency(3)
  363. tp.AddOperator(inputs, joinOp)
  364. inputs = []xstream.Emitter{joinOp}
  365. }
  366. if selectStmt.Condition != nil {
  367. filterOp := xstream.Transform(&plans.FilterPlan{Condition: selectStmt.Condition}, "filter")
  368. //TODO concurrency setting by command
  369. // filterOp.SetConcurrency(3)
  370. tp.AddOperator(inputs, filterOp)
  371. inputs = []xstream.Emitter{filterOp}
  372. }
  373. var ds xsql.Dimensions
  374. if dimensions != nil {
  375. ds = dimensions.GetGroups()
  376. if ds != nil && len(ds) > 0 {
  377. aggregateOp := xstream.Transform(&plans.AggregatePlan{Dimensions: ds}, "aggregate")
  378. tp.AddOperator(inputs, aggregateOp)
  379. inputs = []xstream.Emitter{aggregateOp}
  380. }
  381. }
  382. if selectStmt.SortFields != nil {
  383. orderOp := xstream.Transform(&plans.OrderPlan{SortFields:selectStmt.SortFields}, "order")
  384. tp.AddOperator(inputs, orderOp)
  385. inputs = []xstream.Emitter{orderOp}
  386. }
  387. if selectStmt.Fields != nil {
  388. projectOp := xstream.Transform(&plans.ProjectPlan{Fields: selectStmt.Fields, IsAggregate: xsql.IsAggStatement(selectStmt)}, "project")
  389. tp.AddOperator(inputs, projectOp)
  390. inputs = []xstream.Emitter{projectOp}
  391. }
  392. return tp, inputs, nil
  393. }
  394. }
  395. }