xsql_processor.go 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523
  1. package processors
  2. import (
  3. "bytes"
  4. "encoding/json"
  5. "engine/common"
  6. "engine/common/plugin_manager"
  7. "engine/xsql"
  8. "engine/xsql/plans"
  9. "engine/xstream"
  10. "engine/xstream/api"
  11. "engine/xstream/extensions"
  12. "engine/xstream/nodes"
  13. "engine/xstream/operators"
  14. "engine/xstream/sinks"
  15. "fmt"
  16. "github.com/dgraph-io/badger"
  17. "github.com/go-yaml/yaml"
  18. "path"
  19. "strings"
  20. )
  21. var log = common.Log
  22. type StreamProcessor struct {
  23. statement string
  24. badgerDir string
  25. }
  26. //@params s : the sql string of create stream statement
  27. //@params d : the directory of the badger DB to save the stream info
  28. func NewStreamProcessor(s, d string) *StreamProcessor {
  29. processor := &StreamProcessor{
  30. statement: s,
  31. badgerDir: d,
  32. }
  33. return processor
  34. }
  35. func (p *StreamProcessor) Exec() (result []string, err error) {
  36. parser := xsql.NewParser(strings.NewReader(p.statement))
  37. stmt, err := xsql.Language.Parse(parser)
  38. if err != nil {
  39. return
  40. }
  41. db, err := common.DbOpen(p.badgerDir)
  42. if err != nil {
  43. return
  44. }
  45. defer common.DbClose(db)
  46. switch s := stmt.(type) {
  47. case *xsql.StreamStmt:
  48. var r string
  49. r, err = p.execCreateStream(s, db)
  50. result = append(result, r)
  51. case *xsql.ShowStreamsStatement:
  52. result, err = p.execShowStream(s, db)
  53. case *xsql.DescribeStreamStatement:
  54. var r string
  55. r, err = p.execDescribeStream(s, db)
  56. result = append(result, r)
  57. case *xsql.ExplainStreamStatement:
  58. var r string
  59. r, err = p.execExplainStream(s, db)
  60. result = append(result, r)
  61. case *xsql.DropStreamStatement:
  62. var r string
  63. r, err = p.execDropStream(s, db)
  64. result = append(result, r)
  65. }
  66. return
  67. }
  68. func (p *StreamProcessor) execCreateStream(stmt *xsql.StreamStmt, db *badger.DB) (string, error) {
  69. err := common.DbSet(db, string(stmt.Name), p.statement)
  70. if err != nil {
  71. return "", err
  72. }else{
  73. return fmt.Sprintf("Stream %s is created.", stmt.Name), nil
  74. }
  75. }
  76. func (p *StreamProcessor) execShowStream(stmt *xsql.ShowStreamsStatement, db *badger.DB) ([]string,error) {
  77. keys, err := common.DbKeys(db)
  78. if len(keys) == 0 {
  79. keys = append(keys, "No stream definitions are found.")
  80. }
  81. return keys, err
  82. }
  83. func (p *StreamProcessor) execDescribeStream(stmt *xsql.DescribeStreamStatement, db *badger.DB) (string,error) {
  84. s, err := common.DbGet(db, string(stmt.Name))
  85. if err != nil {
  86. return "", fmt.Errorf("Stream %s is not found.", stmt.Name)
  87. }
  88. parser := xsql.NewParser(strings.NewReader(s))
  89. stream, err := xsql.Language.Parse(parser)
  90. streamStmt, ok := stream.(*xsql.StreamStmt)
  91. if !ok{
  92. return "", fmt.Errorf("Error resolving the stream %s, the data in db may be corrupted.", stmt.Name)
  93. }
  94. var buff bytes.Buffer
  95. buff.WriteString("Fields\n--------------------------------------------------------------------------------\n")
  96. for _, f := range streamStmt.StreamFields {
  97. buff.WriteString(f.Name + "\t")
  98. xsql.PrintFieldType(f.FieldType, &buff)
  99. buff.WriteString("\n")
  100. }
  101. buff.WriteString("\n")
  102. common.PrintMap(streamStmt.Options, &buff)
  103. return buff.String(), err
  104. }
  105. func (p *StreamProcessor) execExplainStream(stmt *xsql.ExplainStreamStatement, db *badger.DB) (string,error) {
  106. _, err := common.DbGet(db, string(stmt.Name))
  107. if err != nil{
  108. return "", fmt.Errorf("Stream %s is not found.", stmt.Name)
  109. }
  110. return "TO BE SUPPORTED", nil
  111. }
  112. func (p *StreamProcessor) execDropStream(stmt *xsql.DropStreamStatement, db *badger.DB) (string, error) {
  113. err := common.DbDelete(db, string(stmt.Name))
  114. if err != nil {
  115. return "", err
  116. }else{
  117. return fmt.Sprintf("Stream %s is dropped.", stmt.Name), nil
  118. }
  119. }
  120. func GetStream(db *badger.DB, name string) (stmt *xsql.StreamStmt, err error){
  121. s, err := common.DbGet(db, name)
  122. if err != nil {
  123. return
  124. }
  125. parser := xsql.NewParser(strings.NewReader(s))
  126. stream, err := xsql.Language.Parse(parser)
  127. stmt, ok := stream.(*xsql.StreamStmt)
  128. if !ok{
  129. err = fmt.Errorf("Error resolving the stream %s, the data in db may be corrupted.", name)
  130. }
  131. return
  132. }
  133. type RuleProcessor struct {
  134. badgerDir string
  135. }
  136. func NewRuleProcessor(d string) *RuleProcessor {
  137. processor := &RuleProcessor{
  138. badgerDir: d,
  139. }
  140. return processor
  141. }
  142. func (p *RuleProcessor) ExecCreate(name, ruleJson string) (*api.Rule, error) {
  143. rule, err := p.getRuleByJson(name, ruleJson)
  144. if err != nil {
  145. return nil, err
  146. }
  147. db, err := common.DbOpen(path.Join(p.badgerDir, "rule"))
  148. if err != nil {
  149. return nil, err
  150. }
  151. err = common.DbSet(db, string(name), ruleJson)
  152. if err != nil {
  153. common.DbClose(db)
  154. return nil, err
  155. }else{
  156. log.Infof("Rule %s is created.", name)
  157. common.DbClose(db)
  158. }
  159. return rule, nil
  160. }
  161. func (p *RuleProcessor) GetRuleByName(name string) (*api.Rule, error) {
  162. db, err := common.DbOpen(path.Join(p.badgerDir, "rule"))
  163. if err != nil {
  164. return nil, err
  165. }
  166. defer common.DbClose(db)
  167. s, err := common.DbGet(db, string(name))
  168. if err != nil {
  169. return nil, fmt.Errorf("Rule %s is not found.", name)
  170. }
  171. return p.getRuleByJson(name, s)
  172. }
  173. func (p *RuleProcessor) getRuleByJson(name, ruleJson string) (*api.Rule, error) {
  174. var rule api.Rule
  175. if err := json.Unmarshal([]byte(ruleJson), &rule); err != nil {
  176. return nil, fmt.Errorf("Parse rule %s error : %s.", ruleJson, err)
  177. }
  178. rule.Id = name
  179. //validation
  180. if name == ""{
  181. return nil, fmt.Errorf("Missing rule id.")
  182. }
  183. if rule.Sql == ""{
  184. return nil, fmt.Errorf("Missing rule SQL.")
  185. }
  186. if rule.Actions == nil || len(rule.Actions) == 0{
  187. return nil, fmt.Errorf("Missing rule actions.")
  188. }
  189. return &rule, nil
  190. }
  191. func (p *RuleProcessor) ExecInitRule(rule *api.Rule) (*xstream.TopologyNew, error) {
  192. if tp, inputs, err := p.createTopo(rule); err != nil {
  193. return nil, err
  194. }else{
  195. for _, m := range rule.Actions {
  196. for name, action := range m {
  197. props, ok := action.(map[string]interface{})
  198. if !ok {
  199. return nil, fmt.Errorf("expect map[string]interface{} type for the action properties, but found %v", action)
  200. }
  201. if s, err := getSink(name, props); err != nil{
  202. return nil, err
  203. }else{
  204. tp.AddSink(inputs, nodes.NewSinkNode("sink_" + name, s))
  205. }
  206. }
  207. }
  208. return tp, nil
  209. }
  210. }
  211. func (p *RuleProcessor) ExecQuery(ruleid, sql string) (*xstream.TopologyNew, error) {
  212. if tp, inputs, err := p.createTopo(&api.Rule{Id: ruleid, Sql: sql}); err != nil {
  213. return nil, err
  214. } else {
  215. tp.AddSink(inputs, nodes.NewSinkNode("sink_memory_log", sinks.NewLogSinkToMemory()))
  216. go func() {
  217. select {
  218. case err := <-tp.Open():
  219. log.Println(err)
  220. tp.Cancel()
  221. }
  222. }()
  223. return tp, nil
  224. }
  225. }
  226. func (p *RuleProcessor) ExecDesc(name string) (string, error) {
  227. db, err := common.DbOpen(path.Join(p.badgerDir, "rule"))
  228. if err != nil {
  229. return "", err
  230. }
  231. defer common.DbClose(db)
  232. s, err := common.DbGet(db, string(name))
  233. if err != nil {
  234. return "", fmt.Errorf("Rule %s is not found.", name)
  235. }
  236. dst := &bytes.Buffer{}
  237. if err := json.Indent(dst, []byte(s), "", " "); err != nil {
  238. return "", err
  239. }
  240. return fmt.Sprintln(dst.String()), nil
  241. }
  242. func (p *RuleProcessor) ExecShow() (string, error) {
  243. keys, err := p.GetAllRules()
  244. if err != nil{
  245. return "", err
  246. }
  247. if len(keys) == 0 {
  248. keys = append(keys, "No rule definitions are found.")
  249. }
  250. var result string
  251. for _, c := range keys{
  252. result = result + fmt.Sprintln(c)
  253. }
  254. return result, nil
  255. }
  256. func (p *RuleProcessor) GetAllRules() ([]string, error) {
  257. db, err := common.DbOpen(path.Join(p.badgerDir, "rule"))
  258. if err != nil {
  259. return nil, err
  260. }
  261. defer common.DbClose(db)
  262. return common.DbKeys(db)
  263. }
  264. func (p *RuleProcessor) ExecDrop(name string) (string, error) {
  265. db, err := common.DbOpen(path.Join(p.badgerDir, "rule"))
  266. if err != nil {
  267. return "", err
  268. }
  269. defer common.DbClose(db)
  270. err = common.DbDelete(db, string(name))
  271. if err != nil {
  272. return "", err
  273. }else{
  274. return fmt.Sprintf("Rule %s is dropped.", name), nil
  275. }
  276. }
  277. func (p *RuleProcessor) createTopo(rule *api.Rule) (*xstream.TopologyNew, []api.Emitter, error) {
  278. return p.createTopoWithSources(rule, nil)
  279. }
  280. //For test to mock source
  281. func (p *RuleProcessor) createTopoWithSources(rule *api.Rule, sources []*nodes.SourceNode) (*xstream.TopologyNew, []api.Emitter, error){
  282. name := rule.Id
  283. sql := rule.Sql
  284. var isEventTime bool
  285. var lateTol int64
  286. if iet, ok := rule.Options["isEventTime"]; ok{
  287. isEventTime, ok = iet.(bool)
  288. if !ok{
  289. return nil, nil, fmt.Errorf("Invalid rule option isEventTime %v, bool type is required.", iet)
  290. }
  291. }
  292. if isEventTime {
  293. if l, ok := rule.Options["lateTolerance"]; ok{
  294. if fl, ok := l.(float64); ok{
  295. lateTol = int64(fl)
  296. }else{
  297. return nil, nil, fmt.Errorf("Invalid rule option lateTolerance %v, int type is required.", l)
  298. }
  299. }
  300. }
  301. shouldCreateSource := sources == nil
  302. parser := xsql.NewParser(strings.NewReader(sql))
  303. if stmt, err := xsql.Language.Parse(parser); err != nil{
  304. return nil, nil, fmt.Errorf("Parse SQL %s error: %s.", sql , err)
  305. }else {
  306. if selectStmt, ok := stmt.(*xsql.SelectStatement); !ok {
  307. return nil, nil, fmt.Errorf("SQL %s is not a select statement.", sql)
  308. } else {
  309. tp := xstream.NewWithName(name)
  310. var inputs []api.Emitter
  311. streamsFromStmt := xsql.GetStreams(selectStmt)
  312. if !shouldCreateSource && len(streamsFromStmt) != len(sources){
  313. return nil, nil, fmt.Errorf("Invalid parameter sources or streams, the length cannot match the statement, expect %d sources.", len(streamsFromStmt))
  314. }
  315. db, err := common.DbOpen(path.Join(p.badgerDir, "stream"))
  316. if err != nil {
  317. return nil, nil, err
  318. }
  319. defer common.DbClose(db)
  320. for i, s := range streamsFromStmt {
  321. streamStmt, err := GetStream(db, s)
  322. if err != nil {
  323. return nil, nil, fmt.Errorf("fail to get stream %s, please check if stream is created", s)
  324. }
  325. pp, err := plans.NewPreprocessor(streamStmt, selectStmt.Fields, isEventTime)
  326. if err != nil{
  327. return nil, nil, err
  328. }
  329. if shouldCreateSource{
  330. src, err := getSource(streamStmt)
  331. if err != nil {
  332. return nil, nil, fmt.Errorf("fail to get source: %v", err)
  333. }
  334. node := nodes.NewSourceNode(s, src)
  335. tp.AddSrc(node)
  336. preprocessorOp := xstream.Transform(pp, "preprocessor_"+s)
  337. tp.AddOperator([]api.Emitter{node}, preprocessorOp)
  338. inputs = append(inputs, preprocessorOp)
  339. } else {
  340. tp.AddSrc(sources[i])
  341. preprocessorOp := xstream.Transform(pp, "preprocessor_"+s)
  342. tp.AddOperator([]api.Emitter{sources[i]}, preprocessorOp)
  343. inputs = append(inputs, preprocessorOp)
  344. }
  345. }
  346. dimensions := selectStmt.Dimensions
  347. var w *xsql.Window
  348. if dimensions != nil {
  349. w = dimensions.GetWindow()
  350. if w != nil {
  351. wop, err := operators.NewWindowOp("window", w, isEventTime, lateTol, streamsFromStmt)
  352. if err != nil {
  353. return nil, nil, err
  354. }
  355. tp.AddOperator(inputs, wop)
  356. inputs = []api.Emitter{wop}
  357. }
  358. }
  359. if w != nil && selectStmt.Joins != nil {
  360. joinOp := xstream.Transform(&plans.JoinPlan{Joins: selectStmt.Joins, From: selectStmt.Sources[0].(*xsql.Table)}, "join")
  361. //TODO concurrency setting by command
  362. //joinOp.SetConcurrency(3)
  363. tp.AddOperator(inputs, joinOp)
  364. inputs = []api.Emitter{joinOp}
  365. }
  366. if selectStmt.Condition != nil {
  367. filterOp := xstream.Transform(&plans.FilterPlan{Condition: selectStmt.Condition}, "filter")
  368. //TODO concurrency setting by command
  369. // filterOp.SetConcurrency(3)
  370. tp.AddOperator(inputs, filterOp)
  371. inputs = []api.Emitter{filterOp}
  372. }
  373. var ds xsql.Dimensions
  374. if dimensions != nil {
  375. ds = dimensions.GetGroups()
  376. if ds != nil && len(ds) > 0 {
  377. aggregateOp := xstream.Transform(&plans.AggregatePlan{Dimensions: ds}, "aggregate")
  378. tp.AddOperator(inputs, aggregateOp)
  379. inputs = []api.Emitter{aggregateOp}
  380. }
  381. }
  382. if selectStmt.Having != nil {
  383. havingOp := xstream.Transform(&plans.HavingPlan{selectStmt.Having}, "having")
  384. tp.AddOperator(inputs, havingOp)
  385. inputs = []api.Emitter{havingOp}
  386. }
  387. if selectStmt.SortFields != nil {
  388. orderOp := xstream.Transform(&plans.OrderPlan{SortFields: selectStmt.SortFields}, "order")
  389. tp.AddOperator(inputs, orderOp)
  390. inputs = []api.Emitter{orderOp}
  391. }
  392. if selectStmt.Fields != nil {
  393. projectOp := xstream.Transform(&plans.ProjectPlan{Fields: selectStmt.Fields, IsAggregate: xsql.IsAggStatement(selectStmt)}, "project")
  394. tp.AddOperator(inputs, projectOp)
  395. inputs = []api.Emitter{projectOp}
  396. }
  397. return tp, inputs, nil
  398. }
  399. }
  400. }
  401. func getSource(streamStmt *xsql.StreamStmt) (api.Source, error) {
  402. t, ok := streamStmt.Options["TYPE"]
  403. if !ok{
  404. t = "mqtt"
  405. }
  406. var s api.Source
  407. switch t {
  408. case "mqtt":
  409. s = &extensions.MQTTSource{}
  410. log.Debugf("Source mqtt created")
  411. default:
  412. nf, err := plugin_manager.GetPlugin(t, "sources")
  413. if err != nil {
  414. return nil, err
  415. }
  416. s, ok = nf.(api.Source)
  417. if !ok {
  418. return nil, fmt.Errorf("exported symbol %s is not type of api.Source", t)
  419. }
  420. }
  421. props := getConf(t, streamStmt.Options["CONF_KEY"])
  422. err := s.Configure(streamStmt.Options["DATASOURCE"], props)
  423. if err != nil{
  424. return nil, err
  425. }
  426. log.Debugf("Source %s created", t)
  427. return s, nil
  428. }
  429. func getConf(t string, confkey string) map[string]interface{} {
  430. conf, err := common.LoadConf("sources/" + t + ".yaml")
  431. props := make(map[string]interface{})
  432. if err == nil {
  433. cfg := make(map[string]map[string]interface{})
  434. if err := yaml.Unmarshal(conf, &cfg); err != nil {
  435. log.Warnf("fail to parse yaml for source %s. Return an empty configuration", t)
  436. } else {
  437. var ok bool
  438. props, ok = cfg["default"]
  439. if !ok {
  440. log.Warnf("default conf is not found", confkey)
  441. }
  442. if c, ok := cfg[confkey]; ok {
  443. for k, v := range c {
  444. props[k] = v
  445. }
  446. }
  447. }
  448. } else {
  449. log.Warnf("config file %s.yaml is not loaded properly. Return an empty configuration", t)
  450. }
  451. log.Debugf("get conf for %s with conf key %s: %v", t, confkey, props)
  452. return props
  453. }
  454. func getSink(name string, action map[string]interface{}) (api.Sink, error) {
  455. log.Tracef("trying to get sink %s with action %v", name, action)
  456. var s api.Sink
  457. switch name {
  458. case "log":
  459. s = sinks.NewLogSink()
  460. case "mqtt":
  461. s = &sinks.MQTTSink{}
  462. default:
  463. nf, err := plugin_manager.GetPlugin(name, "sinks")
  464. if err != nil {
  465. return nil, err
  466. }
  467. var ok bool
  468. s, ok = nf.(api.Sink)
  469. if !ok {
  470. return nil, fmt.Errorf("exported symbol %s is not type of api.Sink", name)
  471. }
  472. }
  473. err := s.Configure(action)
  474. if err != nil{
  475. return nil, err
  476. }
  477. log.Debugf("Sink %s created", name)
  478. return s, nil
  479. }