parser.go 31 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260
  1. package xsql
  2. import (
  3. "fmt"
  4. "github.com/emqx/kuiper/common"
  5. "github.com/golang-collections/collections/stack"
  6. "io"
  7. "math"
  8. "reflect"
  9. "strconv"
  10. "strings"
  11. )
  12. type Parser struct {
  13. s *Scanner
  14. i int // buffer index
  15. n int // buffer char count
  16. buf [3]struct {
  17. tok Token
  18. lit string
  19. }
  20. inmeta bool
  21. }
  22. func (p *Parser) parseCondition() (Expr, error) {
  23. if tok, _ := p.scanIgnoreWhitespace(); tok != WHERE {
  24. p.unscan()
  25. return nil, nil
  26. }
  27. expr, err := p.ParseExpr()
  28. if err != nil {
  29. return nil, err
  30. }
  31. return expr, nil
  32. }
  33. func (p *Parser) scan() (tok Token, lit string) {
  34. if p.n > 0 {
  35. p.n--
  36. return p.curr()
  37. }
  38. tok, lit = p.s.Scan()
  39. if tok != WS && tok != COMMENT {
  40. p.i = (p.i + 1) % len(p.buf)
  41. buf := &p.buf[p.i]
  42. buf.tok, buf.lit = tok, lit
  43. }
  44. return
  45. }
  46. func (p *Parser) curr() (Token, string) {
  47. i := (p.i - p.n + len(p.buf)) % len(p.buf)
  48. buf := &p.buf[i]
  49. return buf.tok, buf.lit
  50. }
  51. func (p *Parser) scanIgnoreWhitespace() (tok Token, lit string) {
  52. tok, lit = p.scan()
  53. for {
  54. if tok == WS || tok == COMMENT {
  55. tok, lit = p.scan()
  56. } else {
  57. break
  58. }
  59. }
  60. return tok, lit
  61. }
  62. func (p *Parser) unscan() { p.n++ }
  63. func NewParser(r io.Reader) *Parser {
  64. return &Parser{s: NewScanner(r)}
  65. }
  66. func (p *Parser) ParseQueries() (SelectStatements, error) {
  67. var stmts SelectStatements
  68. if stmt, err := p.Parse(); err != nil {
  69. return nil, err
  70. } else {
  71. stmts = append(stmts, *stmt)
  72. }
  73. for {
  74. if tok, _ := p.scanIgnoreWhitespace(); tok == SEMICOLON {
  75. if stmt, err := p.Parse(); err != nil {
  76. return nil, err
  77. } else {
  78. if stmt != nil {
  79. stmts = append(stmts, *stmt)
  80. }
  81. }
  82. } else if tok == EOF {
  83. break
  84. }
  85. }
  86. return stmts, nil
  87. }
  88. func (p *Parser) Parse() (*SelectStatement, error) {
  89. selects := &SelectStatement{}
  90. if tok, lit := p.scanIgnoreWhitespace(); tok == EOF {
  91. return nil, nil
  92. } else if tok != SELECT {
  93. return nil, fmt.Errorf("Found %q, Expected SELECT.\n", lit)
  94. }
  95. if fields, err := p.parseFields(); err != nil {
  96. return nil, err
  97. } else {
  98. selects.Fields = fields
  99. }
  100. if src, err := p.parseSource(); err != nil {
  101. return nil, err
  102. } else {
  103. selects.Sources = src
  104. }
  105. if joins, err := p.parseJoins(); err != nil {
  106. return nil, err
  107. } else {
  108. selects.Joins = joins
  109. }
  110. if exp, err := p.parseCondition(); err != nil {
  111. return nil, err
  112. } else {
  113. if exp != nil {
  114. selects.Condition = exp
  115. }
  116. }
  117. if dims, err := p.parseDimensions(); err != nil {
  118. return nil, err
  119. } else {
  120. selects.Dimensions = dims
  121. }
  122. if having, err := p.parseHaving(); err != nil {
  123. return nil, err
  124. } else {
  125. selects.Having = having
  126. }
  127. if sorts, err := p.parseSorts(); err != nil {
  128. return nil, err
  129. } else {
  130. selects.SortFields = sorts
  131. }
  132. if tok, lit := p.scanIgnoreWhitespace(); tok == SEMICOLON {
  133. p.unscan()
  134. return selects, nil
  135. } else if tok != EOF {
  136. return nil, fmt.Errorf("found %q, expected EOF.", lit)
  137. }
  138. if err := Validate(selects); err != nil {
  139. return nil, err
  140. }
  141. return selects, nil
  142. }
  143. func (p *Parser) parseSource() (Sources, error) {
  144. var sources Sources
  145. if tok, lit := p.scanIgnoreWhitespace(); tok != FROM {
  146. return nil, fmt.Errorf("found %q, expected FROM.", lit)
  147. }
  148. if src, alias, err := p.parseSourceLiteral(); err != nil {
  149. return nil, err
  150. } else {
  151. sources = append(sources, &Table{Name: src, Alias: alias})
  152. }
  153. return sources, nil
  154. }
  155. //TODO Current func has problems when the source includes white space.
  156. func (p *Parser) parseSourceLiteral() (string, string, error) {
  157. var sourceSeg []string
  158. var alias string
  159. for {
  160. //HASH, DIV & ADD token is specially support for MQTT topic name patterns.
  161. if tok, lit := p.scanIgnoreWhitespace(); tok.allowedSourceToken() {
  162. sourceSeg = append(sourceSeg, lit)
  163. if tok1, lit1 := p.scanIgnoreWhitespace(); tok1 == AS {
  164. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == IDENT {
  165. alias = lit2
  166. } else {
  167. return "", "", fmt.Errorf("found %q, expected JOIN key word.", lit)
  168. }
  169. } else if tok1.allowedSourceToken() {
  170. sourceSeg = append(sourceSeg, lit1)
  171. } else {
  172. p.unscan()
  173. break
  174. }
  175. } else {
  176. p.unscan()
  177. break
  178. }
  179. }
  180. return strings.Join(sourceSeg, ""), alias, nil
  181. }
  182. func (p *Parser) parseFieldNameSections() ([]string, error) {
  183. var fieldNameSects []string
  184. for {
  185. if tok, lit := p.scanIgnoreWhitespace(); tok == IDENT || tok == ASTERISK {
  186. fieldNameSects = append(fieldNameSects, lit)
  187. if tok1, _ := p.scanIgnoreWhitespace(); !tok1.allowedSFNToken() {
  188. p.unscan()
  189. break
  190. }
  191. } else {
  192. p.unscan()
  193. break
  194. }
  195. }
  196. if len(fieldNameSects) == 0 {
  197. return nil, fmt.Errorf("Cannot find any field name.\n")
  198. } else if len(fieldNameSects) > 2 {
  199. return nil, fmt.Errorf("Too many field names. Please use -> to reference keys in struct.\n")
  200. }
  201. return fieldNameSects, nil
  202. }
  203. func (p *Parser) parseJoins() (Joins, error) {
  204. var joins Joins
  205. for {
  206. if tok, lit := p.scanIgnoreWhitespace(); tok == INNER || tok == LEFT || tok == RIGHT || tok == FULL || tok == CROSS {
  207. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == JOIN {
  208. var jt = INNER_JOIN
  209. switch tok {
  210. case INNER:
  211. jt = INNER_JOIN
  212. case LEFT:
  213. jt = LEFT_JOIN
  214. case RIGHT:
  215. jt = RIGHT_JOIN
  216. case FULL:
  217. jt = FULL_JOIN
  218. case CROSS:
  219. jt = CROSS_JOIN
  220. }
  221. if j, err := p.ParseJoin(jt); err != nil {
  222. return nil, err
  223. } else {
  224. joins = append(joins, *j)
  225. }
  226. } else {
  227. return nil, fmt.Errorf("found %q, expected JOIN key word.", lit)
  228. }
  229. } else {
  230. p.unscan()
  231. if len(joins) > 0 {
  232. return joins, nil
  233. }
  234. return nil, nil
  235. }
  236. }
  237. return joins, nil
  238. }
  239. func (p *Parser) ParseJoin(joinType JoinType) (*Join, error) {
  240. var j = &Join{JoinType: joinType}
  241. if src, alias, err := p.parseSourceLiteral(); err != nil {
  242. return nil, err
  243. } else {
  244. j.Name = src
  245. j.Alias = alias
  246. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == ON {
  247. if CROSS_JOIN == joinType {
  248. return nil, fmt.Errorf("On expression is not required for cross join type.\n")
  249. }
  250. if exp, err := p.ParseExpr(); err != nil {
  251. return nil, err
  252. } else {
  253. j.Expr = exp
  254. }
  255. } else {
  256. p.unscan()
  257. }
  258. }
  259. return j, nil
  260. }
  261. func (p *Parser) parseDimensions() (Dimensions, error) {
  262. var ds Dimensions
  263. if t, _ := p.scanIgnoreWhitespace(); t == GROUP {
  264. if t1, l1 := p.scanIgnoreWhitespace(); t1 == BY {
  265. for {
  266. if exp, err := p.ParseExpr(); err != nil {
  267. return nil, err
  268. } else {
  269. d := Dimension{Expr: exp}
  270. ds = append(ds, d)
  271. }
  272. if tok, _ := p.scanIgnoreWhitespace(); tok == COMMA {
  273. continue
  274. } else {
  275. p.unscan()
  276. break
  277. }
  278. }
  279. } else {
  280. return nil, fmt.Errorf("found %q, expected BY statement.", l1)
  281. }
  282. } else {
  283. p.unscan()
  284. }
  285. return ds, nil
  286. }
  287. func (p *Parser) parseHaving() (Expr, error) {
  288. if tok, _ := p.scanIgnoreWhitespace(); tok != HAVING {
  289. p.unscan()
  290. return nil, nil
  291. }
  292. expr, err := p.ParseExpr()
  293. if err != nil {
  294. return nil, err
  295. }
  296. return expr, nil
  297. }
  298. func (p *Parser) parseSorts() (SortFields, error) {
  299. var ss SortFields
  300. if t, _ := p.scanIgnoreWhitespace(); t == ORDER {
  301. if t1, l1 := p.scanIgnoreWhitespace(); t1 == BY {
  302. for {
  303. if t1, l1 = p.scanIgnoreWhitespace(); t1 == IDENT {
  304. s := SortField{Ascending: true}
  305. p.unscan()
  306. if name, err := p.parseFieldNameSections(); err == nil {
  307. s.Name = strings.Join(name, tokens[COLSEP])
  308. } else {
  309. return nil, err
  310. }
  311. if t2, _ := p.scanIgnoreWhitespace(); t2 == DESC {
  312. s.Ascending = false
  313. ss = append(ss, s)
  314. } else if t2 == ASC {
  315. ss = append(ss, s)
  316. } else {
  317. ss = append(ss, s)
  318. p.unscan()
  319. continue
  320. }
  321. } else if t1 == COMMA {
  322. continue
  323. } else {
  324. p.unscan()
  325. break
  326. }
  327. }
  328. } else {
  329. return nil, fmt.Errorf("found %q, expected BY keyword.", l1)
  330. }
  331. } else {
  332. p.unscan()
  333. }
  334. return ss, nil
  335. }
  336. func (p *Parser) parseFields() (Fields, error) {
  337. var fields Fields
  338. tok, _ := p.scanIgnoreWhitespace()
  339. if tok == ASTERISK {
  340. fields = append(fields, Field{AName: "", Expr: &Wildcard{Token: tok}})
  341. return fields, nil
  342. }
  343. p.unscan()
  344. for {
  345. field, err := p.parseField()
  346. if err != nil {
  347. return nil, err
  348. } else {
  349. fields = append(fields, *field)
  350. }
  351. tok, _ = p.scanIgnoreWhitespace()
  352. if tok != COMMA {
  353. p.unscan()
  354. break
  355. }
  356. }
  357. return fields, nil
  358. }
  359. func (p *Parser) parseField() (*Field, error) {
  360. field := &Field{}
  361. if exp, err := p.ParseExpr(); err != nil {
  362. return nil, err
  363. } else {
  364. if e, ok := exp.(*FieldRef); ok {
  365. field.Name = e.Name
  366. } else if e, ok := exp.(*Call); ok {
  367. field.Name = e.Name
  368. }
  369. field.Expr = exp
  370. }
  371. if alias, err := p.parseAlias(); err != nil {
  372. return nil, err
  373. } else {
  374. if alias != "" {
  375. field.AName = alias
  376. }
  377. }
  378. return field, nil
  379. }
  380. func (p *Parser) parseAlias() (string, error) {
  381. tok, lit := p.scanIgnoreWhitespace()
  382. if tok == AS {
  383. if tok, lit = p.scanIgnoreWhitespace(); tok != IDENT {
  384. return "", fmt.Errorf("found %q, expected as alias.", lit)
  385. } else {
  386. return lit, nil
  387. }
  388. }
  389. p.unscan()
  390. return "", nil
  391. }
  392. func (p *Parser) ParseExpr() (Expr, error) {
  393. var err error
  394. root := &BinaryExpr{}
  395. root.RHS, err = p.parseUnaryExpr()
  396. if err != nil {
  397. return nil, err
  398. }
  399. for {
  400. op, _ := p.scanIgnoreWhitespace()
  401. if !op.isOperator() {
  402. p.unscan()
  403. return root.RHS, nil
  404. } else if op == ASTERISK { //Change the asterisk to Mul token.
  405. op = MUL
  406. } else if op == LBRACKET { //LBRACKET is a special token, need to unscan
  407. op = SUBSET
  408. p.unscan()
  409. }
  410. var rhs Expr
  411. if rhs, err = p.parseUnaryExpr(); err != nil {
  412. return nil, err
  413. }
  414. for node := root; ; {
  415. r, ok := node.RHS.(*BinaryExpr)
  416. if !ok || r.OP.Precedence() >= op.Precedence() {
  417. node.RHS = &BinaryExpr{LHS: node.RHS, RHS: rhs, OP: op}
  418. break
  419. }
  420. node = r
  421. }
  422. }
  423. return nil, nil
  424. }
  425. func (p *Parser) parseUnaryExpr() (Expr, error) {
  426. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == LPAREN {
  427. expr, err := p.ParseExpr()
  428. if err != nil {
  429. return nil, err
  430. }
  431. // Expect an RPAREN at the end.
  432. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 != RPAREN {
  433. return nil, fmt.Errorf("found %q, expected right paren.", lit2)
  434. }
  435. return &ParenExpr{Expr: expr}, nil
  436. } else if tok1 == LBRACKET {
  437. return p.parseBracketExpr()
  438. }
  439. p.unscan()
  440. tok, lit := p.scanIgnoreWhitespace()
  441. if tok == CASE {
  442. return p.parseCaseExpr()
  443. } else if tok == IDENT {
  444. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == LPAREN {
  445. return p.parseCall(lit)
  446. }
  447. p.unscan() //Back the Lparen token
  448. p.unscan() //Back the ident token
  449. if n, err := p.parseFieldNameSections(); err != nil {
  450. return nil, err
  451. } else {
  452. if p.inmeta {
  453. if len(n) == 2 {
  454. return &MetaRef{StreamName: StreamName(n[0]), Name: n[1]}, nil
  455. }
  456. return &MetaRef{StreamName: "", Name: n[0]}, nil
  457. } else {
  458. if len(n) == 2 {
  459. return &FieldRef{StreamName: StreamName(n[0]), Name: n[1]}, nil
  460. }
  461. return &FieldRef{StreamName: "", Name: n[0]}, nil
  462. }
  463. }
  464. } else if tok == STRING {
  465. return &StringLiteral{Val: lit}, nil
  466. } else if tok == INTEGER {
  467. val, _ := strconv.Atoi(lit)
  468. return &IntegerLiteral{Val: val}, nil
  469. } else if tok == NUMBER {
  470. if v, err := strconv.ParseFloat(lit, 64); err != nil {
  471. return nil, fmt.Errorf("found %q, invalid number value.", lit)
  472. } else {
  473. return &NumberLiteral{Val: v}, nil
  474. }
  475. } else if tok == TRUE || tok == FALSE {
  476. if v, err := strconv.ParseBool(lit); err != nil {
  477. return nil, fmt.Errorf("found %q, invalid boolean value.", lit)
  478. } else {
  479. return &BooleanLiteral{Val: v}, nil
  480. }
  481. } else if tok.isTimeLiteral() {
  482. return &TimeLiteral{Val: tok}, nil
  483. }
  484. return nil, fmt.Errorf("found %q, expected expression.", lit)
  485. }
  486. func (p *Parser) parseBracketExpr() (Expr, error) {
  487. tok2, lit2 := p.scanIgnoreWhitespace()
  488. if tok2 == RBRACKET {
  489. //field[]
  490. return &ColonExpr{Start: 0, End: math.MinInt32}, nil
  491. } else if tok2 == INTEGER {
  492. start, err := strconv.Atoi(lit2)
  493. if err != nil {
  494. return nil, fmt.Errorf("The start index %s is not an int value in bracket expression.", lit2)
  495. }
  496. if tok3, _ := p.scanIgnoreWhitespace(); tok3 == RBRACKET {
  497. //Such as field[2]
  498. return &IndexExpr{Index: start}, nil
  499. } else if tok3 == COLON {
  500. //Such as field[2:] or field[2:4]
  501. return p.parseColonExpr(start)
  502. }
  503. } else if tok2 == COLON {
  504. //Such as field[:3] or [:]
  505. return p.parseColonExpr(0)
  506. }
  507. return nil, fmt.Errorf("Unexpected token %q. when parsing bracket expressions.", lit2)
  508. }
  509. func (p *Parser) parseColonExpr(start int) (Expr, error) {
  510. tok, lit := p.scanIgnoreWhitespace()
  511. if tok == INTEGER {
  512. end, err := strconv.Atoi(lit)
  513. if err != nil {
  514. return nil, fmt.Errorf("The end index %s is not an int value in bracket expression.", lit)
  515. }
  516. if tok1, lit1 := p.scanIgnoreWhitespace(); tok1 == RBRACKET {
  517. return &ColonExpr{Start: start, End: end}, nil
  518. } else {
  519. return nil, fmt.Errorf("Found %q, expected right bracket.", lit1)
  520. }
  521. } else if tok == RBRACKET {
  522. return &ColonExpr{Start: start, End: math.MinInt32}, nil
  523. }
  524. return nil, fmt.Errorf("Found %q, expected right bracket.", lit)
  525. }
  526. func (p *Parser) parseAs(f *Field) (*Field, error) {
  527. tok, lit := p.scanIgnoreWhitespace()
  528. if tok != IDENT {
  529. return nil, fmt.Errorf("found %q, expected as alias.", lit)
  530. }
  531. f.AName = lit
  532. return f, nil
  533. }
  534. func (p *Parser) parseCall(name string) (Expr, error) {
  535. if strings.ToLower(name) == "meta" || strings.ToLower(name) == "mqtt" {
  536. p.inmeta = true
  537. defer func() {
  538. p.inmeta = false
  539. }()
  540. }
  541. var args []Expr
  542. for {
  543. if tok, _ := p.scanIgnoreWhitespace(); tok == RPAREN {
  544. if valErr := validateFuncs(name, nil); valErr != nil {
  545. return nil, valErr
  546. }
  547. return &Call{Name: name, Args: args}, nil
  548. } else if tok == ASTERISK {
  549. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 != RPAREN {
  550. return nil, fmt.Errorf("found %q, expected right paren.", lit2)
  551. } else {
  552. if p.inmeta {
  553. args = append(args, &MetaRef{StreamName: "", Name: "*"})
  554. } else {
  555. args = append(args, &Wildcard{Token: ASTERISK})
  556. }
  557. return &Call{Name: name, Args: args}, nil
  558. }
  559. } else {
  560. p.unscan()
  561. }
  562. if exp, err := p.ParseExpr(); err != nil {
  563. return nil, err
  564. } else {
  565. args = append(args, exp)
  566. }
  567. if tok, _ := p.scanIgnoreWhitespace(); tok != COMMA {
  568. p.unscan()
  569. break
  570. }
  571. }
  572. if tok, lit := p.scanIgnoreWhitespace(); tok != RPAREN {
  573. return nil, fmt.Errorf("found function call %q, expected ), but with %q.", name, lit)
  574. }
  575. if wt, error := validateWindows(name, args); wt == NOT_WINDOW {
  576. if valErr := validateFuncs(name, args); valErr != nil {
  577. return nil, valErr
  578. }
  579. // Add context for some aggregate func
  580. if name == "deduplicate" {
  581. args = append([]Expr{&Wildcard{Token: ASTERISK}}, args...)
  582. }
  583. return &Call{Name: name, Args: args}, nil
  584. } else {
  585. if error != nil {
  586. return nil, error
  587. }
  588. win, err := p.ConvertToWindows(wt, args)
  589. if err != nil {
  590. return nil, error
  591. }
  592. // parse filter clause
  593. f, err := p.parseFilter()
  594. if err != nil {
  595. return nil, err
  596. } else if f != nil {
  597. win.Filter = f
  598. }
  599. return win, nil
  600. }
  601. }
  602. func (p *Parser) parseCaseExpr() (*CaseExpr, error) {
  603. c := &CaseExpr{}
  604. tok, _ := p.scanIgnoreWhitespace()
  605. p.unscan()
  606. if tok != WHEN { // no condition value for case, additional validation needed
  607. if exp, err := p.ParseExpr(); err != nil {
  608. return nil, err
  609. } else {
  610. c.Value = exp
  611. }
  612. }
  613. loop:
  614. for {
  615. tok, _ := p.scanIgnoreWhitespace()
  616. switch tok {
  617. case WHEN:
  618. if exp, err := p.ParseExpr(); err != nil {
  619. return nil, err
  620. } else {
  621. if c.WhenClauses == nil {
  622. c.WhenClauses = make([]*WhenClause, 0)
  623. }
  624. if c.Value == nil && !isBooleanArg(exp) {
  625. return nil, fmt.Errorf("invalid CASE expression, WHEN expression must be a bool condition")
  626. }
  627. w := &WhenClause{
  628. Expr: exp,
  629. }
  630. tokThen, _ := p.scanIgnoreWhitespace()
  631. if tokThen != THEN {
  632. return nil, fmt.Errorf("invalid CASE expression, THEN expected after WHEN")
  633. } else {
  634. if expThen, err := p.ParseExpr(); err != nil {
  635. return nil, err
  636. } else {
  637. w.Result = expThen
  638. c.WhenClauses = append(c.WhenClauses, w)
  639. }
  640. }
  641. }
  642. case ELSE:
  643. if c.WhenClauses != nil {
  644. if exp, err := p.ParseExpr(); err != nil {
  645. return nil, err
  646. } else {
  647. c.ElseClause = exp
  648. }
  649. } else {
  650. return nil, fmt.Errorf("invalid CASE expression, WHEN expected before ELSE")
  651. }
  652. case END:
  653. if c.WhenClauses != nil {
  654. break loop
  655. } else {
  656. return nil, fmt.Errorf("invalid CASE expression, WHEN expected before END")
  657. }
  658. default:
  659. return nil, fmt.Errorf("invalid CASE expression, END expected")
  660. }
  661. }
  662. return c, nil
  663. }
  664. func validateWindows(name string, args []Expr) (WindowType, error) {
  665. fname := strings.ToLower(name)
  666. switch fname {
  667. case "tumblingwindow":
  668. if err := validateWindow(fname, 2, args); err != nil {
  669. return TUMBLING_WINDOW, err
  670. }
  671. return TUMBLING_WINDOW, nil
  672. case "hoppingwindow":
  673. if err := validateWindow(fname, 3, args); err != nil {
  674. return HOPPING_WINDOW, err
  675. }
  676. return HOPPING_WINDOW, nil
  677. case "sessionwindow":
  678. if err := validateWindow(fname, 3, args); err != nil {
  679. return SESSION_WINDOW, err
  680. }
  681. return SESSION_WINDOW, nil
  682. case "slidingwindow":
  683. if err := validateWindow(fname, 2, args); err != nil {
  684. return SLIDING_WINDOW, err
  685. }
  686. return SLIDING_WINDOW, nil
  687. case "countwindow":
  688. if len(args) == 1 {
  689. if para1, ok := args[0].(*IntegerLiteral); ok && para1.Val > 0 {
  690. return COUNT_WINDOW, nil
  691. } else {
  692. return COUNT_WINDOW, fmt.Errorf("Invalid parameter value %s.", args[0])
  693. }
  694. } else if len(args) == 2 {
  695. if para1, ok1 := args[0].(*IntegerLiteral); ok1 {
  696. if para2, ok2 := args[1].(*IntegerLiteral); ok2 {
  697. if para1.Val < para2.Val {
  698. return COUNT_WINDOW, fmt.Errorf("The second parameter value %d should be less than the first parameter %d.", para2.Val, para1.Val)
  699. } else {
  700. return COUNT_WINDOW, nil
  701. }
  702. }
  703. }
  704. return COUNT_WINDOW, fmt.Errorf("Invalid parameter value %s, %s.", args[0], args[1])
  705. } else {
  706. return COUNT_WINDOW, fmt.Errorf("Invalid parameter count.")
  707. }
  708. }
  709. return NOT_WINDOW, nil
  710. }
  711. func validateWindow(funcName string, expectLen int, args []Expr) error {
  712. if len(args) != expectLen {
  713. return fmt.Errorf("The arguments for %s should be %d.\n", funcName, expectLen)
  714. }
  715. if _, ok := args[0].(*TimeLiteral); !ok {
  716. return fmt.Errorf("The 1st argument for %s is expecting timer literal expression. One value of [dd|hh|mi|ss|ms].\n", funcName)
  717. }
  718. for i := 1; i < len(args); i++ {
  719. if _, ok := args[i].(*IntegerLiteral); !ok {
  720. return fmt.Errorf("The %d argument for %s is expecting interger literal expression. \n", i, funcName)
  721. }
  722. }
  723. return nil
  724. }
  725. func (p *Parser) ConvertToWindows(wtype WindowType, args []Expr) (*Window, error) {
  726. win := &Window{WindowType: wtype}
  727. if wtype == COUNT_WINDOW {
  728. win.Length = &IntegerLiteral{Val: args[0].(*IntegerLiteral).Val}
  729. if len(args) == 2 {
  730. win.Interval = &IntegerLiteral{Val: args[1].(*IntegerLiteral).Val}
  731. }
  732. return win, nil
  733. }
  734. var unit = 1
  735. v := args[0].(*TimeLiteral).Val
  736. switch v {
  737. case DD:
  738. unit = 24 * 3600 * 1000
  739. case HH:
  740. unit = 3600 * 1000
  741. case MI:
  742. unit = 60 * 1000
  743. case SS:
  744. unit = 1000
  745. case MS:
  746. unit = 1
  747. default:
  748. return nil, fmt.Errorf("Invalid timeliteral %s", v)
  749. }
  750. win.Length = &IntegerLiteral{Val: args[1].(*IntegerLiteral).Val * unit}
  751. if len(args) > 2 {
  752. win.Interval = &IntegerLiteral{Val: args[2].(*IntegerLiteral).Val * unit}
  753. } else {
  754. win.Interval = &IntegerLiteral{Val: 0}
  755. }
  756. return win, nil
  757. }
  758. func (p *Parser) ParseCreateStmt() (Statement, error) {
  759. if tok, _ := p.scanIgnoreWhitespace(); tok == CREATE {
  760. tok1, lit1 := p.scanIgnoreWhitespace()
  761. stmt := &StreamStmt{}
  762. switch tok1 {
  763. case STREAM:
  764. stmt.StreamType = TypeStream
  765. case TABLE:
  766. stmt.StreamType = TypeTable
  767. default:
  768. return nil, fmt.Errorf("found %q, expected keyword stream or table.", lit1)
  769. }
  770. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == IDENT {
  771. stmt.Name = StreamName(lit2)
  772. if fields, err := p.parseStreamFields(); err != nil {
  773. return nil, err
  774. } else {
  775. stmt.StreamFields = fields
  776. }
  777. if opts, err := p.parseStreamOptions(); err != nil {
  778. return nil, err
  779. } else {
  780. stmt.Options = opts
  781. }
  782. if tok3, lit3 := p.scanIgnoreWhitespace(); tok3 == SEMICOLON {
  783. p.unscan()
  784. } else if tok3 == EOF {
  785. //Finish parsing create stream statement. Jump to validate
  786. } else {
  787. return nil, fmt.Errorf("found %q, expected semicolon or EOF.", lit3)
  788. }
  789. } else {
  790. return nil, fmt.Errorf("found %q, expected stream name.", lit2)
  791. }
  792. if valErr := validateStream(stmt); valErr != nil {
  793. return nil, valErr
  794. }
  795. return stmt, nil
  796. } else {
  797. p.unscan()
  798. return nil, nil
  799. }
  800. }
  801. // TODO more accurate validation for table
  802. func validateStream(stmt *StreamStmt) error {
  803. f := stmt.Options.FORMAT
  804. if f == "" {
  805. f = common.FORMAT_JSON
  806. }
  807. switch strings.ToLower(f) {
  808. case common.FORMAT_JSON:
  809. //do nothing
  810. case common.FORMAT_BINARY:
  811. if stmt.StreamType == TypeTable {
  812. return fmt.Errorf("'binary' format is not supported for table")
  813. }
  814. switch len(stmt.StreamFields) {
  815. case 0:
  816. // do nothing for schemaless
  817. case 1:
  818. f := stmt.StreamFields[0]
  819. if bt, ok := f.FieldType.(*BasicType); ok {
  820. if bt.Type == BYTEA {
  821. break
  822. }
  823. }
  824. return fmt.Errorf("'binary' format stream can have only 'bytea' type field")
  825. default:
  826. return fmt.Errorf("'binary' format stream can have only one field")
  827. }
  828. default:
  829. return fmt.Errorf("option 'format=%s' is invalid", f)
  830. }
  831. return nil
  832. }
  833. func (p *Parser) parseShowStmt() (Statement, error) {
  834. if tok, _ := p.scanIgnoreWhitespace(); tok == SHOW {
  835. tok1, lit1 := p.scanIgnoreWhitespace()
  836. switch tok1 {
  837. case STREAMS:
  838. ss := &ShowStreamsStatement{}
  839. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == EOF || tok2 == SEMICOLON {
  840. return ss, nil
  841. } else {
  842. return nil, fmt.Errorf("found %q, expected semecolon or EOF.", lit2)
  843. }
  844. case TABLES:
  845. ss := &ShowTablesStatement{}
  846. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == EOF || tok2 == SEMICOLON {
  847. return ss, nil
  848. } else {
  849. return nil, fmt.Errorf("found %q, expected semecolon or EOF.", lit2)
  850. }
  851. default:
  852. return nil, fmt.Errorf("found %q, expected keyword streams or tables.", lit1)
  853. }
  854. } else {
  855. p.unscan()
  856. return nil, nil
  857. }
  858. }
  859. func (p *Parser) parseDescribeStmt() (Statement, error) {
  860. if tok, _ := p.scanIgnoreWhitespace(); tok == DESCRIBE {
  861. tok1, lit1 := p.scanIgnoreWhitespace()
  862. switch tok1 {
  863. case STREAM:
  864. dss := &DescribeStreamStatement{}
  865. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == IDENT {
  866. dss.Name = lit2
  867. return dss, nil
  868. } else {
  869. return nil, fmt.Errorf("found %q, expected stream name.", lit2)
  870. }
  871. case TABLE:
  872. dss := &DescribeTableStatement{}
  873. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == IDENT {
  874. dss.Name = lit2
  875. return dss, nil
  876. } else {
  877. return nil, fmt.Errorf("found %q, expected table name.", lit2)
  878. }
  879. default:
  880. return nil, fmt.Errorf("found %q, expected keyword stream or table.", lit1)
  881. }
  882. } else {
  883. p.unscan()
  884. return nil, nil
  885. }
  886. }
  887. func (p *Parser) parseExplainStmt() (Statement, error) {
  888. if tok, _ := p.scanIgnoreWhitespace(); tok == EXPLAIN {
  889. tok1, lit1 := p.scanIgnoreWhitespace()
  890. switch tok1 {
  891. case STREAM:
  892. ess := &ExplainStreamStatement{}
  893. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == IDENT {
  894. ess.Name = lit2
  895. return ess, nil
  896. } else {
  897. return nil, fmt.Errorf("found %q, expected stream name.", lit2)
  898. }
  899. case TABLE:
  900. ess := &ExplainTableStatement{}
  901. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == IDENT {
  902. ess.Name = lit2
  903. return ess, nil
  904. } else {
  905. return nil, fmt.Errorf("found %q, expected table name.", lit2)
  906. }
  907. default:
  908. return nil, fmt.Errorf("found %q, expected keyword stream or table.", lit1)
  909. }
  910. } else {
  911. p.unscan()
  912. return nil, nil
  913. }
  914. }
  915. func (p *Parser) parseDropStmt() (Statement, error) {
  916. if tok, _ := p.scanIgnoreWhitespace(); tok == DROP {
  917. tok1, lit1 := p.scanIgnoreWhitespace()
  918. switch tok1 {
  919. case STREAM:
  920. ess := &DropStreamStatement{}
  921. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == IDENT {
  922. ess.Name = lit2
  923. return ess, nil
  924. } else {
  925. return nil, fmt.Errorf("found %q, expected stream name.", lit2)
  926. }
  927. case TABLE:
  928. ess := &DropTableStatement{}
  929. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == IDENT {
  930. ess.Name = lit2
  931. return ess, nil
  932. } else {
  933. return nil, fmt.Errorf("found %q, expected table name.", lit2)
  934. }
  935. default:
  936. return nil, fmt.Errorf("found %q, expected keyword stream or table.", lit1)
  937. }
  938. } else {
  939. p.unscan()
  940. return nil, nil
  941. }
  942. }
  943. func (p *Parser) parseStreamFields() (StreamFields, error) {
  944. lStack := &stack.Stack{}
  945. var fields StreamFields
  946. if tok, lit := p.scanIgnoreWhitespace(); tok == LPAREN {
  947. lStack.Push(lit)
  948. for {
  949. //For the schemaless streams
  950. //create stream demo () WITH (FORMAT="JSON", DATASOURCE="demo" TYPE="edgex")
  951. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == RPAREN {
  952. lStack.Pop()
  953. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 != WITH {
  954. return nil, fmt.Errorf("found %q, expected is with.", lit2)
  955. }
  956. return fields, nil
  957. } else {
  958. p.unscan()
  959. }
  960. if f, err := p.parseStreamField(); err != nil {
  961. return nil, err
  962. } else {
  963. fields = append(fields, *f)
  964. }
  965. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == RPAREN {
  966. lStack.Pop()
  967. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == WITH {
  968. //Check the stack for LPAREN; If the stack for LPAREN is not zero, then it's not correct.
  969. if lStack.Len() > 0 {
  970. return nil, fmt.Errorf("Parenthesis is not matched.")
  971. }
  972. break
  973. } else if tok2 == COMMA {
  974. if lStack.Len() > 0 {
  975. return nil, fmt.Errorf("Parenthesis is in create record type not matched.")
  976. }
  977. p.unscan()
  978. break
  979. } else if tok2 == RPAREN { //The nested type definition of ARRAY and Struct, such as "field ARRAY(STRUCT(f BIGINT))"
  980. if lStack.Len() > 0 {
  981. return nil, fmt.Errorf("Parenthesis is not matched.")
  982. }
  983. p.unscan()
  984. break
  985. } else {
  986. if lStack.Len() == 0 {
  987. return nil, fmt.Errorf("found %q, expected is with.", lit2)
  988. }
  989. p.unscan()
  990. }
  991. } else {
  992. p.unscan()
  993. }
  994. }
  995. } else {
  996. return nil, fmt.Errorf("found %q, expected lparen after stream name.", lit)
  997. }
  998. return fields, nil
  999. }
  1000. func (p *Parser) parseStreamField() (*StreamField, error) {
  1001. field := &StreamField{}
  1002. if tok, lit := p.scanIgnoreWhitespace(); tok == IDENT {
  1003. field.Name = lit
  1004. tok1, lit1 := p.scanIgnoreWhitespace()
  1005. if t := getDataType(tok1); t != UNKNOWN && t.isSimpleType() {
  1006. field.FieldType = &BasicType{Type: t}
  1007. } else if t == ARRAY {
  1008. if f, e := p.parseStreamArrayType(); e != nil {
  1009. return nil, e
  1010. } else {
  1011. field.FieldType = f
  1012. }
  1013. } else if t == STRUCT {
  1014. if f, e := p.parseStreamStructType(); e != nil {
  1015. return nil, e
  1016. } else {
  1017. field.FieldType = f
  1018. }
  1019. } else if t == UNKNOWN {
  1020. return nil, fmt.Errorf("found %q, expect valid stream field types(BIGINT | FLOAT | STRINGS | DATETIME | BOOLEAN | BYTEA | ARRAY | STRUCT).", lit1)
  1021. }
  1022. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == COMMA {
  1023. //Just consume the comma.
  1024. } else if tok2 == RPAREN {
  1025. p.unscan()
  1026. } else {
  1027. return nil, fmt.Errorf("found %q, expect comma or rparen.", lit2)
  1028. }
  1029. } else {
  1030. return nil, fmt.Errorf("found %q, expect stream field name.", lit)
  1031. }
  1032. return field, nil
  1033. }
  1034. func (p *Parser) parseStreamArrayType() (FieldType, error) {
  1035. lStack := &stack.Stack{}
  1036. if tok, _ := p.scanIgnoreWhitespace(); tok == LPAREN {
  1037. lStack.Push(LPAREN)
  1038. tok1, lit1 := p.scanIgnoreWhitespace()
  1039. if t := getDataType(tok1); t != UNKNOWN && t.isSimpleType() {
  1040. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == RPAREN {
  1041. lStack.Pop()
  1042. if lStack.Len() > 0 {
  1043. return nil, fmt.Errorf("Parenthesis is in array type not matched.")
  1044. }
  1045. return &ArrayType{Type: t}, nil
  1046. } else {
  1047. return nil, fmt.Errorf("found %q, expect rparen in array type definition.", lit2)
  1048. }
  1049. } else if tok1 == XSTRUCT {
  1050. if f, err := p.parseStreamStructType(); err != nil {
  1051. return nil, err
  1052. } else {
  1053. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == RPAREN {
  1054. lStack.Pop()
  1055. if lStack.Len() > 0 {
  1056. return nil, fmt.Errorf("Parenthesis is in struct of array type %q not matched.", tok1)
  1057. }
  1058. return &ArrayType{Type: STRUCT, FieldType: f}, nil
  1059. } else {
  1060. return nil, fmt.Errorf("found %q, expect rparen in struct of array type definition.", lit2)
  1061. }
  1062. }
  1063. } else if tok1 == COMMA {
  1064. p.unscan()
  1065. } else {
  1066. return nil, fmt.Errorf("found %q, expect stream data types.", lit1)
  1067. }
  1068. } else {
  1069. }
  1070. return nil, nil
  1071. }
  1072. func (p *Parser) parseStreamStructType() (FieldType, error) {
  1073. rf := &RecType{}
  1074. if sfs, err := p.parseStreamFields(); err != nil {
  1075. return nil, err
  1076. } else {
  1077. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == COMMA {
  1078. rf.StreamFields = sfs
  1079. p.unscan()
  1080. } else if tok2 == RPAREN {
  1081. rf.StreamFields = sfs
  1082. p.unscan()
  1083. } else {
  1084. return nil, fmt.Errorf("found %q, expect comma in create stream record statement.", lit2)
  1085. }
  1086. }
  1087. return rf, nil
  1088. }
  1089. func (p *Parser) parseStreamOptions() (*Options, error) {
  1090. opts := &Options{}
  1091. v := reflect.ValueOf(opts)
  1092. lStack := &stack.Stack{}
  1093. if tok, lit := p.scanIgnoreWhitespace(); tok == LPAREN {
  1094. lStack.Push(LPAREN)
  1095. for {
  1096. if tok1, lit1 := p.scanIgnoreWhitespace(); tok1 == DATASOURCE || tok1 == FORMAT || tok1 == KEY || tok1 == CONF_KEY || tok1 == STRICT_VALIDATION || tok1 == TYPE || tok1 == TIMESTAMP || tok1 == TIMESTAMP_FORMAT || tok1 == RETAIN_SIZE {
  1097. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == EQ {
  1098. if tok3, lit3 := p.scanIgnoreWhitespace(); tok3 == STRING {
  1099. switch tok1 {
  1100. case STRICT_VALIDATION:
  1101. if val := strings.ToUpper(lit3); (val != "TRUE") && (val != "FALSE") {
  1102. return nil, fmt.Errorf("found %q, expect TRUE/FALSE value in %s option.", lit3, tok1)
  1103. } else {
  1104. opts.STRICT_VALIDATION = (val == "TRUE")
  1105. }
  1106. case RETAIN_SIZE:
  1107. if val, err := strconv.Atoi(lit3); err != nil {
  1108. return nil, fmt.Errorf("found %q, expect number value in %s option.", lit3, tok1)
  1109. } else {
  1110. opts.RETAIN_SIZE = val
  1111. }
  1112. default:
  1113. f := v.Elem().FieldByName(lit1)
  1114. if f.IsValid() {
  1115. f.SetString(lit3)
  1116. } else { // should not happen
  1117. return nil, fmt.Errorf("invalid field %s.", lit1)
  1118. }
  1119. }
  1120. } else {
  1121. return nil, fmt.Errorf("found %q, expect string value in option.", lit3)
  1122. }
  1123. } else {
  1124. return nil, fmt.Errorf("found %q, expect equals(=) in options.", lit2)
  1125. }
  1126. } else if tok1 == COMMA {
  1127. continue
  1128. } else if tok1 == RPAREN {
  1129. if lStack.Pop(); lStack.Len() == 0 {
  1130. break
  1131. } else {
  1132. return nil, fmt.Errorf("Parenthesis is not matched in options definition.")
  1133. }
  1134. } else {
  1135. return nil, fmt.Errorf("found %q, unknown option keys(DATASOURCE|FORMAT|KEY|CONF_KEY|STRICT_VALIDATION|TYPE|TIMESTAMP|TIMESTAMP_FORMAT|RETAIN_SIZE).", lit1)
  1136. }
  1137. }
  1138. } else {
  1139. return nil, fmt.Errorf("found %q, expect stream options.", lit)
  1140. }
  1141. return opts, nil
  1142. }
  1143. // Only support filter on window now
  1144. func (p *Parser) parseFilter() (Expr, error) {
  1145. if tok, _ := p.scanIgnoreWhitespace(); tok != FILTER {
  1146. p.unscan()
  1147. return nil, nil
  1148. }
  1149. if tok, lit := p.scanIgnoreWhitespace(); tok != LPAREN {
  1150. return nil, fmt.Errorf("Found %q after FILTER, expect parentheses.", lit)
  1151. }
  1152. if tok, lit := p.scanIgnoreWhitespace(); tok != WHERE {
  1153. return nil, fmt.Errorf("Found %q after FILTER(, expect WHERE.", lit)
  1154. }
  1155. expr, err := p.ParseExpr()
  1156. if err != nil {
  1157. return nil, err
  1158. }
  1159. if tok, lit := p.scanIgnoreWhitespace(); tok != RPAREN {
  1160. return nil, fmt.Errorf("Found %q after FILTER, expect right parentheses.", lit)
  1161. }
  1162. return expr, nil
  1163. }