parser.go 32 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285
  1. package xsql
  2. import (
  3. "fmt"
  4. "github.com/emqx/kuiper/common"
  5. "github.com/golang-collections/collections/stack"
  6. "io"
  7. "math"
  8. "reflect"
  9. "strconv"
  10. "strings"
  11. )
  12. type Parser struct {
  13. s *Scanner
  14. i int // buffer index
  15. n int // buffer char count
  16. buf [3]struct {
  17. tok Token
  18. lit string
  19. }
  20. inmeta bool
  21. }
  22. func (p *Parser) parseCondition() (Expr, error) {
  23. if tok, _ := p.scanIgnoreWhitespace(); tok != WHERE {
  24. p.unscan()
  25. return nil, nil
  26. }
  27. expr, err := p.ParseExpr()
  28. if err != nil {
  29. return nil, err
  30. }
  31. return expr, nil
  32. }
  33. func (p *Parser) scan() (tok Token, lit string) {
  34. if p.n > 0 {
  35. p.n--
  36. return p.curr()
  37. }
  38. tok, lit = p.s.Scan()
  39. if tok != WS && tok != COMMENT {
  40. p.i = (p.i + 1) % len(p.buf)
  41. buf := &p.buf[p.i]
  42. buf.tok, buf.lit = tok, lit
  43. }
  44. return
  45. }
  46. func (p *Parser) curr() (Token, string) {
  47. i := (p.i - p.n + len(p.buf)) % len(p.buf)
  48. buf := &p.buf[i]
  49. return buf.tok, buf.lit
  50. }
  51. func (p *Parser) scanIgnoreWhitespace() (tok Token, lit string) {
  52. tok, lit = p.scan()
  53. for {
  54. if tok == WS || tok == COMMENT {
  55. tok, lit = p.scan()
  56. } else {
  57. break
  58. }
  59. }
  60. return tok, lit
  61. }
  62. func (p *Parser) unscan() { p.n++ }
  63. func NewParser(r io.Reader) *Parser {
  64. return &Parser{s: NewScanner(r)}
  65. }
  66. func (p *Parser) ParseQueries() (SelectStatements, error) {
  67. var stmts SelectStatements
  68. if stmt, err := p.Parse(); err != nil {
  69. return nil, err
  70. } else {
  71. stmts = append(stmts, *stmt)
  72. }
  73. for {
  74. if tok, _ := p.scanIgnoreWhitespace(); tok == SEMICOLON {
  75. if stmt, err := p.Parse(); err != nil {
  76. return nil, err
  77. } else {
  78. if stmt != nil {
  79. stmts = append(stmts, *stmt)
  80. }
  81. }
  82. } else if tok == EOF {
  83. break
  84. }
  85. }
  86. return stmts, nil
  87. }
  88. func (p *Parser) Parse() (*SelectStatement, error) {
  89. selects := &SelectStatement{}
  90. if tok, lit := p.scanIgnoreWhitespace(); tok == EOF {
  91. return nil, nil
  92. } else if tok != SELECT {
  93. return nil, fmt.Errorf("Found %q, Expected SELECT.\n", lit)
  94. }
  95. if fields, err := p.parseFields(); err != nil {
  96. return nil, err
  97. } else {
  98. selects.Fields = fields
  99. }
  100. if src, err := p.parseSource(); err != nil {
  101. return nil, err
  102. } else {
  103. selects.Sources = src
  104. }
  105. if joins, err := p.parseJoins(); err != nil {
  106. return nil, err
  107. } else {
  108. selects.Joins = joins
  109. }
  110. if exp, err := p.parseCondition(); err != nil {
  111. return nil, err
  112. } else {
  113. if exp != nil {
  114. selects.Condition = exp
  115. }
  116. }
  117. if dims, err := p.parseDimensions(); err != nil {
  118. return nil, err
  119. } else {
  120. selects.Dimensions = dims
  121. }
  122. if having, err := p.parseHaving(); err != nil {
  123. return nil, err
  124. } else {
  125. selects.Having = having
  126. }
  127. if sorts, err := p.parseSorts(); err != nil {
  128. return nil, err
  129. } else {
  130. selects.SortFields = sorts
  131. }
  132. if tok, lit := p.scanIgnoreWhitespace(); tok == SEMICOLON {
  133. p.unscan()
  134. return selects, nil
  135. } else if tok != EOF {
  136. return nil, fmt.Errorf("found %q, expected EOF.", lit)
  137. }
  138. if err := Validate(selects); err != nil {
  139. return nil, err
  140. }
  141. return selects, nil
  142. }
  143. func (p *Parser) parseSource() (Sources, error) {
  144. var sources Sources
  145. if tok, lit := p.scanIgnoreWhitespace(); tok != FROM {
  146. return nil, fmt.Errorf("found %q, expected FROM.", lit)
  147. }
  148. if src, alias, err := p.parseSourceLiteral(); err != nil {
  149. return nil, err
  150. } else {
  151. sources = append(sources, &Table{Name: src, Alias: alias})
  152. }
  153. return sources, nil
  154. }
  155. //TODO Current func has problems when the source includes white space.
  156. func (p *Parser) parseSourceLiteral() (string, string, error) {
  157. var sourceSeg []string
  158. var alias string
  159. for {
  160. //HASH, DIV & ADD token is specially support for MQTT topic name patterns.
  161. if tok, lit := p.scanIgnoreWhitespace(); tok.allowedSourceToken() {
  162. sourceSeg = append(sourceSeg, lit)
  163. if tok1, lit1 := p.scanIgnoreWhitespace(); tok1 == AS {
  164. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == IDENT {
  165. alias = lit2
  166. } else {
  167. return "", "", fmt.Errorf("found %q, expected JOIN key word.", lit)
  168. }
  169. } else if tok1.allowedSourceToken() {
  170. sourceSeg = append(sourceSeg, lit1)
  171. } else {
  172. p.unscan()
  173. break
  174. }
  175. } else {
  176. p.unscan()
  177. break
  178. }
  179. }
  180. return strings.Join(sourceSeg, ""), alias, nil
  181. }
  182. func (p *Parser) parseFieldNameSections() ([]string, error) {
  183. var fieldNameSects []string
  184. for {
  185. if tok, lit := p.scanIgnoreWhitespace(); tok == IDENT || tok == ASTERISK {
  186. fieldNameSects = append(fieldNameSects, lit)
  187. if tok1, _ := p.scanIgnoreWhitespace(); !tok1.allowedSFNToken() {
  188. p.unscan()
  189. break
  190. }
  191. } else {
  192. p.unscan()
  193. break
  194. }
  195. }
  196. if len(fieldNameSects) == 0 {
  197. return nil, fmt.Errorf("Cannot find any field name.\n")
  198. } else if len(fieldNameSects) > 2 {
  199. return nil, fmt.Errorf("Too many field names. Please use -> to reference keys in struct.\n")
  200. }
  201. return fieldNameSects, nil
  202. }
  203. func (p *Parser) parseJoins() (Joins, error) {
  204. var joins Joins
  205. for {
  206. if tok, lit := p.scanIgnoreWhitespace(); tok == INNER || tok == LEFT || tok == RIGHT || tok == FULL || tok == CROSS {
  207. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == JOIN {
  208. var jt = INNER_JOIN
  209. switch tok {
  210. case INNER:
  211. jt = INNER_JOIN
  212. case LEFT:
  213. jt = LEFT_JOIN
  214. case RIGHT:
  215. jt = RIGHT_JOIN
  216. case FULL:
  217. jt = FULL_JOIN
  218. case CROSS:
  219. jt = CROSS_JOIN
  220. }
  221. if j, err := p.ParseJoin(jt); err != nil {
  222. return nil, err
  223. } else {
  224. joins = append(joins, *j)
  225. }
  226. } else {
  227. return nil, fmt.Errorf("found %q, expected JOIN key word.", lit)
  228. }
  229. } else {
  230. p.unscan()
  231. if len(joins) > 0 {
  232. return joins, nil
  233. }
  234. return nil, nil
  235. }
  236. }
  237. return joins, nil
  238. }
  239. func (p *Parser) ParseJoin(joinType JoinType) (*Join, error) {
  240. var j = &Join{JoinType: joinType}
  241. if src, alias, err := p.parseSourceLiteral(); err != nil {
  242. return nil, err
  243. } else {
  244. j.Name = src
  245. j.Alias = alias
  246. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == ON {
  247. if CROSS_JOIN == joinType {
  248. return nil, fmt.Errorf("On expression is not required for cross join type.\n")
  249. }
  250. if exp, err := p.ParseExpr(); err != nil {
  251. return nil, err
  252. } else {
  253. j.Expr = exp
  254. }
  255. } else {
  256. p.unscan()
  257. }
  258. }
  259. return j, nil
  260. }
  261. func (p *Parser) parseDimensions() (Dimensions, error) {
  262. var ds Dimensions
  263. if t, _ := p.scanIgnoreWhitespace(); t == GROUP {
  264. if t1, l1 := p.scanIgnoreWhitespace(); t1 == BY {
  265. for {
  266. if exp, err := p.ParseExpr(); err != nil {
  267. return nil, err
  268. } else {
  269. d := Dimension{Expr: exp}
  270. ds = append(ds, d)
  271. }
  272. if tok, _ := p.scanIgnoreWhitespace(); tok == COMMA {
  273. continue
  274. } else {
  275. p.unscan()
  276. break
  277. }
  278. }
  279. } else {
  280. return nil, fmt.Errorf("found %q, expected BY statement.", l1)
  281. }
  282. } else {
  283. p.unscan()
  284. }
  285. return ds, nil
  286. }
  287. func (p *Parser) parseHaving() (Expr, error) {
  288. if tok, _ := p.scanIgnoreWhitespace(); tok != HAVING {
  289. p.unscan()
  290. return nil, nil
  291. }
  292. expr, err := p.ParseExpr()
  293. if err != nil {
  294. return nil, err
  295. }
  296. return expr, nil
  297. }
  298. func (p *Parser) parseSorts() (SortFields, error) {
  299. var ss SortFields
  300. if t, _ := p.scanIgnoreWhitespace(); t == ORDER {
  301. if t1, l1 := p.scanIgnoreWhitespace(); t1 == BY {
  302. for {
  303. if t1, l1 = p.scanIgnoreWhitespace(); t1 == IDENT {
  304. s := SortField{Ascending: true}
  305. p.unscan()
  306. if name, err := p.parseFieldNameSections(); err == nil {
  307. s.Name = strings.Join(name, tokens[COLSEP])
  308. } else {
  309. return nil, err
  310. }
  311. if t2, _ := p.scanIgnoreWhitespace(); t2 == DESC {
  312. s.Ascending = false
  313. ss = append(ss, s)
  314. } else if t2 == ASC {
  315. ss = append(ss, s)
  316. } else {
  317. ss = append(ss, s)
  318. p.unscan()
  319. continue
  320. }
  321. } else if t1 == COMMA {
  322. continue
  323. } else {
  324. p.unscan()
  325. break
  326. }
  327. }
  328. } else {
  329. return nil, fmt.Errorf("found %q, expected BY keyword.", l1)
  330. }
  331. } else {
  332. p.unscan()
  333. }
  334. return ss, nil
  335. }
  336. func (p *Parser) parseFields() (Fields, error) {
  337. var fields Fields
  338. tok, _ := p.scanIgnoreWhitespace()
  339. if tok == ASTERISK {
  340. fields = append(fields, Field{AName: "", Expr: &Wildcard{Token: tok}})
  341. return fields, nil
  342. }
  343. p.unscan()
  344. for {
  345. field, err := p.parseField()
  346. if err != nil {
  347. return nil, err
  348. } else {
  349. fields = append(fields, *field)
  350. }
  351. tok, _ = p.scanIgnoreWhitespace()
  352. if tok != COMMA {
  353. p.unscan()
  354. break
  355. }
  356. }
  357. return fields, nil
  358. }
  359. func (p *Parser) parseField() (*Field, error) {
  360. field := &Field{}
  361. if exp, err := p.ParseExpr(); err != nil {
  362. return nil, err
  363. } else {
  364. if e, ok := exp.(*FieldRef); ok {
  365. field.Name = e.Name
  366. } else if e, ok := exp.(*Call); ok {
  367. field.Name = e.Name
  368. }
  369. field.Expr = exp
  370. }
  371. if alias, err := p.parseAlias(); err != nil {
  372. return nil, err
  373. } else {
  374. if alias != "" {
  375. field.AName = alias
  376. }
  377. }
  378. return field, nil
  379. }
  380. func (p *Parser) parseAlias() (string, error) {
  381. tok, lit := p.scanIgnoreWhitespace()
  382. if tok == AS {
  383. if tok, lit = p.scanIgnoreWhitespace(); tok != IDENT {
  384. return "", fmt.Errorf("found %q, expected as alias.", lit)
  385. } else {
  386. return lit, nil
  387. }
  388. }
  389. p.unscan()
  390. return "", nil
  391. }
  392. func (p *Parser) ParseExpr() (Expr, error) {
  393. var err error
  394. root := &BinaryExpr{}
  395. root.RHS, err = p.parseUnaryExpr(false)
  396. if err != nil {
  397. return nil, err
  398. }
  399. for {
  400. op, _ := p.scanIgnoreWhitespace()
  401. if !op.isOperator() {
  402. p.unscan()
  403. return root.RHS, nil
  404. } else if op == ASTERISK { //Change the asterisk to Mul token.
  405. op = MUL
  406. } else if op == LBRACKET { //LBRACKET is a special token, need to unscan
  407. op = SUBSET
  408. p.unscan()
  409. }
  410. var rhs Expr
  411. if rhs, err = p.parseUnaryExpr(op == ARROW); err != nil {
  412. return nil, err
  413. }
  414. for node := root; ; {
  415. r, ok := node.RHS.(*BinaryExpr)
  416. if !ok || r.OP.Precedence() >= op.Precedence() {
  417. node.RHS = &BinaryExpr{LHS: node.RHS, RHS: rhs, OP: op}
  418. break
  419. }
  420. node = r
  421. }
  422. }
  423. return nil, nil
  424. }
  425. func (p *Parser) parseUnaryExpr(isSubField bool) (Expr, error) {
  426. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == LPAREN {
  427. expr, err := p.ParseExpr()
  428. if err != nil {
  429. return nil, err
  430. }
  431. // Expect an RPAREN at the end.
  432. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 != RPAREN {
  433. return nil, fmt.Errorf("found %q, expected right paren.", lit2)
  434. }
  435. return &ParenExpr{Expr: expr}, nil
  436. } else if tok1 == LBRACKET {
  437. return p.parseBracketExpr()
  438. }
  439. p.unscan()
  440. tok, lit := p.scanIgnoreWhiteSpaceWithNegativeNum()
  441. if tok == CASE {
  442. return p.parseCaseExpr()
  443. } else if tok == IDENT {
  444. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == LPAREN {
  445. return p.parseCall(lit)
  446. }
  447. p.unscan() //Back the Lparen token
  448. p.unscan() //Back the ident token
  449. if n, err := p.parseFieldNameSections(); err != nil {
  450. return nil, err
  451. } else {
  452. if p.inmeta {
  453. if len(n) == 2 {
  454. return &MetaRef{StreamName: StreamName(n[0]), Name: n[1]}, nil
  455. }
  456. if isSubField {
  457. return &MetaRef{StreamName: "", Name: n[0]}, nil
  458. }
  459. return &MetaRef{StreamName: DefaultStream, Name: n[0]}, nil
  460. } else {
  461. if len(n) == 2 {
  462. return &FieldRef{StreamName: StreamName(n[0]), Name: n[1]}, nil
  463. }
  464. if isSubField {
  465. return &FieldRef{StreamName: "", Name: n[0]}, nil
  466. }
  467. return &FieldRef{StreamName: DefaultStream, Name: n[0]}, nil
  468. }
  469. }
  470. } else if tok == STRING {
  471. return &StringLiteral{Val: lit}, nil
  472. } else if tok == INTEGER {
  473. val, _ := strconv.Atoi(lit)
  474. return &IntegerLiteral{Val: val}, nil
  475. } else if tok == NUMBER {
  476. if v, err := strconv.ParseFloat(lit, 64); err != nil {
  477. return nil, fmt.Errorf("found %q, invalid number value.", lit)
  478. } else {
  479. return &NumberLiteral{Val: v}, nil
  480. }
  481. } else if tok == TRUE || tok == FALSE {
  482. if v, err := strconv.ParseBool(lit); err != nil {
  483. return nil, fmt.Errorf("found %q, invalid boolean value.", lit)
  484. } else {
  485. return &BooleanLiteral{Val: v}, nil
  486. }
  487. } else if tok.isTimeLiteral() {
  488. return &TimeLiteral{Val: tok}, nil
  489. }
  490. return nil, fmt.Errorf("found %q, expected expression.", lit)
  491. }
  492. func (p *Parser) parseBracketExpr() (Expr, error) {
  493. tok2, lit2 := p.scanIgnoreWhiteSpaceWithNegativeNum()
  494. if tok2 == RBRACKET {
  495. //field[]
  496. return &ColonExpr{Start: 0, End: math.MinInt32}, nil
  497. } else if tok2 == INTEGER {
  498. start, err := strconv.Atoi(lit2)
  499. if err != nil {
  500. return nil, fmt.Errorf("The start index %s is not an int value in bracket expression.", lit2)
  501. }
  502. if tok3, _ := p.scanIgnoreWhitespace(); tok3 == RBRACKET {
  503. //Such as field[2]
  504. return &IndexExpr{Index: start}, nil
  505. } else if tok3 == COLON {
  506. //Such as field[2:] or field[2:4]
  507. return p.parseColonExpr(start)
  508. }
  509. } else if tok2 == COLON {
  510. //Such as field[:3] or [:]
  511. return p.parseColonExpr(0)
  512. }
  513. return nil, fmt.Errorf("Unexpected token %q. when parsing bracket expressions.", lit2)
  514. }
  515. func (p *Parser) parseColonExpr(start int) (Expr, error) {
  516. tok, lit := p.scanIgnoreWhiteSpaceWithNegativeNum()
  517. if tok == INTEGER {
  518. end, err := strconv.Atoi(lit)
  519. if err != nil {
  520. return nil, fmt.Errorf("The end index %s is not an int value in bracket expression.", lit)
  521. }
  522. if tok1, lit1 := p.scanIgnoreWhitespace(); tok1 == RBRACKET {
  523. return &ColonExpr{Start: start, End: end}, nil
  524. } else {
  525. return nil, fmt.Errorf("Found %q, expected right bracket.", lit1)
  526. }
  527. } else if tok == RBRACKET {
  528. return &ColonExpr{Start: start, End: math.MinInt32}, nil
  529. }
  530. return nil, fmt.Errorf("Found %q, expected right bracket.", lit)
  531. }
  532. func (p *Parser) scanIgnoreWhiteSpaceWithNegativeNum() (Token, string) {
  533. tok, lit := p.scanIgnoreWhitespace()
  534. if tok == SUB {
  535. _, _ = p.s.ScanWhiteSpace()
  536. r := p.s.read()
  537. if isDigit(r) {
  538. p.s.unread()
  539. tok, lit = p.s.ScanNumber(false, true)
  540. }
  541. }
  542. return tok, lit
  543. }
  544. func (p *Parser) parseAs(f *Field) (*Field, error) {
  545. tok, lit := p.scanIgnoreWhitespace()
  546. if tok != IDENT {
  547. return nil, fmt.Errorf("found %q, expected as alias.", lit)
  548. }
  549. f.AName = lit
  550. return f, nil
  551. }
  552. func (p *Parser) parseCall(name string) (Expr, error) {
  553. if strings.ToLower(name) == "meta" || strings.ToLower(name) == "mqtt" {
  554. p.inmeta = true
  555. defer func() {
  556. p.inmeta = false
  557. }()
  558. }
  559. var args []Expr
  560. for {
  561. if tok, _ := p.scanIgnoreWhitespace(); tok == RPAREN {
  562. if valErr := validateFuncs(name, nil); valErr != nil {
  563. return nil, valErr
  564. }
  565. return &Call{Name: name, Args: args}, nil
  566. } else if tok == ASTERISK {
  567. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 != RPAREN {
  568. return nil, fmt.Errorf("found %q, expected right paren.", lit2)
  569. } else {
  570. if p.inmeta {
  571. args = append(args, &MetaRef{StreamName: "", Name: "*"})
  572. } else {
  573. args = append(args, &Wildcard{Token: ASTERISK})
  574. }
  575. return &Call{Name: name, Args: args}, nil
  576. }
  577. } else {
  578. p.unscan()
  579. }
  580. if exp, err := p.ParseExpr(); err != nil {
  581. return nil, err
  582. } else {
  583. args = append(args, exp)
  584. }
  585. if tok, _ := p.scanIgnoreWhitespace(); tok != COMMA {
  586. p.unscan()
  587. break
  588. }
  589. }
  590. if tok, lit := p.scanIgnoreWhitespace(); tok != RPAREN {
  591. return nil, fmt.Errorf("found function call %q, expected ), but with %q.", name, lit)
  592. }
  593. if wt, error := validateWindows(name, args); wt == NOT_WINDOW {
  594. if valErr := validateFuncs(name, args); valErr != nil {
  595. return nil, valErr
  596. }
  597. // Add context for some aggregate func
  598. if name == "deduplicate" {
  599. args = append([]Expr{&Wildcard{Token: ASTERISK}}, args...)
  600. }
  601. return &Call{Name: name, Args: args}, nil
  602. } else {
  603. if error != nil {
  604. return nil, error
  605. }
  606. win, err := p.ConvertToWindows(wt, args)
  607. if err != nil {
  608. return nil, error
  609. }
  610. // parse filter clause
  611. f, err := p.parseFilter()
  612. if err != nil {
  613. return nil, err
  614. } else if f != nil {
  615. win.Filter = f
  616. }
  617. return win, nil
  618. }
  619. }
  620. func (p *Parser) parseCaseExpr() (*CaseExpr, error) {
  621. c := &CaseExpr{}
  622. tok, _ := p.scanIgnoreWhitespace()
  623. p.unscan()
  624. if tok != WHEN { // no condition value for case, additional validation needed
  625. if exp, err := p.ParseExpr(); err != nil {
  626. return nil, err
  627. } else {
  628. c.Value = exp
  629. }
  630. }
  631. loop:
  632. for {
  633. tok, _ := p.scanIgnoreWhitespace()
  634. switch tok {
  635. case WHEN:
  636. if exp, err := p.ParseExpr(); err != nil {
  637. return nil, err
  638. } else {
  639. if c.WhenClauses == nil {
  640. c.WhenClauses = make([]*WhenClause, 0)
  641. }
  642. if c.Value == nil && !isBooleanArg(exp) {
  643. return nil, fmt.Errorf("invalid CASE expression, WHEN expression must be a bool condition")
  644. }
  645. w := &WhenClause{
  646. Expr: exp,
  647. }
  648. tokThen, _ := p.scanIgnoreWhitespace()
  649. if tokThen != THEN {
  650. return nil, fmt.Errorf("invalid CASE expression, THEN expected after WHEN")
  651. } else {
  652. if expThen, err := p.ParseExpr(); err != nil {
  653. return nil, err
  654. } else {
  655. w.Result = expThen
  656. c.WhenClauses = append(c.WhenClauses, w)
  657. }
  658. }
  659. }
  660. case ELSE:
  661. if c.WhenClauses != nil {
  662. if exp, err := p.ParseExpr(); err != nil {
  663. return nil, err
  664. } else {
  665. c.ElseClause = exp
  666. }
  667. } else {
  668. return nil, fmt.Errorf("invalid CASE expression, WHEN expected before ELSE")
  669. }
  670. case END:
  671. if c.WhenClauses != nil {
  672. break loop
  673. } else {
  674. return nil, fmt.Errorf("invalid CASE expression, WHEN expected before END")
  675. }
  676. default:
  677. return nil, fmt.Errorf("invalid CASE expression, END expected")
  678. }
  679. }
  680. return c, nil
  681. }
  682. func validateWindows(name string, args []Expr) (WindowType, error) {
  683. fname := strings.ToLower(name)
  684. switch fname {
  685. case "tumblingwindow":
  686. if err := validateWindow(fname, 2, args); err != nil {
  687. return TUMBLING_WINDOW, err
  688. }
  689. return TUMBLING_WINDOW, nil
  690. case "hoppingwindow":
  691. if err := validateWindow(fname, 3, args); err != nil {
  692. return HOPPING_WINDOW, err
  693. }
  694. return HOPPING_WINDOW, nil
  695. case "sessionwindow":
  696. if err := validateWindow(fname, 3, args); err != nil {
  697. return SESSION_WINDOW, err
  698. }
  699. return SESSION_WINDOW, nil
  700. case "slidingwindow":
  701. if err := validateWindow(fname, 2, args); err != nil {
  702. return SLIDING_WINDOW, err
  703. }
  704. return SLIDING_WINDOW, nil
  705. case "countwindow":
  706. if len(args) == 1 {
  707. if para1, ok := args[0].(*IntegerLiteral); ok && para1.Val > 0 {
  708. return COUNT_WINDOW, nil
  709. } else {
  710. return COUNT_WINDOW, fmt.Errorf("Invalid parameter value %s.", args[0])
  711. }
  712. } else if len(args) == 2 {
  713. if para1, ok1 := args[0].(*IntegerLiteral); ok1 {
  714. if para2, ok2 := args[1].(*IntegerLiteral); ok2 {
  715. if para1.Val < para2.Val {
  716. return COUNT_WINDOW, fmt.Errorf("The second parameter value %d should be less than the first parameter %d.", para2.Val, para1.Val)
  717. } else {
  718. return COUNT_WINDOW, nil
  719. }
  720. }
  721. }
  722. return COUNT_WINDOW, fmt.Errorf("Invalid parameter value %s, %s.", args[0], args[1])
  723. } else {
  724. return COUNT_WINDOW, fmt.Errorf("Invalid parameter count.")
  725. }
  726. }
  727. return NOT_WINDOW, nil
  728. }
  729. func validateWindow(funcName string, expectLen int, args []Expr) error {
  730. if len(args) != expectLen {
  731. return fmt.Errorf("The arguments for %s should be %d.\n", funcName, expectLen)
  732. }
  733. if _, ok := args[0].(*TimeLiteral); !ok {
  734. return fmt.Errorf("The 1st argument for %s is expecting timer literal expression. One value of [dd|hh|mi|ss|ms].\n", funcName)
  735. }
  736. for i := 1; i < len(args); i++ {
  737. if _, ok := args[i].(*IntegerLiteral); !ok {
  738. return fmt.Errorf("The %d argument for %s is expecting interger literal expression. \n", i, funcName)
  739. }
  740. }
  741. return nil
  742. }
  743. func (p *Parser) ConvertToWindows(wtype WindowType, args []Expr) (*Window, error) {
  744. win := &Window{WindowType: wtype}
  745. if wtype == COUNT_WINDOW {
  746. win.Length = &IntegerLiteral{Val: args[0].(*IntegerLiteral).Val}
  747. if len(args) == 2 {
  748. win.Interval = &IntegerLiteral{Val: args[1].(*IntegerLiteral).Val}
  749. }
  750. return win, nil
  751. }
  752. var unit = 1
  753. v := args[0].(*TimeLiteral).Val
  754. switch v {
  755. case DD:
  756. unit = 24 * 3600 * 1000
  757. case HH:
  758. unit = 3600 * 1000
  759. case MI:
  760. unit = 60 * 1000
  761. case SS:
  762. unit = 1000
  763. case MS:
  764. unit = 1
  765. default:
  766. return nil, fmt.Errorf("Invalid timeliteral %s", v)
  767. }
  768. win.Length = &IntegerLiteral{Val: args[1].(*IntegerLiteral).Val * unit}
  769. if len(args) > 2 {
  770. win.Interval = &IntegerLiteral{Val: args[2].(*IntegerLiteral).Val * unit}
  771. } else {
  772. win.Interval = &IntegerLiteral{Val: 0}
  773. }
  774. return win, nil
  775. }
  776. func (p *Parser) ParseCreateStmt() (Statement, error) {
  777. if tok, _ := p.scanIgnoreWhitespace(); tok == CREATE {
  778. tok1, lit1 := p.scanIgnoreWhitespace()
  779. stmt := &StreamStmt{}
  780. switch tok1 {
  781. case STREAM:
  782. stmt.StreamType = TypeStream
  783. case TABLE:
  784. stmt.StreamType = TypeTable
  785. default:
  786. return nil, fmt.Errorf("found %q, expected keyword stream or table.", lit1)
  787. }
  788. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == IDENT {
  789. stmt.Name = StreamName(lit2)
  790. if fields, err := p.parseStreamFields(); err != nil {
  791. return nil, err
  792. } else {
  793. stmt.StreamFields = fields
  794. }
  795. if opts, err := p.parseStreamOptions(); err != nil {
  796. return nil, err
  797. } else {
  798. stmt.Options = opts
  799. }
  800. if tok3, lit3 := p.scanIgnoreWhitespace(); tok3 == SEMICOLON {
  801. p.unscan()
  802. } else if tok3 == EOF {
  803. //Finish parsing create stream statement. Jump to validate
  804. } else {
  805. return nil, fmt.Errorf("found %q, expected semicolon or EOF.", lit3)
  806. }
  807. } else {
  808. return nil, fmt.Errorf("found %q, expected stream name.", lit2)
  809. }
  810. if valErr := validateStream(stmt); valErr != nil {
  811. return nil, valErr
  812. }
  813. return stmt, nil
  814. } else {
  815. p.unscan()
  816. return nil, nil
  817. }
  818. }
  819. // TODO more accurate validation for table
  820. func validateStream(stmt *StreamStmt) error {
  821. f := stmt.Options.FORMAT
  822. if f == "" {
  823. f = common.FORMAT_JSON
  824. }
  825. switch strings.ToLower(f) {
  826. case common.FORMAT_JSON:
  827. //do nothing
  828. case common.FORMAT_BINARY:
  829. if stmt.StreamType == TypeTable {
  830. return fmt.Errorf("'binary' format is not supported for table")
  831. }
  832. switch len(stmt.StreamFields) {
  833. case 0:
  834. // do nothing for schemaless
  835. case 1:
  836. f := stmt.StreamFields[0]
  837. if bt, ok := f.FieldType.(*BasicType); ok {
  838. if bt.Type == BYTEA {
  839. break
  840. }
  841. }
  842. return fmt.Errorf("'binary' format stream can have only 'bytea' type field")
  843. default:
  844. return fmt.Errorf("'binary' format stream can have only one field")
  845. }
  846. default:
  847. return fmt.Errorf("option 'format=%s' is invalid", f)
  848. }
  849. return nil
  850. }
  851. func (p *Parser) parseShowStmt() (Statement, error) {
  852. if tok, _ := p.scanIgnoreWhitespace(); tok == SHOW {
  853. tok1, lit1 := p.scanIgnoreWhitespace()
  854. switch tok1 {
  855. case STREAMS:
  856. ss := &ShowStreamsStatement{}
  857. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == EOF || tok2 == SEMICOLON {
  858. return ss, nil
  859. } else {
  860. return nil, fmt.Errorf("found %q, expected semecolon or EOF.", lit2)
  861. }
  862. case TABLES:
  863. ss := &ShowTablesStatement{}
  864. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == EOF || tok2 == SEMICOLON {
  865. return ss, nil
  866. } else {
  867. return nil, fmt.Errorf("found %q, expected semecolon or EOF.", lit2)
  868. }
  869. default:
  870. return nil, fmt.Errorf("found %q, expected keyword streams or tables.", lit1)
  871. }
  872. } else {
  873. p.unscan()
  874. return nil, nil
  875. }
  876. }
  877. func (p *Parser) parseDescribeStmt() (Statement, error) {
  878. if tok, _ := p.scanIgnoreWhitespace(); tok == DESCRIBE {
  879. tok1, lit1 := p.scanIgnoreWhitespace()
  880. switch tok1 {
  881. case STREAM:
  882. dss := &DescribeStreamStatement{}
  883. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == IDENT {
  884. dss.Name = lit2
  885. return dss, nil
  886. } else {
  887. return nil, fmt.Errorf("found %q, expected stream name.", lit2)
  888. }
  889. case TABLE:
  890. dss := &DescribeTableStatement{}
  891. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == IDENT {
  892. dss.Name = lit2
  893. return dss, nil
  894. } else {
  895. return nil, fmt.Errorf("found %q, expected table name.", lit2)
  896. }
  897. default:
  898. return nil, fmt.Errorf("found %q, expected keyword stream or table.", lit1)
  899. }
  900. } else {
  901. p.unscan()
  902. return nil, nil
  903. }
  904. }
  905. func (p *Parser) parseExplainStmt() (Statement, error) {
  906. if tok, _ := p.scanIgnoreWhitespace(); tok == EXPLAIN {
  907. tok1, lit1 := p.scanIgnoreWhitespace()
  908. switch tok1 {
  909. case STREAM:
  910. ess := &ExplainStreamStatement{}
  911. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == IDENT {
  912. ess.Name = lit2
  913. return ess, nil
  914. } else {
  915. return nil, fmt.Errorf("found %q, expected stream name.", lit2)
  916. }
  917. case TABLE:
  918. ess := &ExplainTableStatement{}
  919. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == IDENT {
  920. ess.Name = lit2
  921. return ess, nil
  922. } else {
  923. return nil, fmt.Errorf("found %q, expected table name.", lit2)
  924. }
  925. default:
  926. return nil, fmt.Errorf("found %q, expected keyword stream or table.", lit1)
  927. }
  928. } else {
  929. p.unscan()
  930. return nil, nil
  931. }
  932. }
  933. func (p *Parser) parseDropStmt() (Statement, error) {
  934. if tok, _ := p.scanIgnoreWhitespace(); tok == DROP {
  935. tok1, lit1 := p.scanIgnoreWhitespace()
  936. switch tok1 {
  937. case STREAM:
  938. ess := &DropStreamStatement{}
  939. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == IDENT {
  940. ess.Name = lit2
  941. return ess, nil
  942. } else {
  943. return nil, fmt.Errorf("found %q, expected stream name.", lit2)
  944. }
  945. case TABLE:
  946. ess := &DropTableStatement{}
  947. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == IDENT {
  948. ess.Name = lit2
  949. return ess, nil
  950. } else {
  951. return nil, fmt.Errorf("found %q, expected table name.", lit2)
  952. }
  953. default:
  954. return nil, fmt.Errorf("found %q, expected keyword stream or table.", lit1)
  955. }
  956. } else {
  957. p.unscan()
  958. return nil, nil
  959. }
  960. }
  961. func (p *Parser) parseStreamFields() (StreamFields, error) {
  962. lStack := &stack.Stack{}
  963. var fields StreamFields
  964. if tok, lit := p.scanIgnoreWhitespace(); tok == LPAREN {
  965. lStack.Push(lit)
  966. for {
  967. //For the schemaless streams
  968. //create stream demo () WITH (FORMAT="JSON", DATASOURCE="demo" TYPE="edgex")
  969. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == RPAREN {
  970. lStack.Pop()
  971. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 != WITH {
  972. return nil, fmt.Errorf("found %q, expected is with.", lit2)
  973. }
  974. return fields, nil
  975. } else {
  976. p.unscan()
  977. }
  978. if f, err := p.parseStreamField(); err != nil {
  979. return nil, err
  980. } else {
  981. fields = append(fields, *f)
  982. }
  983. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == RPAREN {
  984. lStack.Pop()
  985. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == WITH {
  986. //Check the stack for LPAREN; If the stack for LPAREN is not zero, then it's not correct.
  987. if lStack.Len() > 0 {
  988. return nil, fmt.Errorf("Parenthesis is not matched.")
  989. }
  990. break
  991. } else if tok2 == COMMA {
  992. if lStack.Len() > 0 {
  993. return nil, fmt.Errorf("Parenthesis is in create record type not matched.")
  994. }
  995. p.unscan()
  996. break
  997. } else if tok2 == RPAREN { //The nested type definition of ARRAY and Struct, such as "field ARRAY(STRUCT(f BIGINT))"
  998. if lStack.Len() > 0 {
  999. return nil, fmt.Errorf("Parenthesis is not matched.")
  1000. }
  1001. p.unscan()
  1002. break
  1003. } else {
  1004. if lStack.Len() == 0 {
  1005. return nil, fmt.Errorf("found %q, expected is with.", lit2)
  1006. }
  1007. p.unscan()
  1008. }
  1009. } else {
  1010. p.unscan()
  1011. }
  1012. }
  1013. } else {
  1014. return nil, fmt.Errorf("found %q, expected lparen after stream name.", lit)
  1015. }
  1016. return fields, nil
  1017. }
  1018. func (p *Parser) parseStreamField() (*StreamField, error) {
  1019. field := &StreamField{}
  1020. if tok, lit := p.scanIgnoreWhitespace(); tok == IDENT {
  1021. field.Name = lit
  1022. tok1, lit1 := p.scanIgnoreWhitespace()
  1023. if t := getDataType(tok1); t != UNKNOWN && t.isSimpleType() {
  1024. field.FieldType = &BasicType{Type: t}
  1025. } else if t == ARRAY {
  1026. if f, e := p.parseStreamArrayType(); e != nil {
  1027. return nil, e
  1028. } else {
  1029. field.FieldType = f
  1030. }
  1031. } else if t == STRUCT {
  1032. if f, e := p.parseStreamStructType(); e != nil {
  1033. return nil, e
  1034. } else {
  1035. field.FieldType = f
  1036. }
  1037. } else if t == UNKNOWN {
  1038. return nil, fmt.Errorf("found %q, expect valid stream field types(BIGINT | FLOAT | STRINGS | DATETIME | BOOLEAN | BYTEA | ARRAY | STRUCT).", lit1)
  1039. }
  1040. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == COMMA {
  1041. //Just consume the comma.
  1042. } else if tok2 == RPAREN {
  1043. p.unscan()
  1044. } else {
  1045. return nil, fmt.Errorf("found %q, expect comma or rparen.", lit2)
  1046. }
  1047. } else {
  1048. return nil, fmt.Errorf("found %q, expect stream field name.", lit)
  1049. }
  1050. return field, nil
  1051. }
  1052. func (p *Parser) parseStreamArrayType() (FieldType, error) {
  1053. lStack := &stack.Stack{}
  1054. if tok, _ := p.scanIgnoreWhitespace(); tok == LPAREN {
  1055. lStack.Push(LPAREN)
  1056. tok1, lit1 := p.scanIgnoreWhitespace()
  1057. if t := getDataType(tok1); t != UNKNOWN && t.isSimpleType() {
  1058. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == RPAREN {
  1059. lStack.Pop()
  1060. if lStack.Len() > 0 {
  1061. return nil, fmt.Errorf("Parenthesis is in array type not matched.")
  1062. }
  1063. return &ArrayType{Type: t}, nil
  1064. } else {
  1065. return nil, fmt.Errorf("found %q, expect rparen in array type definition.", lit2)
  1066. }
  1067. } else if tok1 == XSTRUCT {
  1068. if f, err := p.parseStreamStructType(); err != nil {
  1069. return nil, err
  1070. } else {
  1071. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == RPAREN {
  1072. lStack.Pop()
  1073. if lStack.Len() > 0 {
  1074. return nil, fmt.Errorf("Parenthesis is in struct of array type %q not matched.", tok1)
  1075. }
  1076. return &ArrayType{Type: STRUCT, FieldType: f}, nil
  1077. } else {
  1078. return nil, fmt.Errorf("found %q, expect rparen in struct of array type definition.", lit2)
  1079. }
  1080. }
  1081. } else if tok1 == COMMA {
  1082. p.unscan()
  1083. } else {
  1084. return nil, fmt.Errorf("found %q, expect stream data types.", lit1)
  1085. }
  1086. } else {
  1087. }
  1088. return nil, nil
  1089. }
  1090. func (p *Parser) parseStreamStructType() (FieldType, error) {
  1091. rf := &RecType{}
  1092. if sfs, err := p.parseStreamFields(); err != nil {
  1093. return nil, err
  1094. } else {
  1095. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == COMMA {
  1096. rf.StreamFields = sfs
  1097. p.unscan()
  1098. } else if tok2 == RPAREN {
  1099. rf.StreamFields = sfs
  1100. p.unscan()
  1101. } else {
  1102. return nil, fmt.Errorf("found %q, expect comma in create stream record statement.", lit2)
  1103. }
  1104. }
  1105. return rf, nil
  1106. }
  1107. func (p *Parser) parseStreamOptions() (*Options, error) {
  1108. opts := &Options{}
  1109. v := reflect.ValueOf(opts)
  1110. lStack := &stack.Stack{}
  1111. if tok, lit := p.scanIgnoreWhitespace(); tok == LPAREN {
  1112. lStack.Push(LPAREN)
  1113. for {
  1114. if tok1, lit1 := p.scanIgnoreWhitespace(); tok1 == DATASOURCE || tok1 == FORMAT || tok1 == KEY || tok1 == CONF_KEY || tok1 == STRICT_VALIDATION || tok1 == TYPE || tok1 == TIMESTAMP || tok1 == TIMESTAMP_FORMAT || tok1 == RETAIN_SIZE || tok1 == SHARED {
  1115. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == EQ {
  1116. if tok3, lit3 := p.scanIgnoreWhitespace(); tok3 == STRING {
  1117. switch tok1 {
  1118. case STRICT_VALIDATION:
  1119. if val := strings.ToUpper(lit3); (val != "TRUE") && (val != "FALSE") {
  1120. return nil, fmt.Errorf("found %q, expect TRUE/FALSE value in %s option.", lit3, tok1)
  1121. } else {
  1122. opts.STRICT_VALIDATION = (val == "TRUE")
  1123. }
  1124. case RETAIN_SIZE:
  1125. if val, err := strconv.Atoi(lit3); err != nil {
  1126. return nil, fmt.Errorf("found %q, expect number value in %s option.", lit3, tok1)
  1127. } else {
  1128. opts.RETAIN_SIZE = val
  1129. }
  1130. case SHARED:
  1131. if val := strings.ToUpper(lit3); (val != "TRUE") && (val != "FALSE") {
  1132. return nil, fmt.Errorf("found %q, expect TRUE/FALSE value in %s option.", lit3, tok1)
  1133. } else {
  1134. opts.SHARED = (val == "TRUE")
  1135. }
  1136. default:
  1137. f := v.Elem().FieldByName(lit1)
  1138. if f.IsValid() {
  1139. f.SetString(lit3)
  1140. } else { // should not happen
  1141. return nil, fmt.Errorf("invalid field %s.", lit1)
  1142. }
  1143. }
  1144. } else {
  1145. return nil, fmt.Errorf("found %q, expect string value in option.", lit3)
  1146. }
  1147. } else {
  1148. return nil, fmt.Errorf("found %q, expect equals(=) in options.", lit2)
  1149. }
  1150. } else if tok1 == COMMA {
  1151. continue
  1152. } else if tok1 == RPAREN {
  1153. if lStack.Pop(); lStack.Len() == 0 {
  1154. break
  1155. } else {
  1156. return nil, fmt.Errorf("Parenthesis is not matched in options definition.")
  1157. }
  1158. } else {
  1159. return nil, fmt.Errorf("found %q, unknown option keys(DATASOURCE|FORMAT|KEY|CONF_KEY|SHARED|STRICT_VALIDATION|TYPE|TIMESTAMP|TIMESTAMP_FORMAT|RETAIN_SIZE).", lit1)
  1160. }
  1161. }
  1162. } else {
  1163. return nil, fmt.Errorf("found %q, expect stream options.", lit)
  1164. }
  1165. return opts, nil
  1166. }
  1167. // Only support filter on window now
  1168. func (p *Parser) parseFilter() (Expr, error) {
  1169. if tok, _ := p.scanIgnoreWhitespace(); tok != FILTER {
  1170. p.unscan()
  1171. return nil, nil
  1172. }
  1173. if tok, lit := p.scanIgnoreWhitespace(); tok != LPAREN {
  1174. return nil, fmt.Errorf("Found %q after FILTER, expect parentheses.", lit)
  1175. }
  1176. if tok, lit := p.scanIgnoreWhitespace(); tok != WHERE {
  1177. return nil, fmt.Errorf("Found %q after FILTER(, expect WHERE.", lit)
  1178. }
  1179. expr, err := p.ParseExpr()
  1180. if err != nil {
  1181. return nil, err
  1182. }
  1183. if tok, lit := p.scanIgnoreWhitespace(); tok != RPAREN {
  1184. return nil, fmt.Errorf("Found %q after FILTER, expect right parentheses.", lit)
  1185. }
  1186. return expr, nil
  1187. }