parser.go 27 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100
  1. package xsql
  2. import (
  3. "fmt"
  4. "github.com/golang-collections/collections/stack"
  5. "io"
  6. "strconv"
  7. "strings"
  8. )
  9. type Parser struct {
  10. s *Scanner
  11. i int // buffer index
  12. n int // buffer char count
  13. buf [3]struct {
  14. tok Token
  15. lit string
  16. }
  17. inmeta bool
  18. }
  19. func (p *Parser) parseCondition() (Expr, error) {
  20. if tok, _ := p.scanIgnoreWhitespace(); tok != WHERE {
  21. p.unscan()
  22. return nil, nil
  23. }
  24. expr, err := p.ParseExpr()
  25. if err != nil {
  26. return nil, err
  27. }
  28. return expr, nil
  29. }
  30. func (p *Parser) scan() (tok Token, lit string) {
  31. if p.n > 0 {
  32. p.n--
  33. return p.curr()
  34. }
  35. tok, lit = p.s.Scan()
  36. if tok != WS && tok != COMMENT {
  37. p.i = (p.i + 1) % len(p.buf)
  38. buf := &p.buf[p.i]
  39. buf.tok, buf.lit = tok, lit
  40. }
  41. return
  42. }
  43. func (p *Parser) curr() (Token, string) {
  44. i := (p.i - p.n + len(p.buf)) % len(p.buf)
  45. buf := &p.buf[i]
  46. return buf.tok, buf.lit
  47. }
  48. func (p *Parser) scanIgnoreWhitespace() (tok Token, lit string) {
  49. tok, lit = p.scan()
  50. for {
  51. if tok == WS || tok == COMMENT {
  52. tok, lit = p.scan()
  53. } else {
  54. break
  55. }
  56. }
  57. return tok, lit
  58. }
  59. func (p *Parser) unscan() { p.n++ }
  60. func NewParser(r io.Reader) *Parser {
  61. return &Parser{s: NewScanner(r)}
  62. }
  63. func (p *Parser) ParseQueries() (SelectStatements, error) {
  64. var stmts SelectStatements
  65. if stmt, err := p.Parse(); err != nil {
  66. return nil, err
  67. } else {
  68. stmts = append(stmts, *stmt)
  69. }
  70. for {
  71. if tok, _ := p.scanIgnoreWhitespace(); tok == SEMICOLON {
  72. if stmt, err := p.Parse(); err != nil {
  73. return nil, err
  74. } else {
  75. if stmt != nil {
  76. stmts = append(stmts, *stmt)
  77. }
  78. }
  79. } else if tok == EOF {
  80. break
  81. }
  82. }
  83. return stmts, nil
  84. }
  85. func (p *Parser) Parse() (*SelectStatement, error) {
  86. selects := &SelectStatement{}
  87. if tok, lit := p.scanIgnoreWhitespace(); tok == EOF {
  88. return nil, nil
  89. } else if tok != SELECT {
  90. return nil, fmt.Errorf("Found %q, Expected SELECT.\n", lit)
  91. }
  92. if fields, err := p.parseFields(); err != nil {
  93. return nil, err
  94. } else {
  95. selects.Fields = fields
  96. }
  97. if src, err := p.parseSource(); err != nil {
  98. return nil, err
  99. } else {
  100. selects.Sources = src
  101. }
  102. if joins, err := p.parseJoins(); err != nil {
  103. return nil, err
  104. } else {
  105. selects.Joins = joins
  106. }
  107. if exp, err := p.parseCondition(); err != nil {
  108. return nil, err
  109. } else {
  110. if exp != nil {
  111. selects.Condition = exp
  112. }
  113. }
  114. if dims, err := p.parseDimensions(); err != nil {
  115. return nil, err
  116. } else {
  117. selects.Dimensions = dims
  118. }
  119. if having, err := p.parseHaving(); err != nil {
  120. return nil, err
  121. } else {
  122. selects.Having = having
  123. }
  124. if sorts, err := p.parseSorts(); err != nil {
  125. return nil, err
  126. } else {
  127. selects.SortFields = sorts
  128. }
  129. if tok, lit := p.scanIgnoreWhitespace(); tok == SEMICOLON {
  130. p.unscan()
  131. return selects, nil
  132. } else if tok != EOF {
  133. return nil, fmt.Errorf("found %q, expected EOF.", lit)
  134. }
  135. if err := Validate(selects); err != nil {
  136. return nil, err
  137. }
  138. return selects, nil
  139. }
  140. func (p *Parser) parseSource() (Sources, error) {
  141. var sources Sources
  142. if tok, lit := p.scanIgnoreWhitespace(); tok != FROM {
  143. return nil, fmt.Errorf("found %q, expected FROM.", lit)
  144. }
  145. if src, alias, err := p.parseSourceLiteral(); err != nil {
  146. return nil, err
  147. } else {
  148. sources = append(sources, &Table{Name: src, Alias: alias})
  149. }
  150. return sources, nil
  151. }
  152. //TODO Current func has problems when the source includes white space.
  153. func (p *Parser) parseSourceLiteral() (string, string, error) {
  154. var sourceSeg []string
  155. var alias string
  156. for {
  157. //HASH, DIV & ADD token is specially support for MQTT topic name patterns.
  158. if tok, lit := p.scanIgnoreWhitespace(); tok.allowedSourceToken() {
  159. sourceSeg = append(sourceSeg, lit)
  160. if tok1, lit1 := p.scanIgnoreWhitespace(); tok1 == AS {
  161. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == IDENT {
  162. alias = lit2
  163. } else {
  164. return "", "", fmt.Errorf("found %q, expected JOIN key word.", lit)
  165. }
  166. } else if tok1.allowedSourceToken() {
  167. sourceSeg = append(sourceSeg, lit1)
  168. } else {
  169. p.unscan()
  170. break
  171. }
  172. } else {
  173. p.unscan()
  174. break
  175. }
  176. }
  177. return strings.Join(sourceSeg, ""), alias, nil
  178. }
  179. func (p *Parser) parseFieldNameSections() ([]string, error) {
  180. var fieldNameSects []string
  181. for {
  182. if tok, lit := p.scanIgnoreWhitespace(); tok == IDENT || tok == ASTERISK {
  183. fieldNameSects = append(fieldNameSects, lit)
  184. if tok1, _ := p.scanIgnoreWhitespace(); !tok1.allowedSFNToken() {
  185. p.unscan()
  186. break
  187. }
  188. } else {
  189. p.unscan()
  190. break
  191. }
  192. }
  193. if len(fieldNameSects) == 0 {
  194. return nil, fmt.Errorf("Cannot find any field name.\n")
  195. } else if len(fieldNameSects) > 2 {
  196. return nil, fmt.Errorf("Too many field names. Please use -> to reference keys in struct.\n")
  197. }
  198. return fieldNameSects, nil
  199. }
  200. func (p *Parser) parseJoins() (Joins, error) {
  201. var joins Joins
  202. for {
  203. if tok, lit := p.scanIgnoreWhitespace(); tok == INNER || tok == LEFT || tok == RIGHT || tok == FULL || tok == CROSS {
  204. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == JOIN {
  205. var jt = INNER_JOIN
  206. switch tok {
  207. case INNER:
  208. jt = INNER_JOIN
  209. case LEFT:
  210. jt = LEFT_JOIN
  211. case RIGHT:
  212. jt = RIGHT_JOIN
  213. case FULL:
  214. jt = FULL_JOIN
  215. case CROSS:
  216. jt = CROSS_JOIN
  217. }
  218. if j, err := p.ParseJoin(jt); err != nil {
  219. return nil, err
  220. } else {
  221. joins = append(joins, *j)
  222. }
  223. } else {
  224. return nil, fmt.Errorf("found %q, expected JOIN key word.", lit)
  225. }
  226. } else {
  227. p.unscan()
  228. if len(joins) > 0 {
  229. return joins, nil
  230. }
  231. return nil, nil
  232. }
  233. }
  234. return joins, nil
  235. }
  236. func (p *Parser) ParseJoin(joinType JoinType) (*Join, error) {
  237. var j = &Join{JoinType: joinType}
  238. if src, alias, err := p.parseSourceLiteral(); err != nil {
  239. return nil, err
  240. } else {
  241. j.Name = src
  242. j.Alias = alias
  243. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == ON {
  244. if CROSS_JOIN == joinType {
  245. return nil, fmt.Errorf("On expression is not required for cross join type.\n")
  246. }
  247. if exp, err := p.ParseExpr(); err != nil {
  248. return nil, err
  249. } else {
  250. j.Expr = exp
  251. }
  252. } else {
  253. p.unscan()
  254. }
  255. }
  256. return j, nil
  257. }
  258. func (p *Parser) parseDimensions() (Dimensions, error) {
  259. var ds Dimensions
  260. if t, _ := p.scanIgnoreWhitespace(); t == GROUP {
  261. if t1, l1 := p.scanIgnoreWhitespace(); t1 == BY {
  262. for {
  263. if exp, err := p.ParseExpr(); err != nil {
  264. return nil, err
  265. } else {
  266. d := Dimension{Expr: exp}
  267. ds = append(ds, d)
  268. }
  269. if tok, _ := p.scanIgnoreWhitespace(); tok == COMMA {
  270. continue
  271. } else {
  272. p.unscan()
  273. break
  274. }
  275. }
  276. } else {
  277. return nil, fmt.Errorf("found %q, expected BY statement.", l1)
  278. }
  279. } else {
  280. p.unscan()
  281. }
  282. return ds, nil
  283. }
  284. func (p *Parser) parseHaving() (Expr, error) {
  285. if tok, _ := p.scanIgnoreWhitespace(); tok != HAVING {
  286. p.unscan()
  287. return nil, nil
  288. }
  289. expr, err := p.ParseExpr()
  290. if err != nil {
  291. return nil, err
  292. }
  293. return expr, nil
  294. }
  295. func (p *Parser) parseSorts() (SortFields, error) {
  296. var ss SortFields
  297. if t, _ := p.scanIgnoreWhitespace(); t == ORDER {
  298. if t1, l1 := p.scanIgnoreWhitespace(); t1 == BY {
  299. for {
  300. if t1, l1 = p.scanIgnoreWhitespace(); t1 == IDENT {
  301. s := SortField{Ascending: true}
  302. p.unscan()
  303. if name, err := p.parseFieldNameSections(); err == nil {
  304. s.Name = strings.Join(name, tokens[COLSEP])
  305. } else {
  306. return nil, err
  307. }
  308. if t2, _ := p.scanIgnoreWhitespace(); t2 == DESC {
  309. s.Ascending = false
  310. ss = append(ss, s)
  311. } else if t2 == ASC {
  312. ss = append(ss, s)
  313. } else {
  314. ss = append(ss, s)
  315. p.unscan()
  316. continue
  317. }
  318. } else if t1 == COMMA {
  319. continue
  320. } else {
  321. p.unscan()
  322. break
  323. }
  324. }
  325. } else {
  326. return nil, fmt.Errorf("found %q, expected BY keyword.", l1)
  327. }
  328. } else {
  329. p.unscan()
  330. }
  331. return ss, nil
  332. }
  333. func (p *Parser) parseFields() (Fields, error) {
  334. var fields Fields
  335. tok, _ := p.scanIgnoreWhitespace()
  336. if tok == ASTERISK {
  337. fields = append(fields, Field{AName: "", Expr: &Wildcard{Token: tok}})
  338. return fields, nil
  339. }
  340. p.unscan()
  341. for {
  342. field, err := p.parseField()
  343. if err != nil {
  344. return nil, err
  345. } else {
  346. fields = append(fields, *field)
  347. }
  348. tok, _ = p.scanIgnoreWhitespace()
  349. if tok != COMMA {
  350. p.unscan()
  351. break
  352. }
  353. }
  354. return fields, nil
  355. }
  356. func (p *Parser) parseField() (*Field, error) {
  357. field := &Field{}
  358. if exp, err := p.ParseExpr(); err != nil {
  359. return nil, err
  360. } else {
  361. if e, ok := exp.(*FieldRef); ok {
  362. field.Name = e.Name
  363. } else if e, ok := exp.(*Call); ok {
  364. field.Name = e.Name
  365. }
  366. field.Expr = exp
  367. }
  368. if alias, err := p.parseAlias(); err != nil {
  369. return nil, err
  370. } else {
  371. if alias != "" {
  372. field.AName = alias
  373. }
  374. }
  375. return field, nil
  376. }
  377. func (p *Parser) parseAlias() (string, error) {
  378. tok, lit := p.scanIgnoreWhitespace()
  379. if tok == AS {
  380. if tok, lit = p.scanIgnoreWhitespace(); tok != IDENT {
  381. return "", fmt.Errorf("found %q, expected as alias.", lit)
  382. } else {
  383. return lit, nil
  384. }
  385. }
  386. p.unscan()
  387. return "", nil
  388. }
  389. func (p *Parser) ParseExpr() (Expr, error) {
  390. var err error
  391. root := &BinaryExpr{}
  392. root.RHS, err = p.parseUnaryExpr()
  393. if err != nil {
  394. return nil, err
  395. }
  396. for {
  397. op, _ := p.scanIgnoreWhitespace()
  398. if !op.isOperator() {
  399. p.unscan()
  400. return root.RHS, nil
  401. } else if op == ASTERISK { //Change the asterisk to Mul token.
  402. op = MUL
  403. } else if op == LBRACKET { //LBRACKET is a special token, need to unscan
  404. op = SUBSET
  405. p.unscan()
  406. }
  407. var rhs Expr
  408. if rhs, err = p.parseUnaryExpr(); err != nil {
  409. return nil, err
  410. }
  411. for node := root; ; {
  412. r, ok := node.RHS.(*BinaryExpr)
  413. if !ok || r.OP.Precedence() >= op.Precedence() {
  414. node.RHS = &BinaryExpr{LHS: node.RHS, RHS: rhs, OP: op}
  415. break
  416. }
  417. node = r
  418. }
  419. }
  420. return nil, nil
  421. }
  422. func (p *Parser) parseUnaryExpr() (Expr, error) {
  423. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == LPAREN {
  424. expr, err := p.ParseExpr()
  425. if err != nil {
  426. return nil, err
  427. }
  428. // Expect an RPAREN at the end.
  429. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 != RPAREN {
  430. return nil, fmt.Errorf("found %q, expected right paren.", lit2)
  431. }
  432. return &ParenExpr{Expr: expr}, nil
  433. } else if tok1 == LBRACKET {
  434. return p.parseBracketExpr()
  435. }
  436. p.unscan()
  437. tok, lit := p.scanIgnoreWhitespace()
  438. if tok == IDENT {
  439. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == LPAREN {
  440. return p.parseCall(lit)
  441. }
  442. p.unscan() //Back the Lparen token
  443. p.unscan() //Back the ident token
  444. if n, err := p.parseFieldNameSections(); err != nil {
  445. return nil, err
  446. } else {
  447. if p.inmeta {
  448. if len(n) == 2 {
  449. return &MetaRef{StreamName: StreamName(n[0]), Name: n[1]}, nil
  450. }
  451. return &MetaRef{StreamName: "", Name: n[0]}, nil
  452. } else {
  453. if len(n) == 2 {
  454. return &FieldRef{StreamName: StreamName(n[0]), Name: n[1]}, nil
  455. }
  456. return &FieldRef{StreamName: "", Name: n[0]}, nil
  457. }
  458. }
  459. } else if tok == STRING {
  460. return &StringLiteral{Val: lit}, nil
  461. } else if tok == INTEGER {
  462. val, _ := strconv.Atoi(lit)
  463. return &IntegerLiteral{Val: val}, nil
  464. } else if tok == NUMBER {
  465. if v, err := strconv.ParseFloat(lit, 64); err != nil {
  466. return nil, fmt.Errorf("found %q, invalid number value.", lit)
  467. } else {
  468. return &NumberLiteral{Val: v}, nil
  469. }
  470. } else if tok == TRUE || tok == FALSE {
  471. if v, err := strconv.ParseBool(lit); err != nil {
  472. return nil, fmt.Errorf("found %q, invalid boolean value.", lit)
  473. } else {
  474. return &BooleanLiteral{Val: v}, nil
  475. }
  476. } else if tok.isTimeLiteral() {
  477. return &TimeLiteral{Val: tok}, nil
  478. }
  479. return nil, fmt.Errorf("found %q, expected expression.", lit)
  480. }
  481. func (p *Parser) parseBracketExpr() (Expr, error) {
  482. tok2, lit2 := p.scanIgnoreWhitespace()
  483. if tok2 == RBRACKET {
  484. //field[]
  485. return &ColonExpr{Start: 0, End: -1}, nil
  486. } else if tok2 == INTEGER {
  487. start, err := strconv.Atoi(lit2)
  488. if err != nil {
  489. return nil, fmt.Errorf("The start index %s is not an int value in bracket expression.", lit2)
  490. }
  491. if tok3, _ := p.scanIgnoreWhitespace(); tok3 == RBRACKET {
  492. //Such as field[2]
  493. return &IndexExpr{Index: start}, nil
  494. } else if tok3 == COLON {
  495. //Such as field[2:] or field[2:4]
  496. return p.parseColonExpr(start)
  497. }
  498. } else if tok2 == COLON {
  499. //Such as field[:3] or [:]
  500. return p.parseColonExpr(0)
  501. }
  502. return nil, fmt.Errorf("Unexpected token %q. when parsing bracket expressions.", lit2)
  503. }
  504. func (p *Parser) parseColonExpr(start int) (Expr, error) {
  505. tok, lit := p.scanIgnoreWhitespace()
  506. if tok == INTEGER {
  507. end, err := strconv.Atoi(lit)
  508. if err != nil {
  509. return nil, fmt.Errorf("The end index %s is not an int value in bracket expression.", lit)
  510. }
  511. if tok1, lit1 := p.scanIgnoreWhitespace(); tok1 == RBRACKET {
  512. return &ColonExpr{Start: start, End: end}, nil
  513. } else {
  514. return nil, fmt.Errorf("Found %q, expected right bracket.", lit1)
  515. }
  516. } else if tok == RBRACKET {
  517. return &ColonExpr{Start: start, End: -1}, nil
  518. }
  519. return nil, fmt.Errorf("Found %q, expected right bracket.", lit)
  520. }
  521. func (p *Parser) parseAs(f *Field) (*Field, error) {
  522. tok, lit := p.scanIgnoreWhitespace()
  523. if tok != IDENT {
  524. return nil, fmt.Errorf("found %q, expected as alias.", lit)
  525. }
  526. f.AName = lit
  527. return f, nil
  528. }
  529. func (p *Parser) parseCall(name string) (Expr, error) {
  530. if strings.ToLower(name) == "meta" || strings.ToLower(name) == "mqtt" {
  531. p.inmeta = true
  532. defer func() {
  533. p.inmeta = false
  534. }()
  535. }
  536. var args []Expr
  537. for {
  538. if tok, _ := p.scanIgnoreWhitespace(); tok == RPAREN {
  539. if valErr := validateFuncs(name, nil); valErr != nil {
  540. return nil, valErr
  541. }
  542. return &Call{Name: name, Args: args}, nil
  543. } else if tok == ASTERISK {
  544. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 != RPAREN {
  545. return nil, fmt.Errorf("found %q, expected right paren.", lit2)
  546. } else {
  547. if p.inmeta {
  548. args = append(args, &MetaRef{StreamName: "", Name: "*"})
  549. } else if _, ok := funcWithAsteriskSupportMap[name]; ok {
  550. args = append(args, &Wildcard{Token: ASTERISK})
  551. } else {
  552. args = append(args, &StringLiteral{Val: "*"})
  553. }
  554. return &Call{Name: name, Args: args}, nil
  555. }
  556. } else {
  557. p.unscan()
  558. }
  559. if exp, err := p.ParseExpr(); err != nil {
  560. return nil, err
  561. } else {
  562. args = append(args, exp)
  563. }
  564. if tok, _ := p.scanIgnoreWhitespace(); tok != COMMA {
  565. p.unscan()
  566. break
  567. }
  568. }
  569. if tok, lit := p.scanIgnoreWhitespace(); tok != RPAREN {
  570. return nil, fmt.Errorf("found function call %q, expected ), but with %q.", name, lit)
  571. }
  572. if wt, error := validateWindows(name, args); wt == NOT_WINDOW {
  573. if valErr := validateFuncs(name, args); valErr != nil {
  574. return nil, valErr
  575. }
  576. // Add context for some aggregate func
  577. if name == "deduplicate" {
  578. args = append([]Expr{&Wildcard{Token: ASTERISK}}, args...)
  579. }
  580. return &Call{Name: name, Args: args}, nil
  581. } else {
  582. if error != nil {
  583. return nil, error
  584. }
  585. win, err := p.ConvertToWindows(wt, args)
  586. if err != nil {
  587. return nil, error
  588. }
  589. // parse filter clause
  590. f, err := p.parseFilter()
  591. if err != nil {
  592. return nil, err
  593. } else if f != nil {
  594. win.Filter = f
  595. }
  596. return win, nil
  597. }
  598. }
  599. func validateWindows(name string, args []Expr) (WindowType, error) {
  600. fname := strings.ToLower(name)
  601. switch fname {
  602. case "tumblingwindow":
  603. if err := validateWindow(fname, 2, args); err != nil {
  604. return TUMBLING_WINDOW, err
  605. }
  606. return TUMBLING_WINDOW, nil
  607. case "hoppingwindow":
  608. if err := validateWindow(fname, 3, args); err != nil {
  609. return HOPPING_WINDOW, err
  610. }
  611. return HOPPING_WINDOW, nil
  612. case "sessionwindow":
  613. if err := validateWindow(fname, 3, args); err != nil {
  614. return SESSION_WINDOW, err
  615. }
  616. return SESSION_WINDOW, nil
  617. case "slidingwindow":
  618. if err := validateWindow(fname, 2, args); err != nil {
  619. return SLIDING_WINDOW, err
  620. }
  621. return SLIDING_WINDOW, nil
  622. case "countwindow":
  623. if len(args) == 1 {
  624. if para1, ok := args[0].(*IntegerLiteral); ok && para1.Val > 0 {
  625. return COUNT_WINDOW, nil
  626. } else {
  627. return COUNT_WINDOW, fmt.Errorf("Invalid parameter value %s.", args[0])
  628. }
  629. } else if len(args) == 2 {
  630. if para1, ok1 := args[0].(*IntegerLiteral); ok1 {
  631. if para2, ok2 := args[1].(*IntegerLiteral); ok2 {
  632. if para1.Val < para2.Val {
  633. return COUNT_WINDOW, fmt.Errorf("The second parameter value %d should be less than the first parameter %d.", para2.Val, para1.Val)
  634. } else {
  635. return COUNT_WINDOW, nil
  636. }
  637. }
  638. }
  639. return COUNT_WINDOW, fmt.Errorf("Invalid parameter value %s, %s.", args[0], args[1])
  640. } else {
  641. return COUNT_WINDOW, fmt.Errorf("Invalid parameter count.")
  642. }
  643. }
  644. return NOT_WINDOW, nil
  645. }
  646. func validateWindow(funcName string, expectLen int, args []Expr) error {
  647. if len(args) != expectLen {
  648. return fmt.Errorf("The arguments for %s should be %d.\n", funcName, expectLen)
  649. }
  650. if _, ok := args[0].(*TimeLiteral); !ok {
  651. return fmt.Errorf("The 1st argument for %s is expecting timer literal expression. One value of [dd|hh|mi|ss|ms].\n", funcName)
  652. }
  653. for i := 1; i < len(args); i++ {
  654. if _, ok := args[i].(*IntegerLiteral); !ok {
  655. return fmt.Errorf("The %d argument for %s is expecting interger literal expression. \n", i, funcName)
  656. }
  657. }
  658. return nil
  659. }
  660. func (p *Parser) ConvertToWindows(wtype WindowType, args []Expr) (*Window, error) {
  661. win := &Window{WindowType: wtype}
  662. if wtype == COUNT_WINDOW {
  663. win.Length = &IntegerLiteral{Val: args[0].(*IntegerLiteral).Val}
  664. if len(args) == 2 {
  665. win.Interval = &IntegerLiteral{Val: args[1].(*IntegerLiteral).Val}
  666. }
  667. return win, nil
  668. }
  669. var unit = 1
  670. v := args[0].(*TimeLiteral).Val
  671. switch v {
  672. case DD:
  673. unit = 24 * 3600 * 1000
  674. case HH:
  675. unit = 3600 * 1000
  676. case MI:
  677. unit = 60 * 1000
  678. case SS:
  679. unit = 1000
  680. case MS:
  681. unit = 1
  682. default:
  683. return nil, fmt.Errorf("Invalid timeliteral %s", v)
  684. }
  685. win.Length = &IntegerLiteral{Val: args[1].(*IntegerLiteral).Val * unit}
  686. if len(args) > 2 {
  687. win.Interval = &IntegerLiteral{Val: args[2].(*IntegerLiteral).Val * unit}
  688. } else {
  689. win.Interval = &IntegerLiteral{Val: 0}
  690. }
  691. return win, nil
  692. }
  693. func (p *Parser) ParseCreateStreamStmt() (*StreamStmt, error) {
  694. stmt := &StreamStmt{}
  695. if tok, _ := p.scanIgnoreWhitespace(); tok == CREATE {
  696. if tok1, lit1 := p.scanIgnoreWhitespace(); tok1 == STREAM {
  697. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == IDENT {
  698. stmt.Name = StreamName(lit2)
  699. if fields, err := p.parseStreamFields(); err != nil {
  700. return nil, err
  701. } else {
  702. stmt.StreamFields = fields
  703. }
  704. if opts, err := p.parseStreamOptions(); err != nil {
  705. return nil, err
  706. } else {
  707. stmt.Options = opts
  708. }
  709. if tok3, lit3 := p.scanIgnoreWhitespace(); tok3 == SEMICOLON {
  710. p.unscan()
  711. return stmt, nil
  712. } else if tok3 == EOF {
  713. //Finish parsing create stream statement.
  714. return stmt, nil
  715. } else {
  716. return nil, fmt.Errorf("found %q, expected semicolon or EOF.", lit3)
  717. }
  718. } else {
  719. return nil, fmt.Errorf("found %q, expected stream name.", lit2)
  720. }
  721. } else {
  722. return nil, fmt.Errorf("found %q, expected keyword stream.", lit1)
  723. }
  724. } else {
  725. p.unscan()
  726. return nil, nil
  727. }
  728. return stmt, nil
  729. }
  730. func (p *Parser) parseShowStreamsStmt() (*ShowStreamsStatement, error) {
  731. ss := &ShowStreamsStatement{}
  732. if tok, _ := p.scanIgnoreWhitespace(); tok == SHOW {
  733. if tok1, lit1 := p.scanIgnoreWhitespace(); tok1 == STREAMS {
  734. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == EOF || tok2 == SEMICOLON {
  735. return ss, nil
  736. } else {
  737. return nil, fmt.Errorf("found %q, expected semecolon or EOF.", lit2)
  738. }
  739. } else {
  740. return nil, fmt.Errorf("found %q, expected keyword streams.", lit1)
  741. }
  742. } else {
  743. p.unscan()
  744. return nil, nil
  745. }
  746. return ss, nil
  747. }
  748. func (p *Parser) parseDescribeStreamStmt() (*DescribeStreamStatement, error) {
  749. dss := &DescribeStreamStatement{}
  750. if tok, _ := p.scanIgnoreWhitespace(); tok == DESCRIBE {
  751. if tok1, lit1 := p.scanIgnoreWhitespace(); tok1 == STREAM {
  752. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == IDENT {
  753. dss.Name = lit2
  754. return dss, nil
  755. } else {
  756. return nil, fmt.Errorf("found %q, expected stream name.", lit2)
  757. }
  758. } else {
  759. return nil, fmt.Errorf("found %q, expected keyword stream.", lit1)
  760. }
  761. } else {
  762. p.unscan()
  763. return nil, nil
  764. }
  765. }
  766. func (p *Parser) parseExplainStreamsStmt() (*ExplainStreamStatement, error) {
  767. ess := &ExplainStreamStatement{}
  768. if tok, _ := p.scanIgnoreWhitespace(); tok == EXPLAIN {
  769. if tok1, lit1 := p.scanIgnoreWhitespace(); tok1 == STREAM {
  770. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == IDENT {
  771. ess.Name = lit2
  772. return ess, nil
  773. } else {
  774. return nil, fmt.Errorf("found %q, expected stream name.", lit2)
  775. }
  776. } else {
  777. return nil, fmt.Errorf("found %q, expected keyword stream.", lit1)
  778. }
  779. } else {
  780. p.unscan()
  781. return nil, nil
  782. }
  783. }
  784. func (p *Parser) parseDropStreamsStmt() (*DropStreamStatement, error) {
  785. ess := &DropStreamStatement{}
  786. if tok, _ := p.scanIgnoreWhitespace(); tok == DROP {
  787. if tok1, lit1 := p.scanIgnoreWhitespace(); tok1 == STREAM {
  788. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == IDENT {
  789. ess.Name = lit2
  790. return ess, nil
  791. } else {
  792. return nil, fmt.Errorf("found %q, expected stream name.", lit2)
  793. }
  794. } else {
  795. return nil, fmt.Errorf("found %q, expected keyword stream.", lit1)
  796. }
  797. } else {
  798. p.unscan()
  799. return nil, nil
  800. }
  801. }
  802. func (p *Parser) parseStreamFields() (StreamFields, error) {
  803. lStack := &stack.Stack{}
  804. var fields StreamFields
  805. if tok, lit := p.scanIgnoreWhitespace(); tok == LPAREN {
  806. lStack.Push(lit)
  807. for {
  808. //For the schemaless streams
  809. //create stream demo () WITH (FORMAT="JSON", DATASOURCE="demo" TYPE="edgex")
  810. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == RPAREN {
  811. lStack.Pop()
  812. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 != WITH {
  813. return nil, fmt.Errorf("found %q, expected is with.", lit2)
  814. }
  815. return fields, nil
  816. } else {
  817. p.unscan()
  818. }
  819. if f, err := p.parseStreamField(); err != nil {
  820. return nil, err
  821. } else {
  822. fields = append(fields, *f)
  823. }
  824. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == RPAREN {
  825. lStack.Pop()
  826. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == WITH {
  827. //Check the stack for LPAREN; If the stack for LPAREN is not zero, then it's not correct.
  828. if lStack.Len() > 0 {
  829. return nil, fmt.Errorf("Parenthesis is not matched.")
  830. }
  831. break
  832. } else if tok2 == COMMA {
  833. if lStack.Len() > 0 {
  834. return nil, fmt.Errorf("Parenthesis is in create record type not matched.")
  835. }
  836. p.unscan()
  837. break
  838. } else if tok2 == RPAREN { //The nested type definition of ARRAY and Struct, such as "field ARRAY(STRUCT(f BIGINT))"
  839. if lStack.Len() > 0 {
  840. return nil, fmt.Errorf("Parenthesis is not matched.")
  841. }
  842. p.unscan()
  843. break
  844. } else {
  845. if lStack.Len() == 0 {
  846. return nil, fmt.Errorf("found %q, expected is with.", lit2)
  847. }
  848. p.unscan()
  849. }
  850. } else {
  851. p.unscan()
  852. }
  853. }
  854. } else {
  855. return nil, fmt.Errorf("found %q, expected lparen after stream name.", lit)
  856. }
  857. return fields, nil
  858. }
  859. func (p *Parser) parseStreamField() (*StreamField, error) {
  860. field := &StreamField{}
  861. if tok, lit := p.scanIgnoreWhitespace(); tok == IDENT {
  862. field.Name = lit
  863. tok1, lit1 := p.scanIgnoreWhitespace()
  864. if t := getDataType(tok1); t != UNKNOWN && t.isSimpleType() {
  865. field.FieldType = &BasicType{Type: t}
  866. } else if t == ARRAY {
  867. if f, e := p.parseStreamArrayType(); e != nil {
  868. return nil, e
  869. } else {
  870. field.FieldType = f
  871. }
  872. } else if t == STRUCT {
  873. if f, e := p.parseStreamStructType(); e != nil {
  874. return nil, e
  875. } else {
  876. field.FieldType = f
  877. }
  878. } else if t == UNKNOWN {
  879. return nil, fmt.Errorf("found %q, expect valid stream field types(BIGINT | FLOAT | STRINGS | DATETIME | BOOLEAN | ARRAY | STRUCT).", lit1)
  880. }
  881. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == COMMA {
  882. //Just consume the comma.
  883. } else if tok2 == RPAREN {
  884. p.unscan()
  885. } else {
  886. return nil, fmt.Errorf("found %q, expect comma or rparen.", lit2)
  887. }
  888. } else {
  889. return nil, fmt.Errorf("found %q, expect stream field name.", lit)
  890. }
  891. return field, nil
  892. }
  893. func (p *Parser) parseStreamArrayType() (FieldType, error) {
  894. lStack := &stack.Stack{}
  895. if tok, _ := p.scanIgnoreWhitespace(); tok == LPAREN {
  896. lStack.Push(LPAREN)
  897. tok1, lit1 := p.scanIgnoreWhitespace()
  898. if t := getDataType(tok1); t != UNKNOWN && t.isSimpleType() {
  899. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == RPAREN {
  900. lStack.Pop()
  901. if lStack.Len() > 0 {
  902. return nil, fmt.Errorf("Parenthesis is in array type not matched.")
  903. }
  904. return &ArrayType{Type: t}, nil
  905. } else {
  906. return nil, fmt.Errorf("found %q, expect rparen in array type definition.", lit2)
  907. }
  908. } else if tok1 == XSTRUCT {
  909. if f, err := p.parseStreamStructType(); err != nil {
  910. return nil, err
  911. } else {
  912. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == RPAREN {
  913. lStack.Pop()
  914. if lStack.Len() > 0 {
  915. return nil, fmt.Errorf("Parenthesis is in struct of array type %q not matched.", tok1)
  916. }
  917. return &ArrayType{Type: STRUCT, FieldType: f}, nil
  918. } else {
  919. return nil, fmt.Errorf("found %q, expect rparen in struct of array type definition.", lit2)
  920. }
  921. }
  922. } else if tok1 == COMMA {
  923. p.unscan()
  924. } else {
  925. return nil, fmt.Errorf("found %q, expect stream data types.", lit1)
  926. }
  927. } else {
  928. }
  929. return nil, nil
  930. }
  931. func (p *Parser) parseStreamStructType() (FieldType, error) {
  932. rf := &RecType{}
  933. if sfs, err := p.parseStreamFields(); err != nil {
  934. return nil, err
  935. } else {
  936. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == COMMA {
  937. rf.StreamFields = sfs
  938. p.unscan()
  939. } else if tok2 == RPAREN {
  940. rf.StreamFields = sfs
  941. p.unscan()
  942. } else {
  943. return nil, fmt.Errorf("found %q, expect comma in create stream record statement.", lit2)
  944. }
  945. }
  946. return rf, nil
  947. }
  948. func (p *Parser) parseStreamOptions() (map[string]string, error) {
  949. var opts = make(map[string]string)
  950. lStack := &stack.Stack{}
  951. if tok, lit := p.scanIgnoreWhitespace(); tok == LPAREN {
  952. lStack.Push(LPAREN)
  953. for {
  954. if tok1, lit1 := p.scanIgnoreWhitespace(); tok1 == DATASOURCE || tok1 == FORMAT || tok1 == KEY || tok1 == CONF_KEY || tok1 == STRICT_VALIDATION || tok1 == TYPE || tok1 == TIMESTAMP || tok1 == TIMESTAMP_FORMAT {
  955. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == EQ {
  956. if tok3, lit3 := p.scanIgnoreWhitespace(); tok3 == STRING {
  957. if tok1 == STRICT_VALIDATION {
  958. if val := strings.ToUpper(lit3); (val != "TRUE") && (val != "FALSE") {
  959. return nil, fmt.Errorf("found %q, expect TRUE/FALSE value in %s option.", lit3, tok1)
  960. }
  961. }
  962. opts[lit1] = lit3
  963. } else {
  964. return nil, fmt.Errorf("found %q, expect string value in option.", lit3)
  965. }
  966. } else {
  967. return nil, fmt.Errorf("found %q, expect equals(=) in options.", lit2)
  968. }
  969. } else if tok1 == COMMA {
  970. continue
  971. } else if tok1 == RPAREN {
  972. if lStack.Pop(); lStack.Len() == 0 {
  973. break
  974. } else {
  975. return nil, fmt.Errorf("Parenthesis is not matched in options definition.")
  976. }
  977. } else {
  978. return nil, fmt.Errorf("found %q, unknown option keys(DATASOURCE|FORMAT|KEY|CONF_KEY|STRICT_VALIDATION|TYPE).", lit1)
  979. }
  980. }
  981. } else {
  982. return nil, fmt.Errorf("found %q, expect stream options.", lit)
  983. }
  984. return opts, nil
  985. }
  986. // Only support filter on window now
  987. func (p *Parser) parseFilter() (Expr, error) {
  988. if tok, _ := p.scanIgnoreWhitespace(); tok != FILTER {
  989. p.unscan()
  990. return nil, nil
  991. }
  992. if tok, lit := p.scanIgnoreWhitespace(); tok != LPAREN {
  993. return nil, fmt.Errorf("Found %q after FILTER, expect parentheses.", lit)
  994. }
  995. if tok, lit := p.scanIgnoreWhitespace(); tok != WHERE {
  996. return nil, fmt.Errorf("Found %q after FILTER(, expect WHERE.", lit)
  997. }
  998. expr, err := p.ParseExpr()
  999. if err != nil {
  1000. return nil, err
  1001. }
  1002. if tok, lit := p.scanIgnoreWhitespace(); tok != RPAREN {
  1003. return nil, fmt.Errorf("Found %q after FILTER, expect right parentheses.", lit)
  1004. }
  1005. return expr, nil
  1006. }