parser.go 42 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602
  1. // Copyright 2022-2023 EMQ Technologies Co., Ltd.
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. package xsql
  15. import (
  16. "fmt"
  17. "io"
  18. "math"
  19. "reflect"
  20. "strconv"
  21. "strings"
  22. "github.com/golang-collections/collections/stack"
  23. "github.com/lf-edge/ekuiper/internal/binder/function"
  24. "github.com/lf-edge/ekuiper/pkg/ast"
  25. "github.com/lf-edge/ekuiper/pkg/message"
  26. )
  27. type Parser struct {
  28. s *Scanner
  29. i int // buffer index
  30. n int // buffer char count
  31. buf [3]struct {
  32. tok ast.Token
  33. lit string
  34. }
  35. inFunc string // currently parsing function name
  36. f int // anonymous field index number
  37. fn int // function index number
  38. clause string
  39. sourceNames []string // source names in the from/join clause
  40. }
  41. func (p *Parser) ParseCondition() (ast.Expr, error) {
  42. if tok, _ := p.scanIgnoreWhitespace(); tok != ast.WHERE {
  43. p.unscan()
  44. return nil, nil
  45. }
  46. expr, err := p.ParseExpr()
  47. if err != nil {
  48. return nil, err
  49. }
  50. return expr, nil
  51. }
  52. func (p *Parser) scan() (tok ast.Token, lit string) {
  53. if p.n > 0 {
  54. p.n--
  55. return p.curr()
  56. }
  57. tok, lit = p.s.Scan()
  58. if tok != ast.WS && tok != ast.COMMENT {
  59. p.i = (p.i + 1) % len(p.buf)
  60. buf := &p.buf[p.i]
  61. buf.tok, buf.lit = tok, lit
  62. }
  63. return
  64. }
  65. func (p *Parser) curr() (ast.Token, string) {
  66. i := (p.i - p.n + len(p.buf)) % len(p.buf)
  67. buf := &p.buf[i]
  68. return buf.tok, buf.lit
  69. }
  70. func (p *Parser) scanIgnoreWhitespace() (tok ast.Token, lit string) {
  71. tok, lit = p.scan()
  72. for {
  73. if tok == ast.WS || tok == ast.COMMENT {
  74. tok, lit = p.scan()
  75. } else {
  76. break
  77. }
  78. }
  79. return tok, lit
  80. }
  81. func (p *Parser) unscan() { p.n++ }
  82. func NewParser(r io.Reader) *Parser {
  83. return &Parser{s: NewScanner(r)}
  84. }
  85. func NewParserWithSources(r io.Reader, sources []string) *Parser {
  86. return &Parser{s: NewScanner(r), sourceNames: sources}
  87. }
  88. func (p *Parser) ParseQueries() ([]ast.SelectStatement, error) {
  89. var stmts []ast.SelectStatement
  90. if stmt, err := p.Parse(); err != nil {
  91. return nil, err
  92. } else {
  93. stmts = append(stmts, *stmt)
  94. }
  95. for {
  96. if tok, _ := p.scanIgnoreWhitespace(); tok == ast.SEMICOLON {
  97. if stmt, err := p.Parse(); err != nil {
  98. return nil, err
  99. } else {
  100. if stmt != nil {
  101. stmts = append(stmts, *stmt)
  102. }
  103. }
  104. } else if tok == ast.EOF {
  105. break
  106. }
  107. }
  108. return stmts, nil
  109. }
  110. func (p *Parser) Parse() (*ast.SelectStatement, error) {
  111. selects := &ast.SelectStatement{}
  112. if tok, lit := p.scanIgnoreWhitespace(); tok == ast.EOF {
  113. return nil, nil
  114. } else if tok != ast.SELECT {
  115. return nil, fmt.Errorf("Found %q, Expected SELECT.\n", lit)
  116. }
  117. p.clause = "select"
  118. if fields, err := p.parseFields(); err != nil {
  119. return nil, err
  120. } else {
  121. selects.Fields = fields
  122. }
  123. p.clause = "from"
  124. if src, err := p.parseSource(); err != nil {
  125. return nil, err
  126. } else {
  127. selects.Sources = src
  128. }
  129. p.clause = "join"
  130. if joins, err := p.parseJoins(); err != nil {
  131. return nil, err
  132. } else {
  133. selects.Joins = joins
  134. }
  135. // The source names may be injected from outside to parse part of the sql
  136. if p.sourceNames == nil {
  137. p.sourceNames = getStreamNames(selects)
  138. }
  139. p.clause = "where"
  140. if exp, err := p.ParseCondition(); err != nil {
  141. return nil, err
  142. } else {
  143. if exp != nil {
  144. selects.Condition = exp
  145. }
  146. }
  147. p.clause = "groupby"
  148. if dims, err := p.parseDimensions(); err != nil {
  149. return nil, err
  150. } else {
  151. selects.Dimensions = dims
  152. }
  153. p.clause = "having"
  154. if having, err := p.parseHaving(); err != nil {
  155. return nil, err
  156. } else {
  157. selects.Having = having
  158. }
  159. p.clause = "orderby"
  160. if sorts, err := p.parseSorts(); err != nil {
  161. return nil, err
  162. } else {
  163. selects.SortFields = sorts
  164. }
  165. p.clause = ""
  166. if tok, lit := p.scanIgnoreWhitespace(); tok == ast.SEMICOLON {
  167. validateFields(selects, p.sourceNames)
  168. p.unscan()
  169. return selects, nil
  170. } else if tok != ast.EOF {
  171. return nil, fmt.Errorf("found %q, expected EOF.", lit)
  172. }
  173. if err := Validate(selects); err != nil {
  174. return nil, err
  175. }
  176. validateFields(selects, p.sourceNames)
  177. return selects, nil
  178. }
  179. func (p *Parser) parseSource() (ast.Sources, error) {
  180. var sources ast.Sources
  181. if tok, lit := p.scanIgnoreWhitespace(); tok != ast.FROM {
  182. return nil, fmt.Errorf("found %q, expected FROM.", lit)
  183. }
  184. if src, alias, err := p.parseSourceLiteral(); err != nil {
  185. return nil, err
  186. } else {
  187. sources = append(sources, &ast.Table{Name: src, Alias: alias})
  188. }
  189. return sources, nil
  190. }
  191. // TODO Current func has problems when the source includes white space.
  192. func (p *Parser) parseSourceLiteral() (string, string, error) {
  193. var sourceSeg []string
  194. var alias string
  195. for {
  196. // HASH, DIV & ADD token is specially support for MQTT topic name patterns.
  197. if tok, lit := p.scanIgnoreWhitespace(); tok.AllowedSourceToken() {
  198. sourceSeg = append(sourceSeg, lit)
  199. if tok1, lit1 := p.scanIgnoreWhitespace(); tok1 == ast.AS {
  200. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.IDENT {
  201. alias = lit2
  202. } else {
  203. return "", "", fmt.Errorf("found %q, expected JOIN key word.", lit)
  204. }
  205. } else if tok1.AllowedSourceToken() {
  206. sourceSeg = append(sourceSeg, lit1)
  207. } else {
  208. p.unscan()
  209. break
  210. }
  211. } else {
  212. p.unscan()
  213. break
  214. }
  215. }
  216. return strings.Join(sourceSeg, ""), alias, nil
  217. }
  218. func (p *Parser) parseFieldNameSections(isSubField bool) ([]string, error) {
  219. var fieldNameSects []string
  220. for {
  221. if tok, lit := p.scanIgnoreWhitespace(); tok == ast.IDENT || tok == ast.ASTERISK {
  222. fieldNameSects = append(fieldNameSects, lit)
  223. if len(fieldNameSects) > 1 {
  224. break
  225. }
  226. if tok1, _ := p.scanIgnoreWhitespace(); isSubField || !tok1.AllowedSFNToken() {
  227. p.unscan()
  228. break
  229. }
  230. } else {
  231. p.unscan()
  232. break
  233. }
  234. }
  235. if len(fieldNameSects) == 0 {
  236. return nil, fmt.Errorf("Cannot find any field name.\n")
  237. }
  238. return fieldNameSects, nil
  239. }
  240. func (p *Parser) parseJoins() (ast.Joins, error) {
  241. var joins ast.Joins
  242. for {
  243. if tok, lit := p.scanIgnoreWhitespace(); tok == ast.INNER || tok == ast.LEFT || tok == ast.RIGHT || tok == ast.FULL || tok == ast.CROSS {
  244. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == ast.JOIN {
  245. jt := ast.INNER_JOIN
  246. switch tok {
  247. case ast.INNER:
  248. jt = ast.INNER_JOIN
  249. case ast.LEFT:
  250. jt = ast.LEFT_JOIN
  251. case ast.RIGHT:
  252. jt = ast.RIGHT_JOIN
  253. case ast.FULL:
  254. jt = ast.FULL_JOIN
  255. case ast.CROSS:
  256. jt = ast.CROSS_JOIN
  257. }
  258. if j, err := p.ParseJoin(jt); err != nil {
  259. return nil, err
  260. } else {
  261. joins = append(joins, *j)
  262. }
  263. } else {
  264. return nil, fmt.Errorf("found %q, expected JOIN key word.", lit)
  265. }
  266. } else {
  267. p.unscan()
  268. if len(joins) > 0 {
  269. return joins, nil
  270. }
  271. return nil, nil
  272. }
  273. }
  274. }
  275. func (p *Parser) ParseJoin(joinType ast.JoinType) (*ast.Join, error) {
  276. j := &ast.Join{JoinType: joinType}
  277. if src, alias, err := p.parseSourceLiteral(); err != nil {
  278. return nil, err
  279. } else {
  280. j.Name = src
  281. j.Alias = alias
  282. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == ast.ON {
  283. if ast.CROSS_JOIN == joinType {
  284. return nil, fmt.Errorf("On expression is not required for cross join type.\n")
  285. }
  286. if exp, err := p.ParseExpr(); err != nil {
  287. return nil, err
  288. } else {
  289. j.Expr = exp
  290. }
  291. } else {
  292. p.unscan()
  293. }
  294. }
  295. return j, nil
  296. }
  297. func (p *Parser) parseDimensions() (ast.Dimensions, error) {
  298. var ds ast.Dimensions
  299. if t, _ := p.scanIgnoreWhitespace(); t == ast.GROUP {
  300. if t1, l1 := p.scanIgnoreWhitespace(); t1 == ast.BY {
  301. for {
  302. if exp, err := p.ParseExpr(); err != nil {
  303. return nil, err
  304. } else {
  305. d := ast.Dimension{Expr: exp}
  306. ds = append(ds, d)
  307. }
  308. if tok, _ := p.scanIgnoreWhitespace(); tok == ast.COMMA {
  309. continue
  310. }
  311. p.unscan()
  312. break
  313. }
  314. } else {
  315. return nil, fmt.Errorf("found %q, expected BY statement.", l1)
  316. }
  317. } else {
  318. p.unscan()
  319. }
  320. return ds, nil
  321. }
  322. func (p *Parser) parseHaving() (ast.Expr, error) {
  323. if tok, _ := p.scanIgnoreWhitespace(); tok != ast.HAVING {
  324. p.unscan()
  325. return nil, nil
  326. }
  327. expr, err := p.ParseExpr()
  328. if err != nil {
  329. return nil, err
  330. }
  331. return expr, nil
  332. }
  333. func (p *Parser) parseSorts() (ast.SortFields, error) {
  334. var ss ast.SortFields
  335. if t, _ := p.scanIgnoreWhitespace(); t == ast.ORDER {
  336. if t1, l1 := p.scanIgnoreWhitespace(); t1 == ast.BY {
  337. for {
  338. if t1, _ = p.scanIgnoreWhitespace(); t1 == ast.IDENT {
  339. s := ast.SortField{Ascending: true}
  340. p.unscan()
  341. if name, err := p.parseFieldNameSections(false); err == nil {
  342. if len(name) == 2 {
  343. s.StreamName = ast.StreamName(name[0])
  344. s.Name = name[1]
  345. p.unscan()
  346. p.unscan()
  347. } else {
  348. s.Name = name[0]
  349. }
  350. s.Uname = strings.Join(name, ast.COLUMN_SEPARATOR)
  351. } else {
  352. return nil, err
  353. }
  354. p.unscan()
  355. if exp, err := p.ParseExpr(); err != nil {
  356. return nil, err
  357. } else {
  358. s.FieldExpr = exp
  359. }
  360. if t2, _ := p.scanIgnoreWhitespace(); t2 == ast.DESC {
  361. s.Ascending = false
  362. ss = append(ss, s)
  363. } else if t2 == ast.ASC {
  364. ss = append(ss, s)
  365. } else {
  366. ss = append(ss, s)
  367. p.unscan()
  368. continue
  369. }
  370. } else if t1 == ast.COMMA {
  371. continue
  372. } else {
  373. p.unscan()
  374. break
  375. }
  376. }
  377. } else {
  378. return nil, fmt.Errorf("found %q, expected BY keyword.", l1)
  379. }
  380. } else {
  381. p.unscan()
  382. }
  383. return ss, nil
  384. }
  385. func (p *Parser) parseFields() (ast.Fields, error) {
  386. var fields ast.Fields
  387. for {
  388. field, err := p.parseField()
  389. if err != nil {
  390. return nil, err
  391. } else {
  392. fields = append(fields, *field)
  393. }
  394. tok, _ := p.scanIgnoreWhitespace()
  395. if tok != ast.COMMA {
  396. p.unscan()
  397. break
  398. }
  399. }
  400. return fields, nil
  401. }
  402. func (p *Parser) parseField() (*ast.Field, error) {
  403. field := &ast.Field{}
  404. if exp, err := p.ParseExpr(); err != nil {
  405. return nil, err
  406. } else {
  407. field.Name = nameExpr(exp)
  408. field.Expr = exp
  409. }
  410. if alias, err := p.parseAlias(); err != nil {
  411. return nil, err
  412. } else {
  413. if alias != "" {
  414. if field.Name == "*" {
  415. return nil, fmt.Errorf("alias is not supported for *")
  416. }
  417. field.AName = alias
  418. }
  419. }
  420. if field.Name == "" && field.AName == "" {
  421. field.Name = DEFAULT_FIELD_NAME_PREFIX + strconv.Itoa(p.f)
  422. p.f += 1
  423. }
  424. return field, nil
  425. }
  426. func nameExpr(exp ast.Expr) string {
  427. switch e := exp.(type) {
  428. case *ast.FieldRef:
  429. return e.Name
  430. case *ast.Call:
  431. return e.Name
  432. case *ast.Wildcard:
  433. return ast.Tokens[ast.ASTERISK]
  434. default:
  435. return ""
  436. }
  437. }
  438. func (p *Parser) parseAlias() (string, error) {
  439. tok, _ := p.scanIgnoreWhitespace()
  440. if tok == ast.AS {
  441. if tok, lit := p.scanIgnoreWhitespace(); tok != ast.IDENT {
  442. return "", fmt.Errorf("found %q, expected as alias.", lit)
  443. } else {
  444. return lit, nil
  445. }
  446. }
  447. p.unscan()
  448. return "", nil
  449. }
  450. func (p *Parser) ParseExpr() (ast.Expr, error) {
  451. var err error
  452. root := &ast.BinaryExpr{}
  453. root.RHS, err = p.parseUnaryExpr(false)
  454. if err != nil {
  455. return nil, err
  456. }
  457. for {
  458. op, _ := p.scanIgnoreWhitespace()
  459. if !op.IsOperator() {
  460. p.unscan()
  461. return root.RHS, nil
  462. } else if op == ast.ASTERISK { // Change the asterisk to Mul token.
  463. op = ast.MUL
  464. } else if op == ast.LBRACKET { // LBRACKET is a special token, need to unscan
  465. op = ast.SUBSET
  466. p.unscan()
  467. } else if op == ast.IN { // IN is a special token, need to unscan
  468. p.unscan()
  469. } else if op == ast.NOT {
  470. afterNot, tk1 := p.scanIgnoreWhitespace()
  471. switch afterNot {
  472. case ast.IN: // IN is a special token, need to unscan
  473. op = ast.NOTIN
  474. p.unscan()
  475. break
  476. case ast.BETWEEN:
  477. op = ast.NOTBETWEEN
  478. node := root
  479. var lhs ast.Expr
  480. for {
  481. r, ok := node.RHS.(*ast.BinaryExpr)
  482. if !ok || r.OP.Precedence() >= op.Precedence() {
  483. lhs = node.RHS
  484. break
  485. }
  486. node = r
  487. }
  488. expr, err := p.parseBetween(lhs, ast.NOTBETWEEN)
  489. if err != nil {
  490. return nil, err
  491. }
  492. node.RHS = expr
  493. continue
  494. case ast.LIKE:
  495. op = ast.NOTLIKE
  496. default:
  497. return nil, fmt.Errorf("found %q, expected expression", tk1)
  498. }
  499. } else if op == ast.BETWEEN {
  500. node := root
  501. var lhs ast.Expr
  502. for {
  503. r, ok := node.RHS.(*ast.BinaryExpr)
  504. if !ok || r.OP.Precedence() >= op.Precedence() {
  505. lhs = node.RHS
  506. break
  507. }
  508. node = r
  509. }
  510. expr, err := p.parseBetween(lhs, op)
  511. if err != nil {
  512. return nil, err
  513. }
  514. node.RHS = expr
  515. continue
  516. }
  517. var rhs ast.Expr
  518. if rhs, err = p.parseUnaryExpr(op == ast.ARROW || op == ast.DOT); err != nil {
  519. return nil, err
  520. } else if op == ast.DOT {
  521. op = ast.ARROW
  522. }
  523. if op == ast.LIKE || op == ast.NOTLIKE {
  524. lp := &ast.LikePattern{
  525. Expr: rhs,
  526. }
  527. if l, ok := lp.Expr.(*ast.StringLiteral); ok {
  528. lp.Pattern, err = lp.Compile(l.Val)
  529. if err != nil {
  530. return nil, fmt.Errorf("invalid LIKE pattern: %s", err)
  531. }
  532. }
  533. rhs = lp
  534. }
  535. for node := root; ; {
  536. r, ok := node.RHS.(*ast.BinaryExpr)
  537. if !ok || r.OP.Precedence() >= op.Precedence() {
  538. node.RHS = &ast.BinaryExpr{LHS: node.RHS, RHS: rhs, OP: op}
  539. break
  540. }
  541. node = r
  542. }
  543. }
  544. }
  545. func (p *Parser) parseBetween(lhs ast.Expr, op ast.Token) (ast.Expr, error) {
  546. alhs, err := p.parseUnaryExpr(false)
  547. if err != nil {
  548. return nil, err
  549. }
  550. opp, _ := p.scanIgnoreWhitespace()
  551. if opp != ast.AND {
  552. return nil, fmt.Errorf("expect AND expression after between but found %s", opp)
  553. }
  554. arhs, err := p.parseUnaryExpr(false)
  555. if err != nil {
  556. return nil, err
  557. }
  558. return &ast.BinaryExpr{
  559. LHS: lhs,
  560. OP: op,
  561. RHS: &ast.BetweenExpr{
  562. Lower: alhs,
  563. Higher: arhs,
  564. },
  565. }, nil
  566. }
  567. func (p *Parser) parseUnaryExpr(isSubField bool) (ast.Expr, error) {
  568. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == ast.LPAREN {
  569. expr, err := p.ParseExpr()
  570. if err != nil {
  571. return nil, err
  572. }
  573. // Expect an RPAREN at the end.
  574. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 != ast.RPAREN {
  575. return nil, fmt.Errorf("found %q, expected right paren.", lit2)
  576. }
  577. return &ast.ParenExpr{Expr: expr}, nil
  578. } else if tok1 == ast.LBRACKET {
  579. return p.parseBracketExpr()
  580. } else if tok1 == ast.IN {
  581. return p.parseValueSetExpr()
  582. }
  583. p.unscan()
  584. tok, lit := p.scanIgnoreWhiteSpaceWithNegativeNum()
  585. if tok == ast.CASE {
  586. return p.parseCaseExpr()
  587. } else if tok == ast.IDENT {
  588. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == ast.LPAREN {
  589. return p.parseCall(lit)
  590. }
  591. p.unscan() // Back the Lparen token
  592. p.unscan() // Back the ident token
  593. if n, err := p.parseFieldNameSections(isSubField); err != nil {
  594. return nil, err
  595. } else {
  596. if p.inmeta() {
  597. if len(n) == 2 {
  598. if len(p.sourceNames) > 0 && !contains(p.sourceNames, n[0]) {
  599. return &ast.BinaryExpr{
  600. LHS: &ast.MetaRef{StreamName: ast.DefaultStream, Name: n[0]},
  601. OP: ast.ARROW,
  602. RHS: &ast.JsonFieldRef{Name: n[1]},
  603. }, nil
  604. } else {
  605. return &ast.MetaRef{StreamName: ast.StreamName(n[0]), Name: n[1]}, nil
  606. }
  607. }
  608. if isSubField {
  609. return &ast.JsonFieldRef{Name: n[0]}, nil
  610. }
  611. return &ast.MetaRef{StreamName: ast.DefaultStream, Name: n[0]}, nil
  612. } else {
  613. if len(n) == 2 {
  614. if len(p.sourceNames) > 0 && !contains(p.sourceNames, n[0]) {
  615. return &ast.BinaryExpr{
  616. LHS: &ast.FieldRef{StreamName: ast.DefaultStream, Name: n[0]},
  617. OP: ast.ARROW,
  618. RHS: &ast.JsonFieldRef{Name: n[1]},
  619. }, nil
  620. } else {
  621. return &ast.FieldRef{StreamName: ast.StreamName(n[0]), Name: n[1]}, nil
  622. }
  623. }
  624. if isSubField {
  625. return &ast.JsonFieldRef{Name: n[0]}, nil
  626. }
  627. return &ast.FieldRef{StreamName: ast.DefaultStream, Name: n[0]}, nil
  628. }
  629. }
  630. } else if tok == ast.STRING || tok == ast.SINGLEQUOTE {
  631. return &ast.StringLiteral{Val: lit}, nil
  632. } else if tok == ast.INTEGER {
  633. val, _ := strconv.Atoi(lit)
  634. return &ast.IntegerLiteral{Val: val}, nil
  635. } else if tok == ast.NUMBER {
  636. if v, err := strconv.ParseFloat(lit, 64); err != nil {
  637. return nil, fmt.Errorf("found %q, invalid number value.", lit)
  638. } else {
  639. return &ast.NumberLiteral{Val: v}, nil
  640. }
  641. } else if tok == ast.TRUE || tok == ast.FALSE {
  642. if v, err := strconv.ParseBool(lit); err != nil {
  643. return nil, fmt.Errorf("found %q, invalid boolean value.", lit)
  644. } else {
  645. return &ast.BooleanLiteral{Val: v}, nil
  646. }
  647. } else if tok.IsTimeLiteral() {
  648. return &ast.TimeLiteral{Val: tok}, nil
  649. } else if tok == ast.ASTERISK {
  650. return p.parseAsterisk()
  651. }
  652. return nil, fmt.Errorf("found %q, expected expression.", lit)
  653. }
  654. func (p *Parser) parseValueSetExpr() (ast.Expr, error) {
  655. valsetExpr := &ast.ValueSetExpr{
  656. LiteralExprs: nil,
  657. ArrayExpr: nil,
  658. }
  659. // IN ("A", "B") or IN expression
  660. tk, _ := p.scanIgnoreWhitespace()
  661. if tk == ast.LPAREN {
  662. for {
  663. element, err := p.ParseExpr()
  664. if err != nil {
  665. return nil, fmt.Errorf("expect elements for IN expression, but %v", err)
  666. }
  667. valsetExpr.LiteralExprs = append(valsetExpr.LiteralExprs, element)
  668. if tok2, _ := p.scanIgnoreWhitespace(); tok2 != ast.COMMA {
  669. p.unscan()
  670. break
  671. }
  672. }
  673. if tok, lit := p.scanIgnoreWhitespace(); tok != ast.RPAREN {
  674. return nil, fmt.Errorf("expect ) for IN expression, but got %q", lit)
  675. }
  676. return valsetExpr, nil
  677. } else {
  678. // back to IN
  679. p.unscan()
  680. }
  681. if exp, err := p.parseUnaryExpr(false); err != nil {
  682. return nil, fmt.Errorf("expect expression after IN, but got error %v", err)
  683. } else {
  684. return exp, nil
  685. }
  686. }
  687. func (p *Parser) parseBracketExpr() (ast.Expr, error) {
  688. tok2, lit2 := p.scanIgnoreWhiteSpaceWithNegativeNum()
  689. if tok2 == ast.RBRACKET {
  690. // field[]
  691. return &ast.ColonExpr{Start: &ast.IntegerLiteral{Val: 0}, End: &ast.IntegerLiteral{Val: math.MinInt32}}, nil
  692. } else if tok2 == ast.INTEGER {
  693. start, err := strconv.Atoi(lit2)
  694. if err != nil {
  695. return nil, fmt.Errorf("The start index %s is not an int value in bracket expression.", lit2)
  696. }
  697. if tok3, _ := p.scanIgnoreWhitespace(); tok3 == ast.RBRACKET {
  698. // Such as field[2]
  699. return &ast.IndexExpr{Index: &ast.IntegerLiteral{Val: start}}, nil
  700. } else if tok3 == ast.COLON {
  701. // Such as field[2:] or field[2:4]
  702. return p.parseColonExpr(&ast.IntegerLiteral{Val: start})
  703. }
  704. } else if tok2 == ast.COLON {
  705. // Such as field[:3] or [:]
  706. return p.parseColonExpr(&ast.IntegerLiteral{Val: 0})
  707. } else {
  708. p.unscan()
  709. start, err := p.ParseExpr()
  710. if err != nil {
  711. return nil, fmt.Errorf("The start index %s is invalid in bracket expression.", lit2)
  712. }
  713. if tok3, _ := p.scanIgnoreWhitespace(); tok3 == ast.RBRACKET {
  714. // Such as field[2]
  715. return &ast.IndexExpr{Index: start}, nil
  716. } else if tok3 == ast.COLON {
  717. // Such as field[2:] or field[2:4]
  718. return p.parseColonExpr(start)
  719. }
  720. }
  721. return nil, fmt.Errorf("Unexpected token %q. when parsing bracket expressions.", lit2)
  722. }
  723. func (p *Parser) parseColonExpr(start ast.Expr) (ast.Expr, error) {
  724. tok, lit := p.scanIgnoreWhiteSpaceWithNegativeNum()
  725. if tok == ast.INTEGER {
  726. end, err := strconv.Atoi(lit)
  727. if err != nil {
  728. return nil, fmt.Errorf("The end index %s is not an int value in bracket expression.", lit)
  729. }
  730. if tok1, lit1 := p.scanIgnoreWhitespace(); tok1 == ast.RBRACKET {
  731. return &ast.ColonExpr{Start: start, End: &ast.IntegerLiteral{Val: end}}, nil
  732. } else {
  733. return nil, fmt.Errorf("Found %q, expected right bracket.", lit1)
  734. }
  735. } else if tok == ast.RBRACKET {
  736. return &ast.ColonExpr{Start: start, End: &ast.IntegerLiteral{Val: math.MinInt32}}, nil
  737. }
  738. p.unscan()
  739. end, err := p.ParseExpr()
  740. if err != nil {
  741. return nil, fmt.Errorf("The end index %s is invalid in bracket expression.", lit)
  742. }
  743. if tok1, lit1 := p.scanIgnoreWhitespace(); tok1 == ast.RBRACKET {
  744. return &ast.ColonExpr{Start: start, End: end}, nil
  745. } else {
  746. return nil, fmt.Errorf("Found %q, expected right bracket.", lit1)
  747. }
  748. }
  749. func (p *Parser) scanIgnoreWhiteSpaceWithNegativeNum() (ast.Token, string) {
  750. tok, lit := p.scanIgnoreWhitespace()
  751. if tok == ast.SUB {
  752. _, _ = p.s.ScanWhiteSpace()
  753. r := p.s.read()
  754. if isDigit(r) {
  755. p.s.unread()
  756. tok, lit = p.s.ScanNumber(false, true)
  757. }
  758. }
  759. return tok, lit
  760. }
  761. func (p *Parser) parseAs(f *ast.Field) (*ast.Field, error) {
  762. tok, lit := p.scanIgnoreWhitespace()
  763. if tok != ast.IDENT {
  764. return nil, fmt.Errorf("found %q, expected as alias.", lit)
  765. }
  766. f.AName = lit
  767. return f, nil
  768. }
  769. var WindowFuncs = map[string]struct{}{
  770. "tumblingwindow": {},
  771. "hoppingwindow": {},
  772. "sessionwindow": {},
  773. "slidingwindow": {},
  774. "countwindow": {},
  775. }
  776. func convFuncName(n string) (string, bool) {
  777. lname := strings.ToLower(n)
  778. if _, ok := WindowFuncs[lname]; ok {
  779. return lname, ok
  780. } else {
  781. return function.ConvName(n)
  782. }
  783. }
  784. func (p *Parser) parseCall(n string) (ast.Expr, error) {
  785. // Check if n function exists and convert it to lowercase for built-in func
  786. name, ok := convFuncName(n)
  787. if !ok {
  788. return nil, fmt.Errorf("function %s not found", n)
  789. }
  790. p.inFunc = name
  791. defer func() { p.inFunc = "" }()
  792. ft := function.GetFuncType(name)
  793. if ft == ast.FuncTypeCols && p.clause != "select" {
  794. return nil, fmt.Errorf("function %s can only be used inside the select clause", n)
  795. }
  796. var args []ast.Expr
  797. for {
  798. if tok, _ := p.scanIgnoreWhitespace(); tok == ast.RPAREN {
  799. break
  800. }
  801. p.unscan()
  802. if exp, err := p.ParseExpr(); err != nil {
  803. return nil, err
  804. } else {
  805. if ft == ast.FuncTypeCols {
  806. field := &ast.ColFuncField{Expr: exp, Name: nameExpr(exp)}
  807. args = append(args, field)
  808. } else {
  809. args = append(args, exp)
  810. }
  811. }
  812. if tok, lit := p.scanIgnoreWhitespace(); tok != ast.COMMA {
  813. if tok != ast.RPAREN {
  814. return nil, fmt.Errorf("found function call %q, expected ), but with %q.", name, lit)
  815. }
  816. break
  817. }
  818. }
  819. if wt, err := validateWindows(name, args); wt == ast.NOT_WINDOW {
  820. if valErr := validateFuncs(name, args); valErr != nil {
  821. return nil, valErr
  822. }
  823. // Add context for some aggregate func
  824. if name == "deduplicate" {
  825. args = append([]ast.Expr{&ast.Wildcard{Token: ast.ASTERISK}}, args...)
  826. }
  827. c := &ast.Call{Name: name, Args: args, FuncId: p.fn, FuncType: ft}
  828. p.fn += 1
  829. e := p.parseOver(c)
  830. return c, e
  831. } else {
  832. if err != nil {
  833. return nil, err
  834. }
  835. win, err := p.ConvertToWindows(wt, args)
  836. if err != nil {
  837. return nil, err
  838. }
  839. // parse filter clause
  840. f, err := p.parseFilter()
  841. if err != nil {
  842. return nil, err
  843. } else if f != nil {
  844. win.Filter = f
  845. }
  846. return win, nil
  847. }
  848. }
  849. func (p *Parser) parseCaseExpr() (*ast.CaseExpr, error) {
  850. c := &ast.CaseExpr{}
  851. tok, _ := p.scanIgnoreWhitespace()
  852. p.unscan()
  853. if tok != ast.WHEN { // no condition value for case, additional validation needed
  854. if exp, err := p.ParseExpr(); err != nil {
  855. return nil, err
  856. } else {
  857. c.Value = exp
  858. }
  859. }
  860. loop:
  861. for {
  862. tok, _ := p.scanIgnoreWhitespace()
  863. switch tok {
  864. case ast.WHEN:
  865. if exp, err := p.ParseExpr(); err != nil {
  866. return nil, err
  867. } else {
  868. if c.WhenClauses == nil {
  869. c.WhenClauses = make([]*ast.WhenClause, 0)
  870. }
  871. if c.Value == nil && !ast.IsBooleanArg(exp) {
  872. return nil, fmt.Errorf("invalid CASE expression, WHEN expression must be a bool condition")
  873. }
  874. w := &ast.WhenClause{
  875. Expr: exp,
  876. }
  877. tokThen, _ := p.scanIgnoreWhitespace()
  878. if tokThen != ast.THEN {
  879. return nil, fmt.Errorf("invalid CASE expression, THEN expected after WHEN")
  880. } else {
  881. if expThen, err := p.ParseExpr(); err != nil {
  882. return nil, err
  883. } else {
  884. w.Result = expThen
  885. c.WhenClauses = append(c.WhenClauses, w)
  886. }
  887. }
  888. }
  889. case ast.ELSE:
  890. if c.WhenClauses != nil {
  891. if exp, err := p.ParseExpr(); err != nil {
  892. return nil, err
  893. } else {
  894. c.ElseClause = exp
  895. }
  896. } else {
  897. return nil, fmt.Errorf("invalid CASE expression, WHEN expected before ELSE")
  898. }
  899. case ast.END:
  900. if c.WhenClauses != nil {
  901. break loop
  902. }
  903. return nil, fmt.Errorf("invalid CASE expression, WHEN expected before END")
  904. default:
  905. return nil, fmt.Errorf("invalid CASE expression, END expected")
  906. }
  907. }
  908. return c, nil
  909. }
  910. func validateWindows(fname string, args []ast.Expr) (ast.WindowType, error) {
  911. switch fname {
  912. case "tumblingwindow":
  913. if err := validateWindow(fname, 2, args); err != nil {
  914. return ast.TUMBLING_WINDOW, err
  915. }
  916. return ast.TUMBLING_WINDOW, nil
  917. case "hoppingwindow":
  918. if err := validateWindow(fname, 3, args); err != nil {
  919. return ast.HOPPING_WINDOW, err
  920. }
  921. return ast.HOPPING_WINDOW, nil
  922. case "sessionwindow":
  923. if err := validateWindow(fname, 3, args); err != nil {
  924. return ast.SESSION_WINDOW, err
  925. }
  926. return ast.SESSION_WINDOW, nil
  927. case "slidingwindow":
  928. if err := validateWindow(fname, 2, args); err != nil {
  929. return ast.SLIDING_WINDOW, err
  930. }
  931. return ast.SLIDING_WINDOW, nil
  932. case "countwindow":
  933. if len(args) == 1 {
  934. if para1, ok := args[0].(*ast.IntegerLiteral); ok && para1.Val > 0 {
  935. return ast.COUNT_WINDOW, nil
  936. } else {
  937. return ast.COUNT_WINDOW, fmt.Errorf("Invalid parameter value %s.", args[0])
  938. }
  939. } else if len(args) == 2 {
  940. if para1, ok1 := args[0].(*ast.IntegerLiteral); ok1 {
  941. if para2, ok2 := args[1].(*ast.IntegerLiteral); ok2 {
  942. if para1.Val < para2.Val {
  943. return ast.COUNT_WINDOW, fmt.Errorf("The second parameter value %d should be less than the first parameter %d.", para2.Val, para1.Val)
  944. } else {
  945. return ast.COUNT_WINDOW, nil
  946. }
  947. }
  948. }
  949. return ast.COUNT_WINDOW, fmt.Errorf("Invalid parameter value %s, %s.", args[0], args[1])
  950. } else {
  951. return ast.COUNT_WINDOW, fmt.Errorf("Invalid parameter count.")
  952. }
  953. }
  954. return ast.NOT_WINDOW, nil
  955. }
  956. func validateWindow(funcName string, expectLen int, args []ast.Expr) error {
  957. if len(args) != expectLen {
  958. return fmt.Errorf("The arguments for %s should be %d.\n", funcName, expectLen)
  959. }
  960. if _, ok := args[0].(*ast.TimeLiteral); !ok {
  961. return fmt.Errorf("The 1st argument for %s is expecting timer literal expression. One value of [dd|hh|mi|ss|ms].\n", funcName)
  962. }
  963. for i := 1; i < len(args); i++ {
  964. if _, ok := args[i].(*ast.IntegerLiteral); !ok {
  965. return fmt.Errorf("The %d argument for %s is expecting interger literal expression. \n", i, funcName)
  966. }
  967. }
  968. return nil
  969. }
  970. func (p *Parser) ConvertToWindows(wtype ast.WindowType, args []ast.Expr) (*ast.Window, error) {
  971. win := &ast.Window{WindowType: wtype}
  972. if wtype == ast.COUNT_WINDOW {
  973. win.Length = &ast.IntegerLiteral{Val: args[0].(*ast.IntegerLiteral).Val}
  974. if len(args) == 2 {
  975. win.Interval = &ast.IntegerLiteral{Val: args[1].(*ast.IntegerLiteral).Val}
  976. }
  977. return win, nil
  978. }
  979. if tl, ok := args[0].(*ast.TimeLiteral); ok {
  980. switch tl.Val {
  981. case ast.DD, ast.HH, ast.MI, ast.SS, ast.MS:
  982. win.TimeUnit = tl
  983. default:
  984. return nil, fmt.Errorf("Invalid timeliteral %s", tl.Val)
  985. }
  986. } else {
  987. return nil, fmt.Errorf("Invalid timeliteral %s", tl.Val)
  988. }
  989. win.Length = &ast.IntegerLiteral{Val: args[1].(*ast.IntegerLiteral).Val}
  990. if len(args) > 2 {
  991. win.Interval = &ast.IntegerLiteral{Val: args[2].(*ast.IntegerLiteral).Val}
  992. } else {
  993. win.Interval = &ast.IntegerLiteral{Val: 0}
  994. }
  995. return win, nil
  996. }
  997. func (p *Parser) ParseCreateStmt() (ast.Statement, error) {
  998. _, lit := p.scanIgnoreWhitespace()
  999. lit = strings.ToUpper(lit)
  1000. if lit == ast.CREATE {
  1001. _, lit1 := p.scanIgnoreWhitespace()
  1002. stmt := &ast.StreamStmt{}
  1003. lit1 = strings.ToUpper(lit1)
  1004. switch lit1 {
  1005. case ast.STREAM:
  1006. stmt.StreamType = ast.TypeStream
  1007. case ast.TABLE:
  1008. stmt.StreamType = ast.TypeTable
  1009. default:
  1010. return nil, fmt.Errorf("found %q, expected keyword stream or table.", lit1)
  1011. }
  1012. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.IDENT {
  1013. stmt.Name = ast.StreamName(lit2)
  1014. if fields, err := p.parseStreamFields(); err != nil {
  1015. return nil, err
  1016. } else {
  1017. stmt.StreamFields = fields
  1018. }
  1019. if opts, err := p.parseStreamOptions(); err != nil {
  1020. return nil, err
  1021. } else {
  1022. stmt.Options = opts
  1023. }
  1024. if tok3, lit3 := p.scanIgnoreWhitespace(); tok3 == ast.SEMICOLON {
  1025. p.unscan()
  1026. } else if tok3 == ast.EOF {
  1027. // Finish parsing create stream statement. Jump to validate
  1028. } else {
  1029. return nil, fmt.Errorf("found %q, expected semicolon or EOF.", lit3)
  1030. }
  1031. } else {
  1032. return nil, fmt.Errorf("found %q, expected stream name.", lit2)
  1033. }
  1034. if valErr := validateStream(stmt); valErr != nil {
  1035. return nil, valErr
  1036. }
  1037. return stmt, nil
  1038. } else {
  1039. p.unscan()
  1040. return nil, nil
  1041. }
  1042. }
  1043. // TODO more accurate validation for table
  1044. func validateStream(stmt *ast.StreamStmt) error {
  1045. f := stmt.Options.FORMAT
  1046. if f == "" {
  1047. f = message.FormatJson
  1048. }
  1049. lf := strings.ToLower(f)
  1050. switch lf {
  1051. case message.FormatBinary:
  1052. if stmt.StreamType == ast.TypeTable {
  1053. return fmt.Errorf("'binary' format is not supported for table")
  1054. }
  1055. switch len(stmt.StreamFields) {
  1056. case 0:
  1057. // do nothing for schemaless
  1058. case 1:
  1059. f := stmt.StreamFields[0]
  1060. if bt, ok := f.FieldType.(*ast.BasicType); ok {
  1061. if bt.Type == ast.BYTEA {
  1062. break
  1063. }
  1064. }
  1065. return fmt.Errorf("'binary' format stream can have only 'bytea' type field")
  1066. default:
  1067. return fmt.Errorf("'binary' format stream can have only one field")
  1068. }
  1069. default:
  1070. if !message.IsFormatSupported(lf) {
  1071. return fmt.Errorf("option 'format=%s' is invalid", f)
  1072. }
  1073. }
  1074. return nil
  1075. }
  1076. func (p *Parser) parseShowStmt() (ast.Statement, error) {
  1077. _, lit := p.scanIgnoreWhitespace()
  1078. lit = strings.ToUpper(lit)
  1079. if lit == ast.SHOW {
  1080. _, lit1 := p.scanIgnoreWhitespace()
  1081. lit1 = strings.ToUpper(lit1)
  1082. switch lit1 {
  1083. case ast.STREAMS:
  1084. ss := &ast.ShowStreamsStatement{}
  1085. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.EOF || tok2 == ast.SEMICOLON {
  1086. return ss, nil
  1087. } else {
  1088. return nil, fmt.Errorf("found %q, expected semecolon or EOF.", lit2)
  1089. }
  1090. case ast.TABLES:
  1091. ss := &ast.ShowTablesStatement{}
  1092. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.EOF || tok2 == ast.SEMICOLON {
  1093. return ss, nil
  1094. } else {
  1095. return nil, fmt.Errorf("found %q, expected semecolon or EOF.", lit2)
  1096. }
  1097. default:
  1098. return nil, fmt.Errorf("found %q, expected keyword streams or tables.", lit1)
  1099. }
  1100. } else {
  1101. p.unscan()
  1102. return nil, nil
  1103. }
  1104. }
  1105. func (p *Parser) parseDescribeStmt() (ast.Statement, error) {
  1106. _, lit := p.scanIgnoreWhitespace()
  1107. lit = strings.ToUpper(lit)
  1108. if lit == ast.DESCRIBE {
  1109. _, lit1 := p.scanIgnoreWhitespace()
  1110. lit1 = strings.ToUpper(lit1)
  1111. switch lit1 {
  1112. case ast.STREAM:
  1113. dss := &ast.DescribeStreamStatement{}
  1114. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.IDENT {
  1115. dss.Name = lit2
  1116. return dss, nil
  1117. } else {
  1118. return nil, fmt.Errorf("found %q, expected stream name.", lit2)
  1119. }
  1120. case ast.TABLE:
  1121. dss := &ast.DescribeTableStatement{}
  1122. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.IDENT {
  1123. dss.Name = lit2
  1124. return dss, nil
  1125. } else {
  1126. return nil, fmt.Errorf("found %q, expected table name.", lit2)
  1127. }
  1128. default:
  1129. return nil, fmt.Errorf("found %q, expected keyword stream or table.", lit1)
  1130. }
  1131. } else {
  1132. p.unscan()
  1133. return nil, nil
  1134. }
  1135. }
  1136. func (p *Parser) parseExplainStmt() (ast.Statement, error) {
  1137. _, lit := p.scanIgnoreWhitespace()
  1138. lit = strings.ToUpper(lit)
  1139. if lit == ast.EXPLAIN {
  1140. _, lit1 := p.scanIgnoreWhitespace()
  1141. lit1 = strings.ToUpper(lit1)
  1142. switch lit1 {
  1143. case ast.STREAM:
  1144. ess := &ast.ExplainStreamStatement{}
  1145. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.IDENT {
  1146. ess.Name = lit2
  1147. return ess, nil
  1148. } else {
  1149. return nil, fmt.Errorf("found %q, expected stream name.", lit2)
  1150. }
  1151. case ast.TABLE:
  1152. ess := &ast.ExplainTableStatement{}
  1153. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.IDENT {
  1154. ess.Name = lit2
  1155. return ess, nil
  1156. } else {
  1157. return nil, fmt.Errorf("found %q, expected table name.", lit2)
  1158. }
  1159. default:
  1160. return nil, fmt.Errorf("found %q, expected keyword stream or table.", lit1)
  1161. }
  1162. } else {
  1163. p.unscan()
  1164. return nil, nil
  1165. }
  1166. }
  1167. func (p *Parser) parseDropStmt() (ast.Statement, error) {
  1168. _, lit := p.scanIgnoreWhitespace()
  1169. lit = strings.ToUpper(lit)
  1170. if lit == ast.DROP {
  1171. _, lit1 := p.scanIgnoreWhitespace()
  1172. lit1 = strings.ToUpper(lit1)
  1173. switch lit1 {
  1174. case ast.STREAM:
  1175. ess := &ast.DropStreamStatement{}
  1176. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.IDENT {
  1177. ess.Name = lit2
  1178. return ess, nil
  1179. } else {
  1180. return nil, fmt.Errorf("found %q, expected stream name.", lit2)
  1181. }
  1182. case ast.TABLE:
  1183. ess := &ast.DropTableStatement{}
  1184. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.IDENT {
  1185. ess.Name = lit2
  1186. return ess, nil
  1187. } else {
  1188. return nil, fmt.Errorf("found %q, expected table name.", lit2)
  1189. }
  1190. default:
  1191. return nil, fmt.Errorf("found %q, expected keyword stream or table.", lit1)
  1192. }
  1193. } else {
  1194. p.unscan()
  1195. return nil, nil
  1196. }
  1197. }
  1198. func (p *Parser) parseStreamFields() (ast.StreamFields, error) {
  1199. lStack := &stack.Stack{}
  1200. var fields ast.StreamFields
  1201. if tok, lit := p.scanIgnoreWhitespace(); tok == ast.LPAREN {
  1202. lStack.Push(lit)
  1203. for {
  1204. // For the schemaless streams
  1205. // create stream demo () WITH (FORMAT="JSON", DATASOURCE="demo" TYPE="edgex")
  1206. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == ast.RPAREN {
  1207. lStack.Pop()
  1208. if _, lit2 := p.scanIgnoreWhitespace(); strings.ToUpper(lit2) != ast.WITH {
  1209. return nil, fmt.Errorf("found %q, expected is with.", lit2)
  1210. }
  1211. return fields, nil
  1212. } else {
  1213. p.unscan()
  1214. }
  1215. if f, err := p.parseStreamField(); err != nil {
  1216. return nil, err
  1217. } else {
  1218. fields = append(fields, *f)
  1219. }
  1220. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == ast.RPAREN {
  1221. lStack.Pop()
  1222. tok2, lit2 := p.scanIgnoreWhitespace()
  1223. lit2 = strings.ToUpper(lit2)
  1224. if lit2 == ast.WITH {
  1225. // Check the stack for LPAREN; If the stack for LPAREN is not zero, then it's not correct.
  1226. if lStack.Len() > 0 {
  1227. return nil, fmt.Errorf("Parenthesis is not matched.")
  1228. }
  1229. break
  1230. } else if tok2 == ast.COMMA {
  1231. if lStack.Len() > 0 {
  1232. return nil, fmt.Errorf("Parenthesis is in create record type not matched.")
  1233. }
  1234. p.unscan()
  1235. break
  1236. } else if tok2 == ast.RPAREN { // The nested type definition of ARRAY and Struct, such as "field ARRAY(STRUCT(f BIGINT))"
  1237. if lStack.Len() > 0 {
  1238. return nil, fmt.Errorf("Parenthesis is not matched.")
  1239. }
  1240. p.unscan()
  1241. break
  1242. } else {
  1243. if lStack.Len() == 0 {
  1244. return nil, fmt.Errorf("found %q, expected is with.", lit2)
  1245. }
  1246. p.unscan()
  1247. }
  1248. } else {
  1249. p.unscan()
  1250. }
  1251. }
  1252. } else {
  1253. return nil, fmt.Errorf("found %q, expected lparen after stream name.", lit)
  1254. }
  1255. return fields, nil
  1256. }
  1257. func (p *Parser) parseStreamField() (*ast.StreamField, error) {
  1258. field := &ast.StreamField{}
  1259. if tok, lit := p.scanIgnoreWhitespace(); tok == ast.IDENT {
  1260. field.Name = lit
  1261. _, lit1 := p.scanIgnoreWhitespace()
  1262. if t := ast.GetDataType(lit1); t != ast.UNKNOWN && t.IsSimpleType() {
  1263. field.FieldType = &ast.BasicType{Type: t}
  1264. } else if t == ast.ARRAY {
  1265. if f, e := p.parseStreamArrayType(); e != nil {
  1266. return nil, e
  1267. } else {
  1268. field.FieldType = f
  1269. }
  1270. } else if t == ast.STRUCT {
  1271. if f, e := p.parseStreamStructType(); e != nil {
  1272. return nil, e
  1273. } else {
  1274. field.FieldType = f
  1275. }
  1276. } else if t == ast.UNKNOWN {
  1277. return nil, fmt.Errorf("found %q, expect valid stream field types(BIGINT | FLOAT | STRINGS | DATETIME | BOOLEAN | BYTEA | ARRAY | STRUCT).", lit1)
  1278. }
  1279. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.COMMA {
  1280. // Just consume the comma.
  1281. } else if tok2 == ast.RPAREN {
  1282. p.unscan()
  1283. } else {
  1284. return nil, fmt.Errorf("found %q, expect comma or rparen.", lit2)
  1285. }
  1286. } else {
  1287. return nil, fmt.Errorf("found %q, expect stream field name.", lit)
  1288. }
  1289. return field, nil
  1290. }
  1291. func (p *Parser) parseStreamArrayType() (ast.FieldType, error) {
  1292. lStack := &stack.Stack{}
  1293. if tok, _ := p.scanIgnoreWhitespace(); tok == ast.LPAREN {
  1294. lStack.Push(ast.LPAREN)
  1295. tok1, lit1 := p.scanIgnoreWhitespace()
  1296. t := ast.GetDataType(lit1)
  1297. if t != ast.UNKNOWN && t.IsSimpleType() {
  1298. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.RPAREN {
  1299. lStack.Pop()
  1300. if lStack.Len() > 0 {
  1301. return nil, fmt.Errorf("Parenthesis is in array type not matched.")
  1302. }
  1303. return &ast.ArrayType{Type: t}, nil
  1304. } else {
  1305. return nil, fmt.Errorf("found %q, expect rparen in array type definition.", lit2)
  1306. }
  1307. } else if t == ast.STRUCT {
  1308. if f, err := p.parseStreamStructType(); err != nil {
  1309. return nil, err
  1310. } else {
  1311. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.RPAREN {
  1312. lStack.Pop()
  1313. if lStack.Len() > 0 {
  1314. return nil, fmt.Errorf("Parenthesis is in struct of array type %q not matched.", tok1)
  1315. }
  1316. return &ast.ArrayType{Type: ast.STRUCT, FieldType: f}, nil
  1317. } else {
  1318. return nil, fmt.Errorf("found %q, expect rparen in struct of array type definition.", lit2)
  1319. }
  1320. }
  1321. } else if tok1 == ast.COMMA {
  1322. p.unscan()
  1323. } else {
  1324. return nil, fmt.Errorf("found %q, expect stream data types.", lit1)
  1325. }
  1326. }
  1327. return nil, nil
  1328. }
  1329. func (p *Parser) parseStreamStructType() (ast.FieldType, error) {
  1330. rf := &ast.RecType{}
  1331. if sfs, err := p.parseStreamFields(); err != nil {
  1332. return nil, err
  1333. } else {
  1334. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.COMMA {
  1335. rf.StreamFields = sfs
  1336. p.unscan()
  1337. } else if tok2 == ast.RPAREN {
  1338. rf.StreamFields = sfs
  1339. p.unscan()
  1340. } else {
  1341. return nil, fmt.Errorf("found %q, expect comma in create stream record statement.", lit2)
  1342. }
  1343. }
  1344. return rf, nil
  1345. }
  1346. func (p *Parser) parseStreamOptions() (*ast.Options, error) {
  1347. opts := &ast.Options{STRICT_VALIDATION: false}
  1348. v := reflect.ValueOf(opts)
  1349. lStack := &stack.Stack{}
  1350. if tok, lit := p.scanIgnoreWhitespace(); tok == ast.LPAREN {
  1351. lStack.Push(ast.LPAREN)
  1352. for {
  1353. tok1, lit1 := p.scanIgnoreWhitespace()
  1354. lit1 = strings.ToUpper(lit1)
  1355. if ast.IsStreamOptionKeyword(tok1, lit1) {
  1356. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.EQ {
  1357. if tok3, lit3 := p.scanIgnoreWhitespace(); tok3 == ast.STRING {
  1358. switch lit1 {
  1359. case ast.STRICT_VALIDATION:
  1360. if val := strings.ToUpper(lit3); (val != "TRUE") && (val != "FALSE") {
  1361. return nil, fmt.Errorf("found %q, expect TRUE/FALSE value in %s option.", lit3, lit1)
  1362. } else {
  1363. opts.STRICT_VALIDATION = val == "TRUE"
  1364. }
  1365. case ast.RETAIN_SIZE:
  1366. if val, err := strconv.Atoi(lit3); err != nil {
  1367. return nil, fmt.Errorf("found %q, expect number value in %s option.", lit3, lit1)
  1368. } else {
  1369. opts.RETAIN_SIZE = val
  1370. }
  1371. case ast.SHARED:
  1372. if val := strings.ToUpper(lit3); (val != "TRUE") && (val != "FALSE") {
  1373. return nil, fmt.Errorf("found %q, expect TRUE/FALSE value in %s option.", lit3, lit1)
  1374. } else {
  1375. opts.SHARED = val == "TRUE"
  1376. }
  1377. case ast.KIND:
  1378. val := strings.ToLower(lit3)
  1379. opts.KIND = val
  1380. default:
  1381. f := v.Elem().FieldByName(lit1)
  1382. if f.IsValid() {
  1383. f.SetString(lit3)
  1384. } else { // should not happen
  1385. return nil, fmt.Errorf("invalid field %s.", lit1)
  1386. }
  1387. }
  1388. } else {
  1389. return nil, fmt.Errorf("found %q, expect string value in option.", lit3)
  1390. }
  1391. } else {
  1392. return nil, fmt.Errorf("found %q, expect equals(=) in options.", lit2)
  1393. }
  1394. } else if tok1 == ast.COMMA {
  1395. continue
  1396. } else if tok1 == ast.RPAREN {
  1397. if lStack.Pop(); lStack.Len() == 0 {
  1398. break
  1399. }
  1400. return nil, fmt.Errorf("Parenthesis is not matched in options definition.")
  1401. } else {
  1402. return nil, fmt.Errorf("found %q, unknown option keys(DATASOURCE|FORMAT|KEY|CONF_KEY|SHARED|STRICT_VALIDATION|TYPE|TIMESTAMP|TIMESTAMP_FORMAT|RETAIN_SIZE|SCHEMAID).", lit1)
  1403. }
  1404. }
  1405. } else {
  1406. return nil, fmt.Errorf("found %q, expect stream options.", lit)
  1407. }
  1408. if opts.KIND == ast.StreamKindLookup && opts.TYPE == "memory" && opts.KEY == "" {
  1409. return nil, fmt.Errorf("Option \"key\" is required for memory lookup table.")
  1410. }
  1411. return opts, nil
  1412. }
  1413. // Only support filter on window now
  1414. func (p *Parser) parseFilter() (ast.Expr, error) {
  1415. if tok, _ := p.scanIgnoreWhitespace(); tok != ast.FILTER {
  1416. p.unscan()
  1417. return nil, nil
  1418. }
  1419. if tok, lit := p.scanIgnoreWhitespace(); tok != ast.LPAREN {
  1420. return nil, fmt.Errorf("Found %q after FILTER, expect parentheses.", lit)
  1421. }
  1422. if tok, lit := p.scanIgnoreWhitespace(); tok != ast.WHERE {
  1423. return nil, fmt.Errorf("Found %q after FILTER(, expect WHERE.", lit)
  1424. }
  1425. expr, err := p.ParseExpr()
  1426. if err != nil {
  1427. return nil, err
  1428. }
  1429. if tok, lit := p.scanIgnoreWhitespace(); tok != ast.RPAREN {
  1430. return nil, fmt.Errorf("Found %q after FILTER, expect right parentheses.", lit)
  1431. }
  1432. return expr, nil
  1433. }
  1434. func (p *Parser) parseAsterisk() (ast.Expr, error) {
  1435. switch p.inFunc {
  1436. case "mqtt", "meta":
  1437. return &ast.MetaRef{StreamName: ast.DefaultStream, Name: "*"}, nil
  1438. default:
  1439. return &ast.Wildcard{Token: ast.ASTERISK}, nil
  1440. }
  1441. }
  1442. func (p *Parser) inmeta() bool {
  1443. return p.inFunc == "meta" || p.inFunc == "mqtt"
  1444. }
  1445. func (p *Parser) parseOver(c *ast.Call) error {
  1446. if tok, _ := p.scanIgnoreWhitespace(); tok != ast.OVER {
  1447. p.unscan()
  1448. return nil
  1449. } else if function.IsAnalyticFunc(c.Name) {
  1450. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == ast.LPAREN {
  1451. if t, _ := p.scanIgnoreWhitespace(); t == ast.PARTITION {
  1452. if t1, l1 := p.scanIgnoreWhitespace(); t1 == ast.BY {
  1453. pe := &ast.PartitionExpr{}
  1454. for {
  1455. if exp, err := p.ParseExpr(); err != nil {
  1456. return err
  1457. } else {
  1458. pe.Exprs = append(pe.Exprs, exp)
  1459. }
  1460. if tok, _ := p.scanIgnoreWhitespace(); tok == ast.COMMA {
  1461. continue
  1462. }
  1463. p.unscan()
  1464. break
  1465. }
  1466. if len(pe.Exprs) == 0 {
  1467. return fmt.Errorf("PARTITION BY must have at least one expression.")
  1468. }
  1469. c.Partition = pe
  1470. } else {
  1471. return fmt.Errorf("found %q, expected by after partition.", l1)
  1472. }
  1473. } else {
  1474. p.unscan()
  1475. }
  1476. if t, _ := p.scanIgnoreWhitespace(); t == ast.WHEN {
  1477. if exp, err := p.ParseExpr(); err != nil {
  1478. return err
  1479. } else {
  1480. c.WhenExpr = exp
  1481. }
  1482. } else {
  1483. p.unscan()
  1484. }
  1485. if c.Partition != nil || c.WhenExpr != nil {
  1486. if ttt, _ := p.scanIgnoreWhitespace(); ttt != ast.RPAREN {
  1487. return fmt.Errorf("Found %q, expect right parentheses after OVER ", ttt)
  1488. }
  1489. }
  1490. if c.Partition == nil && c.WhenExpr == nil {
  1491. ttt, _ := p.scanIgnoreWhitespace()
  1492. return fmt.Errorf("Found %q after OVER (, expect partition by or when.", ttt)
  1493. }
  1494. return nil
  1495. } else {
  1496. return fmt.Errorf("Found %q after OVER, expect parentheses.", tok1)
  1497. }
  1498. } else {
  1499. return fmt.Errorf("Found OVER after non analytic function %s", c.Name)
  1500. }
  1501. }