parser.go 42 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608
  1. // Copyright 2022-2023 EMQ Technologies Co., Ltd.
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. package xsql
  15. import (
  16. "fmt"
  17. "io"
  18. "math"
  19. "reflect"
  20. "strconv"
  21. "strings"
  22. "github.com/golang-collections/collections/stack"
  23. "github.com/lf-edge/ekuiper/internal/binder/function"
  24. "github.com/lf-edge/ekuiper/pkg/ast"
  25. "github.com/lf-edge/ekuiper/pkg/message"
  26. )
  27. type Parser struct {
  28. s *Scanner
  29. i int // buffer index
  30. n int // buffer char count
  31. buf [3]struct {
  32. tok ast.Token
  33. lit string
  34. }
  35. inFunc string // currently parsing function name
  36. f int // anonymous field index number
  37. fn int // function index number
  38. clause string
  39. sourceNames []string // source names in the from/join clause
  40. }
  41. func (p *Parser) ParseCondition() (ast.Expr, error) {
  42. if tok, _ := p.scanIgnoreWhitespace(); tok != ast.WHERE {
  43. p.unscan()
  44. return nil, nil
  45. }
  46. expr, err := p.ParseExpr()
  47. if err != nil {
  48. return nil, err
  49. }
  50. return expr, nil
  51. }
  52. func (p *Parser) scan() (tok ast.Token, lit string) {
  53. if p.n > 0 {
  54. p.n--
  55. return p.curr()
  56. }
  57. tok, lit = p.s.Scan()
  58. if tok != ast.WS && tok != ast.COMMENT {
  59. p.i = (p.i + 1) % len(p.buf)
  60. buf := &p.buf[p.i]
  61. buf.tok, buf.lit = tok, lit
  62. }
  63. return
  64. }
  65. func (p *Parser) curr() (ast.Token, string) {
  66. i := (p.i - p.n + len(p.buf)) % len(p.buf)
  67. buf := &p.buf[i]
  68. return buf.tok, buf.lit
  69. }
  70. func (p *Parser) scanIgnoreWhitespace() (tok ast.Token, lit string) {
  71. tok, lit = p.scan()
  72. for {
  73. if tok == ast.WS || tok == ast.COMMENT {
  74. tok, lit = p.scan()
  75. } else {
  76. break
  77. }
  78. }
  79. return tok, lit
  80. }
  81. func (p *Parser) unscan() { p.n++ }
  82. func NewParser(r io.Reader) *Parser {
  83. return &Parser{s: NewScanner(r)}
  84. }
  85. func NewParserWithSources(r io.Reader, sources []string) *Parser {
  86. return &Parser{s: NewScanner(r), sourceNames: sources}
  87. }
  88. func (p *Parser) ParseQueries() ([]ast.SelectStatement, error) {
  89. var stmts []ast.SelectStatement
  90. if stmt, err := p.Parse(); err != nil {
  91. return nil, err
  92. } else {
  93. stmts = append(stmts, *stmt)
  94. }
  95. for {
  96. if tok, _ := p.scanIgnoreWhitespace(); tok == ast.SEMICOLON {
  97. if stmt, err := p.Parse(); err != nil {
  98. return nil, err
  99. } else {
  100. if stmt != nil {
  101. stmts = append(stmts, *stmt)
  102. }
  103. }
  104. } else if tok == ast.EOF {
  105. break
  106. }
  107. }
  108. return stmts, nil
  109. }
  110. func (p *Parser) Parse() (*ast.SelectStatement, error) {
  111. selects := &ast.SelectStatement{}
  112. if tok, lit := p.scanIgnoreWhitespace(); tok == ast.EOF {
  113. return nil, nil
  114. } else if tok != ast.SELECT {
  115. return nil, fmt.Errorf("Found %q, Expected SELECT.\n", lit)
  116. }
  117. p.clause = "select"
  118. if fields, err := p.parseFields(); err != nil {
  119. return nil, err
  120. } else {
  121. selects.Fields = fields
  122. }
  123. p.clause = "from"
  124. if src, err := p.parseSource(); err != nil {
  125. return nil, err
  126. } else {
  127. selects.Sources = src
  128. }
  129. p.clause = "join"
  130. if joins, err := p.parseJoins(); err != nil {
  131. return nil, err
  132. } else {
  133. selects.Joins = joins
  134. }
  135. // The source names may be injected from outside to parse part of the sql
  136. if p.sourceNames == nil {
  137. p.sourceNames = getStreamNames(selects)
  138. }
  139. p.clause = "where"
  140. if exp, err := p.ParseCondition(); err != nil {
  141. return nil, err
  142. } else {
  143. if exp != nil {
  144. selects.Condition = exp
  145. }
  146. }
  147. p.clause = "groupby"
  148. if dims, err := p.parseDimensions(); err != nil {
  149. return nil, err
  150. } else {
  151. selects.Dimensions = dims
  152. }
  153. p.clause = "having"
  154. if having, err := p.parseHaving(); err != nil {
  155. return nil, err
  156. } else {
  157. selects.Having = having
  158. }
  159. p.clause = "orderby"
  160. if sorts, err := p.parseSorts(); err != nil {
  161. return nil, err
  162. } else {
  163. selects.SortFields = sorts
  164. }
  165. p.clause = ""
  166. if tok, lit := p.scanIgnoreWhitespace(); tok == ast.SEMICOLON {
  167. validateFields(selects, p.sourceNames)
  168. p.unscan()
  169. return selects, nil
  170. } else if tok != ast.EOF {
  171. return nil, fmt.Errorf("found %q, expected EOF.", lit)
  172. }
  173. if err := Validate(selects); err != nil {
  174. return nil, err
  175. }
  176. validateFields(selects, p.sourceNames)
  177. return selects, nil
  178. }
  179. func (p *Parser) parseSource() (ast.Sources, error) {
  180. var sources ast.Sources
  181. if tok, lit := p.scanIgnoreWhitespace(); tok != ast.FROM {
  182. return nil, fmt.Errorf("found %q, expected FROM.", lit)
  183. }
  184. if src, alias, err := p.parseSourceLiteral(); err != nil {
  185. return nil, err
  186. } else {
  187. sources = append(sources, &ast.Table{Name: src, Alias: alias})
  188. }
  189. return sources, nil
  190. }
  191. // TODO Current func has problems when the source includes white space.
  192. func (p *Parser) parseSourceLiteral() (string, string, error) {
  193. var sourceSeg []string
  194. var alias string
  195. for {
  196. // HASH, DIV & ADD token is specially support for MQTT topic name patterns.
  197. if tok, lit := p.scanIgnoreWhitespace(); tok.AllowedSourceToken() {
  198. sourceSeg = append(sourceSeg, lit)
  199. if tok1, lit1 := p.scanIgnoreWhitespace(); tok1 == ast.AS {
  200. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.IDENT {
  201. alias = lit2
  202. } else {
  203. return "", "", fmt.Errorf("found %q, expected JOIN key word.", lit)
  204. }
  205. } else if tok1.AllowedSourceToken() {
  206. sourceSeg = append(sourceSeg, lit1)
  207. } else {
  208. p.unscan()
  209. break
  210. }
  211. } else {
  212. p.unscan()
  213. break
  214. }
  215. }
  216. return strings.Join(sourceSeg, ""), alias, nil
  217. }
  218. func (p *Parser) parseFieldNameSections(isSubField bool) ([]string, error) {
  219. var fieldNameSects []string
  220. for {
  221. if tok, lit := p.scanIgnoreWhitespace(); tok == ast.IDENT || tok == ast.ASTERISK {
  222. fieldNameSects = append(fieldNameSects, lit)
  223. if len(fieldNameSects) > 1 {
  224. break
  225. }
  226. if tok1, _ := p.scanIgnoreWhitespace(); isSubField || !tok1.AllowedSFNToken() {
  227. p.unscan()
  228. break
  229. }
  230. } else {
  231. p.unscan()
  232. break
  233. }
  234. }
  235. if len(fieldNameSects) == 0 {
  236. return nil, fmt.Errorf("Cannot find any field name.\n")
  237. }
  238. return fieldNameSects, nil
  239. }
  240. func (p *Parser) parseJoins() (ast.Joins, error) {
  241. var joins ast.Joins
  242. for {
  243. if tok, lit := p.scanIgnoreWhitespace(); tok == ast.INNER || tok == ast.LEFT || tok == ast.RIGHT || tok == ast.FULL || tok == ast.CROSS {
  244. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == ast.JOIN {
  245. jt := ast.INNER_JOIN
  246. switch tok {
  247. case ast.INNER:
  248. jt = ast.INNER_JOIN
  249. case ast.LEFT:
  250. jt = ast.LEFT_JOIN
  251. case ast.RIGHT:
  252. jt = ast.RIGHT_JOIN
  253. case ast.FULL:
  254. jt = ast.FULL_JOIN
  255. case ast.CROSS:
  256. jt = ast.CROSS_JOIN
  257. }
  258. if j, err := p.ParseJoin(jt); err != nil {
  259. return nil, err
  260. } else {
  261. joins = append(joins, *j)
  262. }
  263. } else {
  264. return nil, fmt.Errorf("found %q, expected JOIN key word.", lit)
  265. }
  266. } else {
  267. p.unscan()
  268. if len(joins) > 0 {
  269. return joins, nil
  270. }
  271. return nil, nil
  272. }
  273. }
  274. }
  275. func (p *Parser) ParseJoin(joinType ast.JoinType) (*ast.Join, error) {
  276. j := &ast.Join{JoinType: joinType}
  277. if src, alias, err := p.parseSourceLiteral(); err != nil {
  278. return nil, err
  279. } else {
  280. j.Name = src
  281. j.Alias = alias
  282. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == ast.ON {
  283. if ast.CROSS_JOIN == joinType {
  284. return nil, fmt.Errorf("On expression is not required for cross join type.\n")
  285. }
  286. if exp, err := p.ParseExpr(); err != nil {
  287. return nil, err
  288. } else {
  289. j.Expr = exp
  290. }
  291. } else {
  292. p.unscan()
  293. }
  294. }
  295. return j, nil
  296. }
  297. func (p *Parser) parseDimensions() (ast.Dimensions, error) {
  298. var ds ast.Dimensions
  299. if t, _ := p.scanIgnoreWhitespace(); t == ast.GROUP {
  300. if t1, l1 := p.scanIgnoreWhitespace(); t1 == ast.BY {
  301. for {
  302. if exp, err := p.ParseExpr(); err != nil {
  303. return nil, err
  304. } else {
  305. d := ast.Dimension{Expr: exp}
  306. ds = append(ds, d)
  307. }
  308. if tok, _ := p.scanIgnoreWhitespace(); tok == ast.COMMA {
  309. continue
  310. }
  311. p.unscan()
  312. break
  313. }
  314. } else {
  315. return nil, fmt.Errorf("found %q, expected BY statement.", l1)
  316. }
  317. } else {
  318. p.unscan()
  319. }
  320. return ds, nil
  321. }
  322. func (p *Parser) parseHaving() (ast.Expr, error) {
  323. if tok, _ := p.scanIgnoreWhitespace(); tok != ast.HAVING {
  324. p.unscan()
  325. return nil, nil
  326. }
  327. expr, err := p.ParseExpr()
  328. if err != nil {
  329. return nil, err
  330. }
  331. return expr, nil
  332. }
  333. func (p *Parser) parseSorts() (ast.SortFields, error) {
  334. var ss ast.SortFields
  335. if t, _ := p.scanIgnoreWhitespace(); t == ast.ORDER {
  336. if t1, l1 := p.scanIgnoreWhitespace(); t1 == ast.BY {
  337. for {
  338. if t1, _ = p.scanIgnoreWhitespace(); t1 == ast.IDENT {
  339. s := ast.SortField{Ascending: true}
  340. p.unscan()
  341. if name, err := p.parseFieldNameSections(false); err == nil {
  342. if len(name) == 2 {
  343. s.StreamName = ast.StreamName(name[0])
  344. s.Name = name[1]
  345. p.unscan()
  346. p.unscan()
  347. } else {
  348. s.Name = name[0]
  349. }
  350. s.Uname = strings.Join(name, ast.COLUMN_SEPARATOR)
  351. } else {
  352. return nil, err
  353. }
  354. p.unscan()
  355. if exp, err := p.ParseExpr(); err != nil {
  356. return nil, err
  357. } else {
  358. s.FieldExpr = exp
  359. }
  360. if t2, _ := p.scanIgnoreWhitespace(); t2 == ast.DESC {
  361. s.Ascending = false
  362. ss = append(ss, s)
  363. } else if t2 == ast.ASC {
  364. ss = append(ss, s)
  365. } else {
  366. ss = append(ss, s)
  367. p.unscan()
  368. continue
  369. }
  370. } else if t1 == ast.COMMA {
  371. continue
  372. } else {
  373. p.unscan()
  374. break
  375. }
  376. }
  377. } else {
  378. return nil, fmt.Errorf("found %q, expected BY keyword.", l1)
  379. }
  380. } else {
  381. p.unscan()
  382. }
  383. return ss, nil
  384. }
  385. func (p *Parser) parseFields() (ast.Fields, error) {
  386. var fields ast.Fields
  387. for {
  388. field, err := p.parseField()
  389. if err != nil {
  390. return nil, err
  391. } else {
  392. fields = append(fields, *field)
  393. }
  394. tok, _ := p.scanIgnoreWhitespace()
  395. if tok != ast.COMMA {
  396. p.unscan()
  397. break
  398. }
  399. }
  400. return fields, nil
  401. }
  402. func (p *Parser) parseField() (*ast.Field, error) {
  403. field := &ast.Field{}
  404. if exp, err := p.ParseExpr(); err != nil {
  405. return nil, err
  406. } else {
  407. field.Name = nameExpr(exp)
  408. field.Expr = exp
  409. }
  410. if alias, err := p.parseAlias(); err != nil {
  411. return nil, err
  412. } else {
  413. if alias != "" {
  414. if field.Name == "*" {
  415. return nil, fmt.Errorf("alias is not supported for *")
  416. }
  417. field.AName = alias
  418. }
  419. }
  420. if field.Name == "" && field.AName == "" {
  421. field.Name = DEFAULT_FIELD_NAME_PREFIX + strconv.Itoa(p.f)
  422. p.f += 1
  423. }
  424. return field, nil
  425. }
  426. func nameExpr(exp ast.Expr) string {
  427. switch e := exp.(type) {
  428. case *ast.FieldRef:
  429. return e.Name
  430. case *ast.Call:
  431. return e.Name
  432. case *ast.Wildcard:
  433. return ast.Tokens[ast.ASTERISK]
  434. default:
  435. return ""
  436. }
  437. }
  438. func (p *Parser) parseAlias() (string, error) {
  439. tok, _ := p.scanIgnoreWhitespace()
  440. if tok == ast.AS {
  441. if tok, lit := p.scanIgnoreWhitespace(); tok != ast.IDENT {
  442. return "", fmt.Errorf("found %q, expected as alias.", lit)
  443. } else {
  444. return lit, nil
  445. }
  446. }
  447. p.unscan()
  448. return "", nil
  449. }
  450. func (p *Parser) ParseExpr() (ast.Expr, error) {
  451. var err error
  452. root := &ast.BinaryExpr{}
  453. root.RHS, err = p.parseUnaryExpr(false)
  454. if err != nil {
  455. return nil, err
  456. }
  457. for {
  458. op, _ := p.scanIgnoreWhitespace()
  459. if !op.IsOperator() {
  460. p.unscan()
  461. return root.RHS, nil
  462. } else if op == ast.ASTERISK { // Change the asterisk to Mul token.
  463. op = ast.MUL
  464. } else if op == ast.LBRACKET { // LBRACKET is a special token, need to unscan
  465. op = ast.SUBSET
  466. p.unscan()
  467. } else if op == ast.IN { // IN is a special token, need to unscan
  468. p.unscan()
  469. } else if op == ast.NOT {
  470. afterNot, tk1 := p.scanIgnoreWhitespace()
  471. switch afterNot {
  472. case ast.IN: // IN is a special token, need to unscan
  473. op = ast.NOTIN
  474. p.unscan()
  475. break
  476. case ast.BETWEEN:
  477. op = ast.NOTBETWEEN
  478. node := root
  479. var lhs ast.Expr
  480. for {
  481. r, ok := node.RHS.(*ast.BinaryExpr)
  482. if !ok || r.OP.Precedence() >= op.Precedence() {
  483. lhs = node.RHS
  484. break
  485. }
  486. node = r
  487. }
  488. expr, err := p.parseBetween(lhs, ast.NOTBETWEEN)
  489. if err != nil {
  490. return nil, err
  491. }
  492. node.RHS = expr
  493. continue
  494. case ast.LIKE:
  495. op = ast.NOTLIKE
  496. default:
  497. return nil, fmt.Errorf("found %q, expected expression", tk1)
  498. }
  499. } else if op == ast.BETWEEN {
  500. node := root
  501. var lhs ast.Expr
  502. for {
  503. r, ok := node.RHS.(*ast.BinaryExpr)
  504. if !ok || r.OP.Precedence() >= op.Precedence() {
  505. lhs = node.RHS
  506. break
  507. }
  508. node = r
  509. }
  510. expr, err := p.parseBetween(lhs, op)
  511. if err != nil {
  512. return nil, err
  513. }
  514. node.RHS = expr
  515. continue
  516. }
  517. var rhs ast.Expr
  518. if rhs, err = p.parseUnaryExpr(op == ast.ARROW || op == ast.DOT); err != nil {
  519. return nil, err
  520. } else if op == ast.DOT {
  521. op = ast.ARROW
  522. }
  523. if op == ast.LIKE || op == ast.NOTLIKE {
  524. lp := &ast.LikePattern{
  525. Expr: rhs,
  526. }
  527. if l, ok := lp.Expr.(*ast.StringLiteral); ok {
  528. lp.Pattern, err = lp.Compile(l.Val)
  529. if err != nil {
  530. return nil, fmt.Errorf("invalid LIKE pattern: %s", err)
  531. }
  532. }
  533. rhs = lp
  534. }
  535. for node := root; ; {
  536. r, ok := node.RHS.(*ast.BinaryExpr)
  537. if !ok || r.OP.Precedence() >= op.Precedence() {
  538. node.RHS = &ast.BinaryExpr{LHS: node.RHS, RHS: rhs, OP: op}
  539. break
  540. }
  541. node = r
  542. }
  543. }
  544. }
  545. func (p *Parser) parseBetween(lhs ast.Expr, op ast.Token) (ast.Expr, error) {
  546. alhs, err := p.parseUnaryExpr(false)
  547. if err != nil {
  548. return nil, err
  549. }
  550. opp, _ := p.scanIgnoreWhitespace()
  551. if opp != ast.AND {
  552. return nil, fmt.Errorf("expect AND expression after between but found %s", opp)
  553. }
  554. arhs, err := p.parseUnaryExpr(false)
  555. if err != nil {
  556. return nil, err
  557. }
  558. return &ast.BinaryExpr{
  559. LHS: lhs,
  560. OP: op,
  561. RHS: &ast.BetweenExpr{
  562. Lower: alhs,
  563. Higher: arhs,
  564. },
  565. }, nil
  566. }
  567. func (p *Parser) parseUnaryExpr(isSubField bool) (ast.Expr, error) {
  568. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == ast.LPAREN {
  569. expr, err := p.ParseExpr()
  570. if err != nil {
  571. return nil, err
  572. }
  573. // Expect an RPAREN at the end.
  574. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 != ast.RPAREN {
  575. return nil, fmt.Errorf("found %q, expected right paren.", lit2)
  576. }
  577. return &ast.ParenExpr{Expr: expr}, nil
  578. } else if tok1 == ast.LBRACKET {
  579. return p.parseBracketExpr()
  580. } else if tok1 == ast.IN {
  581. return p.parseValueSetExpr()
  582. }
  583. p.unscan()
  584. tok, lit := p.scanIgnoreWhiteSpaceWithNegativeNum()
  585. if tok == ast.CASE {
  586. return p.parseCaseExpr()
  587. } else if tok == ast.IDENT {
  588. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == ast.LPAREN {
  589. return p.parseCall(lit)
  590. }
  591. p.unscan() // Back the Lparen token
  592. p.unscan() // Back the ident token
  593. if n, err := p.parseFieldNameSections(isSubField); err != nil {
  594. return nil, err
  595. } else {
  596. if p.inmeta() {
  597. if len(n) == 2 {
  598. if len(p.sourceNames) > 0 && !contains(p.sourceNames, n[0]) {
  599. return &ast.BinaryExpr{
  600. LHS: &ast.MetaRef{StreamName: ast.DefaultStream, Name: n[0]},
  601. OP: ast.ARROW,
  602. RHS: &ast.JsonFieldRef{Name: n[1]},
  603. }, nil
  604. } else {
  605. return &ast.MetaRef{StreamName: ast.StreamName(n[0]), Name: n[1]}, nil
  606. }
  607. }
  608. if isSubField {
  609. return &ast.JsonFieldRef{Name: n[0]}, nil
  610. }
  611. return &ast.MetaRef{StreamName: ast.DefaultStream, Name: n[0]}, nil
  612. } else {
  613. if len(n) == 2 {
  614. if len(p.sourceNames) > 0 && !contains(p.sourceNames, n[0]) {
  615. return &ast.BinaryExpr{
  616. LHS: &ast.FieldRef{StreamName: ast.DefaultStream, Name: n[0]},
  617. OP: ast.ARROW,
  618. RHS: &ast.JsonFieldRef{Name: n[1]},
  619. }, nil
  620. } else {
  621. return &ast.FieldRef{StreamName: ast.StreamName(n[0]), Name: n[1]}, nil
  622. }
  623. }
  624. if isSubField {
  625. return &ast.JsonFieldRef{Name: n[0]}, nil
  626. }
  627. return &ast.FieldRef{StreamName: ast.DefaultStream, Name: n[0]}, nil
  628. }
  629. }
  630. } else if tok == ast.STRING || tok == ast.SINGLEQUOTE {
  631. return &ast.StringLiteral{Val: lit}, nil
  632. } else if tok == ast.INTEGER {
  633. val, _ := strconv.Atoi(lit)
  634. return &ast.IntegerLiteral{Val: val}, nil
  635. } else if tok == ast.NUMBER {
  636. if v, err := strconv.ParseFloat(lit, 64); err != nil {
  637. return nil, fmt.Errorf("found %q, invalid number value.", lit)
  638. } else {
  639. return &ast.NumberLiteral{Val: v}, nil
  640. }
  641. } else if tok == ast.TRUE || tok == ast.FALSE {
  642. if v, err := strconv.ParseBool(lit); err != nil {
  643. return nil, fmt.Errorf("found %q, invalid boolean value.", lit)
  644. } else {
  645. return &ast.BooleanLiteral{Val: v}, nil
  646. }
  647. } else if tok.IsTimeLiteral() {
  648. return &ast.TimeLiteral{Val: tok}, nil
  649. } else if tok == ast.ASTERISK {
  650. return p.parseAsterisk()
  651. }
  652. return nil, fmt.Errorf("found %q, expected expression.", lit)
  653. }
  654. func (p *Parser) parseValueSetExpr() (ast.Expr, error) {
  655. valsetExpr := &ast.ValueSetExpr{
  656. LiteralExprs: nil,
  657. ArrayExpr: nil,
  658. }
  659. // IN ("A", "B") or IN expression
  660. tk, _ := p.scanIgnoreWhitespace()
  661. if tk == ast.LPAREN {
  662. for {
  663. element, err := p.ParseExpr()
  664. if err != nil {
  665. return nil, fmt.Errorf("expect elements for IN expression, but %v", err)
  666. }
  667. valsetExpr.LiteralExprs = append(valsetExpr.LiteralExprs, element)
  668. if tok2, _ := p.scanIgnoreWhitespace(); tok2 != ast.COMMA {
  669. p.unscan()
  670. break
  671. }
  672. }
  673. if tok, lit := p.scanIgnoreWhitespace(); tok != ast.RPAREN {
  674. return nil, fmt.Errorf("expect ) for IN expression, but got %q", lit)
  675. }
  676. return valsetExpr, nil
  677. } else {
  678. // back to IN
  679. p.unscan()
  680. }
  681. if exp, err := p.parseUnaryExpr(false); err != nil {
  682. return nil, fmt.Errorf("expect expression after IN, but got error %v", err)
  683. } else {
  684. return exp, nil
  685. }
  686. }
  687. func (p *Parser) parseBracketExpr() (ast.Expr, error) {
  688. tok2, lit2 := p.scanIgnoreWhiteSpaceWithNegativeNum()
  689. if tok2 == ast.RBRACKET {
  690. // field[]
  691. return &ast.ColonExpr{Start: &ast.IntegerLiteral{Val: 0}, End: &ast.IntegerLiteral{Val: math.MinInt32}}, nil
  692. } else if tok2 == ast.INTEGER {
  693. start, err := strconv.Atoi(lit2)
  694. if err != nil {
  695. return nil, fmt.Errorf("The start index %s is not an int value in bracket expression.", lit2)
  696. }
  697. if tok3, _ := p.scanIgnoreWhitespace(); tok3 == ast.RBRACKET {
  698. // Such as field[2]
  699. return &ast.IndexExpr{Index: &ast.IntegerLiteral{Val: start}}, nil
  700. } else if tok3 == ast.COLON {
  701. // Such as field[2:] or field[2:4]
  702. return p.parseColonExpr(&ast.IntegerLiteral{Val: start})
  703. }
  704. } else if tok2 == ast.COLON {
  705. // Such as field[:3] or [:]
  706. return p.parseColonExpr(&ast.IntegerLiteral{Val: 0})
  707. } else {
  708. p.unscan()
  709. start, err := p.ParseExpr()
  710. if err != nil {
  711. return nil, fmt.Errorf("The start index %s is invalid in bracket expression.", lit2)
  712. }
  713. if tok3, _ := p.scanIgnoreWhitespace(); tok3 == ast.RBRACKET {
  714. // Such as field[2]
  715. return &ast.IndexExpr{Index: start}, nil
  716. } else if tok3 == ast.COLON {
  717. // Such as field[2:] or field[2:4]
  718. return p.parseColonExpr(start)
  719. }
  720. }
  721. return nil, fmt.Errorf("Unexpected token %q. when parsing bracket expressions.", lit2)
  722. }
  723. func (p *Parser) parseColonExpr(start ast.Expr) (ast.Expr, error) {
  724. tok, lit := p.scanIgnoreWhiteSpaceWithNegativeNum()
  725. if tok == ast.INTEGER {
  726. end, err := strconv.Atoi(lit)
  727. if err != nil {
  728. return nil, fmt.Errorf("The end index %s is not an int value in bracket expression.", lit)
  729. }
  730. if tok1, lit1 := p.scanIgnoreWhitespace(); tok1 == ast.RBRACKET {
  731. return &ast.ColonExpr{Start: start, End: &ast.IntegerLiteral{Val: end}}, nil
  732. } else {
  733. return nil, fmt.Errorf("Found %q, expected right bracket.", lit1)
  734. }
  735. } else if tok == ast.RBRACKET {
  736. return &ast.ColonExpr{Start: start, End: &ast.IntegerLiteral{Val: math.MinInt32}}, nil
  737. }
  738. p.unscan()
  739. end, err := p.ParseExpr()
  740. if err != nil {
  741. return nil, fmt.Errorf("The end index %s is invalid in bracket expression.", lit)
  742. }
  743. if tok1, lit1 := p.scanIgnoreWhitespace(); tok1 == ast.RBRACKET {
  744. return &ast.ColonExpr{Start: start, End: end}, nil
  745. } else {
  746. return nil, fmt.Errorf("Found %q, expected right bracket.", lit1)
  747. }
  748. }
  749. func (p *Parser) scanIgnoreWhiteSpaceWithNegativeNum() (ast.Token, string) {
  750. tok, lit := p.scanIgnoreWhitespace()
  751. if tok == ast.SUB {
  752. _, _ = p.s.ScanWhiteSpace()
  753. r := p.s.read()
  754. if isDigit(r) {
  755. p.s.unread()
  756. tok, lit = p.s.ScanNumber(false, true)
  757. }
  758. }
  759. return tok, lit
  760. }
  761. func (p *Parser) parseAs(f *ast.Field) (*ast.Field, error) {
  762. tok, lit := p.scanIgnoreWhitespace()
  763. if tok != ast.IDENT {
  764. return nil, fmt.Errorf("found %q, expected as alias.", lit)
  765. }
  766. f.AName = lit
  767. return f, nil
  768. }
  769. var WindowFuncs = map[string]struct{}{
  770. "tumblingwindow": {},
  771. "hoppingwindow": {},
  772. "sessionwindow": {},
  773. "slidingwindow": {},
  774. "countwindow": {},
  775. }
  776. func convFuncName(n string) (string, bool) {
  777. lname := strings.ToLower(n)
  778. if _, ok := WindowFuncs[lname]; ok {
  779. return lname, ok
  780. } else {
  781. return function.ConvName(n)
  782. }
  783. }
  784. func (p *Parser) parseCall(n string) (ast.Expr, error) {
  785. // Check if n function exists and convert it to lowercase for built-in func
  786. name, ok := convFuncName(n)
  787. if !ok {
  788. return nil, fmt.Errorf("function %s not found", n)
  789. }
  790. p.inFunc = name
  791. defer func() { p.inFunc = "" }()
  792. ft := function.GetFuncType(name)
  793. if ft == ast.FuncTypeCols && p.clause != "select" {
  794. return nil, fmt.Errorf("function %s can only be used inside the select clause", n)
  795. }
  796. var args []ast.Expr
  797. for {
  798. if tok, _ := p.scanIgnoreWhitespace(); tok == ast.RPAREN {
  799. break
  800. }
  801. p.unscan()
  802. if exp, err := p.ParseExpr(); err != nil {
  803. return nil, err
  804. } else {
  805. if ft == ast.FuncTypeCols {
  806. field := &ast.ColFuncField{Expr: exp, Name: nameExpr(exp)}
  807. args = append(args, field)
  808. } else {
  809. args = append(args, exp)
  810. }
  811. }
  812. if tok, lit := p.scanIgnoreWhitespace(); tok != ast.COMMA {
  813. if tok != ast.RPAREN {
  814. return nil, fmt.Errorf("found function call %q, expected ), but with %q.", name, lit)
  815. }
  816. break
  817. }
  818. }
  819. if wt, err := validateWindows(name, args); wt == ast.NOT_WINDOW {
  820. if valErr := validateFuncs(name, args); valErr != nil {
  821. return nil, valErr
  822. }
  823. // Add context for some aggregate func
  824. if name == "deduplicate" {
  825. args = append([]ast.Expr{&ast.Wildcard{Token: ast.ASTERISK}}, args...)
  826. }
  827. c := &ast.Call{Name: name, Args: args, FuncId: p.fn, FuncType: ft}
  828. p.fn += 1
  829. e := p.parseOver(c)
  830. return c, e
  831. } else {
  832. if err != nil {
  833. return nil, err
  834. }
  835. win, err := p.ConvertToWindows(wt, args)
  836. if err != nil {
  837. return nil, err
  838. }
  839. // parse filter clause
  840. f, err := p.parseFilter()
  841. if err != nil {
  842. return nil, err
  843. } else if f != nil {
  844. win.Filter = f
  845. }
  846. return win, nil
  847. }
  848. }
  849. func (p *Parser) parseCaseExpr() (*ast.CaseExpr, error) {
  850. c := &ast.CaseExpr{}
  851. tok, _ := p.scanIgnoreWhitespace()
  852. p.unscan()
  853. if tok != ast.WHEN { // no condition value for case, additional validation needed
  854. if exp, err := p.ParseExpr(); err != nil {
  855. return nil, err
  856. } else {
  857. c.Value = exp
  858. }
  859. }
  860. loop:
  861. for {
  862. tok, _ := p.scanIgnoreWhitespace()
  863. switch tok {
  864. case ast.WHEN:
  865. if exp, err := p.ParseExpr(); err != nil {
  866. return nil, err
  867. } else {
  868. if c.WhenClauses == nil {
  869. c.WhenClauses = make([]*ast.WhenClause, 0)
  870. }
  871. if c.Value == nil && !ast.IsBooleanArg(exp) {
  872. return nil, fmt.Errorf("invalid CASE expression, WHEN expression must be a bool condition")
  873. }
  874. w := &ast.WhenClause{
  875. Expr: exp,
  876. }
  877. tokThen, _ := p.scanIgnoreWhitespace()
  878. if tokThen != ast.THEN {
  879. return nil, fmt.Errorf("invalid CASE expression, THEN expected after WHEN")
  880. } else {
  881. if expThen, err := p.ParseExpr(); err != nil {
  882. return nil, err
  883. } else {
  884. w.Result = expThen
  885. c.WhenClauses = append(c.WhenClauses, w)
  886. }
  887. }
  888. }
  889. case ast.ELSE:
  890. if c.WhenClauses != nil {
  891. if exp, err := p.ParseExpr(); err != nil {
  892. return nil, err
  893. } else {
  894. c.ElseClause = exp
  895. }
  896. } else {
  897. return nil, fmt.Errorf("invalid CASE expression, WHEN expected before ELSE")
  898. }
  899. case ast.END:
  900. if c.WhenClauses != nil {
  901. break loop
  902. }
  903. return nil, fmt.Errorf("invalid CASE expression, WHEN expected before END")
  904. default:
  905. return nil, fmt.Errorf("invalid CASE expression, END expected")
  906. }
  907. }
  908. return c, nil
  909. }
  910. func validateWindows(fname string, args []ast.Expr) (ast.WindowType, error) {
  911. switch fname {
  912. case "tumblingwindow":
  913. if err := validateWindow(fname, 2, args); err != nil {
  914. return ast.TUMBLING_WINDOW, err
  915. }
  916. return ast.TUMBLING_WINDOW, nil
  917. case "hoppingwindow":
  918. if err := validateWindow(fname, 3, args); err != nil {
  919. return ast.HOPPING_WINDOW, err
  920. }
  921. return ast.HOPPING_WINDOW, nil
  922. case "sessionwindow":
  923. if err := validateWindow(fname, 3, args); err != nil {
  924. return ast.SESSION_WINDOW, err
  925. }
  926. return ast.SESSION_WINDOW, nil
  927. case "slidingwindow":
  928. if err := validateWindow(fname, 2, args); err != nil {
  929. return ast.SLIDING_WINDOW, err
  930. }
  931. return ast.SLIDING_WINDOW, nil
  932. case "countwindow":
  933. if len(args) == 1 {
  934. if para1, ok := args[0].(*ast.IntegerLiteral); ok && para1.Val > 0 {
  935. return ast.COUNT_WINDOW, nil
  936. } else {
  937. return ast.COUNT_WINDOW, fmt.Errorf("Invalid parameter value %s.", args[0])
  938. }
  939. } else if len(args) == 2 {
  940. if para1, ok1 := args[0].(*ast.IntegerLiteral); ok1 {
  941. if para2, ok2 := args[1].(*ast.IntegerLiteral); ok2 {
  942. if para1.Val < para2.Val {
  943. return ast.COUNT_WINDOW, fmt.Errorf("The second parameter value %d should be less than the first parameter %d.", para2.Val, para1.Val)
  944. } else {
  945. return ast.COUNT_WINDOW, nil
  946. }
  947. }
  948. }
  949. return ast.COUNT_WINDOW, fmt.Errorf("Invalid parameter value %s, %s.", args[0], args[1])
  950. } else {
  951. return ast.COUNT_WINDOW, fmt.Errorf("Invalid parameter count.")
  952. }
  953. }
  954. return ast.NOT_WINDOW, nil
  955. }
  956. func validateWindow(funcName string, expectLen int, args []ast.Expr) error {
  957. if len(args) != expectLen {
  958. return fmt.Errorf("The arguments for %s should be %d.\n", funcName, expectLen)
  959. }
  960. if _, ok := args[0].(*ast.TimeLiteral); !ok {
  961. return fmt.Errorf("The 1st argument for %s is expecting timer literal expression. One value of [dd|hh|mi|ss|ms].\n", funcName)
  962. }
  963. for i := 1; i < len(args); i++ {
  964. if _, ok := args[i].(*ast.IntegerLiteral); !ok {
  965. return fmt.Errorf("The %d argument for %s is expecting interger literal expression. \n", i, funcName)
  966. }
  967. }
  968. return nil
  969. }
  970. func (p *Parser) ConvertToWindows(wtype ast.WindowType, args []ast.Expr) (*ast.Window, error) {
  971. win := &ast.Window{WindowType: wtype}
  972. if wtype == ast.COUNT_WINDOW {
  973. win.Length = &ast.IntegerLiteral{Val: args[0].(*ast.IntegerLiteral).Val}
  974. if len(args) == 2 {
  975. win.Interval = &ast.IntegerLiteral{Val: args[1].(*ast.IntegerLiteral).Val}
  976. }
  977. return win, nil
  978. }
  979. unit := 1
  980. v := args[0].(*ast.TimeLiteral).Val
  981. switch v {
  982. case ast.DD:
  983. unit = 24 * 3600 * 1000
  984. case ast.HH:
  985. unit = 3600 * 1000
  986. case ast.MI:
  987. unit = 60 * 1000
  988. case ast.SS:
  989. unit = 1000
  990. case ast.MS:
  991. unit = 1
  992. default:
  993. return nil, fmt.Errorf("Invalid timeliteral %s", v)
  994. }
  995. win.Length = &ast.IntegerLiteral{Val: args[1].(*ast.IntegerLiteral).Val * unit}
  996. if len(args) > 2 {
  997. win.Interval = &ast.IntegerLiteral{Val: args[2].(*ast.IntegerLiteral).Val * unit}
  998. } else {
  999. win.Interval = &ast.IntegerLiteral{Val: 0}
  1000. }
  1001. return win, nil
  1002. }
  1003. func (p *Parser) ParseCreateStmt() (ast.Statement, error) {
  1004. _, lit := p.scanIgnoreWhitespace()
  1005. lit = strings.ToUpper(lit)
  1006. if lit == ast.CREATE {
  1007. _, lit1 := p.scanIgnoreWhitespace()
  1008. stmt := &ast.StreamStmt{}
  1009. lit1 = strings.ToUpper(lit1)
  1010. switch lit1 {
  1011. case ast.STREAM:
  1012. stmt.StreamType = ast.TypeStream
  1013. case ast.TABLE:
  1014. stmt.StreamType = ast.TypeTable
  1015. default:
  1016. return nil, fmt.Errorf("found %q, expected keyword stream or table.", lit1)
  1017. }
  1018. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.IDENT {
  1019. stmt.Name = ast.StreamName(lit2)
  1020. if fields, err := p.parseStreamFields(); err != nil {
  1021. return nil, err
  1022. } else {
  1023. stmt.StreamFields = fields
  1024. }
  1025. if opts, err := p.parseStreamOptions(); err != nil {
  1026. return nil, err
  1027. } else {
  1028. stmt.Options = opts
  1029. }
  1030. if tok3, lit3 := p.scanIgnoreWhitespace(); tok3 == ast.SEMICOLON {
  1031. p.unscan()
  1032. } else if tok3 == ast.EOF {
  1033. // Finish parsing create stream statement. Jump to validate
  1034. } else {
  1035. return nil, fmt.Errorf("found %q, expected semicolon or EOF.", lit3)
  1036. }
  1037. } else {
  1038. return nil, fmt.Errorf("found %q, expected stream name.", lit2)
  1039. }
  1040. if valErr := validateStream(stmt); valErr != nil {
  1041. return nil, valErr
  1042. }
  1043. return stmt, nil
  1044. } else {
  1045. p.unscan()
  1046. return nil, nil
  1047. }
  1048. }
  1049. // TODO more accurate validation for table
  1050. func validateStream(stmt *ast.StreamStmt) error {
  1051. f := stmt.Options.FORMAT
  1052. if f == "" {
  1053. f = message.FormatJson
  1054. }
  1055. lf := strings.ToLower(f)
  1056. switch lf {
  1057. case message.FormatBinary:
  1058. if stmt.StreamType == ast.TypeTable {
  1059. return fmt.Errorf("'binary' format is not supported for table")
  1060. }
  1061. switch len(stmt.StreamFields) {
  1062. case 0:
  1063. // do nothing for schemaless
  1064. case 1:
  1065. f := stmt.StreamFields[0]
  1066. if bt, ok := f.FieldType.(*ast.BasicType); ok {
  1067. if bt.Type == ast.BYTEA {
  1068. break
  1069. }
  1070. }
  1071. return fmt.Errorf("'binary' format stream can have only 'bytea' type field")
  1072. default:
  1073. return fmt.Errorf("'binary' format stream can have only one field")
  1074. }
  1075. default:
  1076. if !message.IsFormatSupported(lf) {
  1077. return fmt.Errorf("option 'format=%s' is invalid", f)
  1078. }
  1079. }
  1080. return nil
  1081. }
  1082. func (p *Parser) parseShowStmt() (ast.Statement, error) {
  1083. _, lit := p.scanIgnoreWhitespace()
  1084. lit = strings.ToUpper(lit)
  1085. if lit == ast.SHOW {
  1086. _, lit1 := p.scanIgnoreWhitespace()
  1087. lit1 = strings.ToUpper(lit1)
  1088. switch lit1 {
  1089. case ast.STREAMS:
  1090. ss := &ast.ShowStreamsStatement{}
  1091. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.EOF || tok2 == ast.SEMICOLON {
  1092. return ss, nil
  1093. } else {
  1094. return nil, fmt.Errorf("found %q, expected semecolon or EOF.", lit2)
  1095. }
  1096. case ast.TABLES:
  1097. ss := &ast.ShowTablesStatement{}
  1098. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.EOF || tok2 == ast.SEMICOLON {
  1099. return ss, nil
  1100. } else {
  1101. return nil, fmt.Errorf("found %q, expected semecolon or EOF.", lit2)
  1102. }
  1103. default:
  1104. return nil, fmt.Errorf("found %q, expected keyword streams or tables.", lit1)
  1105. }
  1106. } else {
  1107. p.unscan()
  1108. return nil, nil
  1109. }
  1110. }
  1111. func (p *Parser) parseDescribeStmt() (ast.Statement, error) {
  1112. _, lit := p.scanIgnoreWhitespace()
  1113. lit = strings.ToUpper(lit)
  1114. if lit == ast.DESCRIBE {
  1115. _, lit1 := p.scanIgnoreWhitespace()
  1116. lit1 = strings.ToUpper(lit1)
  1117. switch lit1 {
  1118. case ast.STREAM:
  1119. dss := &ast.DescribeStreamStatement{}
  1120. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.IDENT {
  1121. dss.Name = lit2
  1122. return dss, nil
  1123. } else {
  1124. return nil, fmt.Errorf("found %q, expected stream name.", lit2)
  1125. }
  1126. case ast.TABLE:
  1127. dss := &ast.DescribeTableStatement{}
  1128. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.IDENT {
  1129. dss.Name = lit2
  1130. return dss, nil
  1131. } else {
  1132. return nil, fmt.Errorf("found %q, expected table name.", lit2)
  1133. }
  1134. default:
  1135. return nil, fmt.Errorf("found %q, expected keyword stream or table.", lit1)
  1136. }
  1137. } else {
  1138. p.unscan()
  1139. return nil, nil
  1140. }
  1141. }
  1142. func (p *Parser) parseExplainStmt() (ast.Statement, error) {
  1143. _, lit := p.scanIgnoreWhitespace()
  1144. lit = strings.ToUpper(lit)
  1145. if lit == ast.EXPLAIN {
  1146. _, lit1 := p.scanIgnoreWhitespace()
  1147. lit1 = strings.ToUpper(lit1)
  1148. switch lit1 {
  1149. case ast.STREAM:
  1150. ess := &ast.ExplainStreamStatement{}
  1151. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.IDENT {
  1152. ess.Name = lit2
  1153. return ess, nil
  1154. } else {
  1155. return nil, fmt.Errorf("found %q, expected stream name.", lit2)
  1156. }
  1157. case ast.TABLE:
  1158. ess := &ast.ExplainTableStatement{}
  1159. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.IDENT {
  1160. ess.Name = lit2
  1161. return ess, nil
  1162. } else {
  1163. return nil, fmt.Errorf("found %q, expected table name.", lit2)
  1164. }
  1165. default:
  1166. return nil, fmt.Errorf("found %q, expected keyword stream or table.", lit1)
  1167. }
  1168. } else {
  1169. p.unscan()
  1170. return nil, nil
  1171. }
  1172. }
  1173. func (p *Parser) parseDropStmt() (ast.Statement, error) {
  1174. _, lit := p.scanIgnoreWhitespace()
  1175. lit = strings.ToUpper(lit)
  1176. if lit == ast.DROP {
  1177. _, lit1 := p.scanIgnoreWhitespace()
  1178. lit1 = strings.ToUpper(lit1)
  1179. switch lit1 {
  1180. case ast.STREAM:
  1181. ess := &ast.DropStreamStatement{}
  1182. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.IDENT {
  1183. ess.Name = lit2
  1184. return ess, nil
  1185. } else {
  1186. return nil, fmt.Errorf("found %q, expected stream name.", lit2)
  1187. }
  1188. case ast.TABLE:
  1189. ess := &ast.DropTableStatement{}
  1190. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.IDENT {
  1191. ess.Name = lit2
  1192. return ess, nil
  1193. } else {
  1194. return nil, fmt.Errorf("found %q, expected table name.", lit2)
  1195. }
  1196. default:
  1197. return nil, fmt.Errorf("found %q, expected keyword stream or table.", lit1)
  1198. }
  1199. } else {
  1200. p.unscan()
  1201. return nil, nil
  1202. }
  1203. }
  1204. func (p *Parser) parseStreamFields() (ast.StreamFields, error) {
  1205. lStack := &stack.Stack{}
  1206. var fields ast.StreamFields
  1207. if tok, lit := p.scanIgnoreWhitespace(); tok == ast.LPAREN {
  1208. lStack.Push(lit)
  1209. for {
  1210. // For the schemaless streams
  1211. // create stream demo () WITH (FORMAT="JSON", DATASOURCE="demo" TYPE="edgex")
  1212. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == ast.RPAREN {
  1213. lStack.Pop()
  1214. if _, lit2 := p.scanIgnoreWhitespace(); strings.ToUpper(lit2) != ast.WITH {
  1215. return nil, fmt.Errorf("found %q, expected is with.", lit2)
  1216. }
  1217. return fields, nil
  1218. } else {
  1219. p.unscan()
  1220. }
  1221. if f, err := p.parseStreamField(); err != nil {
  1222. return nil, err
  1223. } else {
  1224. fields = append(fields, *f)
  1225. }
  1226. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == ast.RPAREN {
  1227. lStack.Pop()
  1228. tok2, lit2 := p.scanIgnoreWhitespace()
  1229. lit2 = strings.ToUpper(lit2)
  1230. if lit2 == ast.WITH {
  1231. // Check the stack for LPAREN; If the stack for LPAREN is not zero, then it's not correct.
  1232. if lStack.Len() > 0 {
  1233. return nil, fmt.Errorf("Parenthesis is not matched.")
  1234. }
  1235. break
  1236. } else if tok2 == ast.COMMA {
  1237. if lStack.Len() > 0 {
  1238. return nil, fmt.Errorf("Parenthesis is in create record type not matched.")
  1239. }
  1240. p.unscan()
  1241. break
  1242. } else if tok2 == ast.RPAREN { // The nested type definition of ARRAY and Struct, such as "field ARRAY(STRUCT(f BIGINT))"
  1243. if lStack.Len() > 0 {
  1244. return nil, fmt.Errorf("Parenthesis is not matched.")
  1245. }
  1246. p.unscan()
  1247. break
  1248. } else {
  1249. if lStack.Len() == 0 {
  1250. return nil, fmt.Errorf("found %q, expected is with.", lit2)
  1251. }
  1252. p.unscan()
  1253. }
  1254. } else {
  1255. p.unscan()
  1256. }
  1257. }
  1258. } else {
  1259. return nil, fmt.Errorf("found %q, expected lparen after stream name.", lit)
  1260. }
  1261. return fields, nil
  1262. }
  1263. func (p *Parser) parseStreamField() (*ast.StreamField, error) {
  1264. field := &ast.StreamField{}
  1265. if tok, lit := p.scanIgnoreWhitespace(); tok == ast.IDENT {
  1266. field.Name = lit
  1267. _, lit1 := p.scanIgnoreWhitespace()
  1268. if t := ast.GetDataType(lit1); t != ast.UNKNOWN && t.IsSimpleType() {
  1269. field.FieldType = &ast.BasicType{Type: t}
  1270. } else if t == ast.ARRAY {
  1271. if f, e := p.parseStreamArrayType(); e != nil {
  1272. return nil, e
  1273. } else {
  1274. field.FieldType = f
  1275. }
  1276. } else if t == ast.STRUCT {
  1277. if f, e := p.parseStreamStructType(); e != nil {
  1278. return nil, e
  1279. } else {
  1280. field.FieldType = f
  1281. }
  1282. } else if t == ast.UNKNOWN {
  1283. return nil, fmt.Errorf("found %q, expect valid stream field types(BIGINT | FLOAT | STRINGS | DATETIME | BOOLEAN | BYTEA | ARRAY | STRUCT).", lit1)
  1284. }
  1285. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.COMMA {
  1286. // Just consume the comma.
  1287. } else if tok2 == ast.RPAREN {
  1288. p.unscan()
  1289. } else {
  1290. return nil, fmt.Errorf("found %q, expect comma or rparen.", lit2)
  1291. }
  1292. } else {
  1293. return nil, fmt.Errorf("found %q, expect stream field name.", lit)
  1294. }
  1295. return field, nil
  1296. }
  1297. func (p *Parser) parseStreamArrayType() (ast.FieldType, error) {
  1298. lStack := &stack.Stack{}
  1299. if tok, _ := p.scanIgnoreWhitespace(); tok == ast.LPAREN {
  1300. lStack.Push(ast.LPAREN)
  1301. tok1, lit1 := p.scanIgnoreWhitespace()
  1302. t := ast.GetDataType(lit1)
  1303. if t != ast.UNKNOWN && t.IsSimpleType() {
  1304. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.RPAREN {
  1305. lStack.Pop()
  1306. if lStack.Len() > 0 {
  1307. return nil, fmt.Errorf("Parenthesis is in array type not matched.")
  1308. }
  1309. return &ast.ArrayType{Type: t}, nil
  1310. } else {
  1311. return nil, fmt.Errorf("found %q, expect rparen in array type definition.", lit2)
  1312. }
  1313. } else if t == ast.STRUCT {
  1314. if f, err := p.parseStreamStructType(); err != nil {
  1315. return nil, err
  1316. } else {
  1317. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.RPAREN {
  1318. lStack.Pop()
  1319. if lStack.Len() > 0 {
  1320. return nil, fmt.Errorf("Parenthesis is in struct of array type %q not matched.", tok1)
  1321. }
  1322. return &ast.ArrayType{Type: ast.STRUCT, FieldType: f}, nil
  1323. } else {
  1324. return nil, fmt.Errorf("found %q, expect rparen in struct of array type definition.", lit2)
  1325. }
  1326. }
  1327. } else if tok1 == ast.COMMA {
  1328. p.unscan()
  1329. } else {
  1330. return nil, fmt.Errorf("found %q, expect stream data types.", lit1)
  1331. }
  1332. }
  1333. return nil, nil
  1334. }
  1335. func (p *Parser) parseStreamStructType() (ast.FieldType, error) {
  1336. rf := &ast.RecType{}
  1337. if sfs, err := p.parseStreamFields(); err != nil {
  1338. return nil, err
  1339. } else {
  1340. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.COMMA {
  1341. rf.StreamFields = sfs
  1342. p.unscan()
  1343. } else if tok2 == ast.RPAREN {
  1344. rf.StreamFields = sfs
  1345. p.unscan()
  1346. } else {
  1347. return nil, fmt.Errorf("found %q, expect comma in create stream record statement.", lit2)
  1348. }
  1349. }
  1350. return rf, nil
  1351. }
  1352. func (p *Parser) parseStreamOptions() (*ast.Options, error) {
  1353. opts := &ast.Options{STRICT_VALIDATION: false}
  1354. v := reflect.ValueOf(opts)
  1355. lStack := &stack.Stack{}
  1356. if tok, lit := p.scanIgnoreWhitespace(); tok == ast.LPAREN {
  1357. lStack.Push(ast.LPAREN)
  1358. for {
  1359. tok1, lit1 := p.scanIgnoreWhitespace()
  1360. lit1 = strings.ToUpper(lit1)
  1361. if ast.IsStreamOptionKeyword(tok1, lit1) {
  1362. if tok2, lit2 := p.scanIgnoreWhitespace(); tok2 == ast.EQ {
  1363. if tok3, lit3 := p.scanIgnoreWhitespace(); tok3 == ast.STRING {
  1364. switch lit1 {
  1365. case ast.STRICT_VALIDATION:
  1366. if val := strings.ToUpper(lit3); (val != "TRUE") && (val != "FALSE") {
  1367. return nil, fmt.Errorf("found %q, expect TRUE/FALSE value in %s option.", lit3, lit1)
  1368. } else {
  1369. opts.STRICT_VALIDATION = val == "TRUE"
  1370. }
  1371. case ast.RETAIN_SIZE:
  1372. if val, err := strconv.Atoi(lit3); err != nil {
  1373. return nil, fmt.Errorf("found %q, expect number value in %s option.", lit3, lit1)
  1374. } else {
  1375. opts.RETAIN_SIZE = val
  1376. }
  1377. case ast.SHARED:
  1378. if val := strings.ToUpper(lit3); (val != "TRUE") && (val != "FALSE") {
  1379. return nil, fmt.Errorf("found %q, expect TRUE/FALSE value in %s option.", lit3, lit1)
  1380. } else {
  1381. opts.SHARED = val == "TRUE"
  1382. }
  1383. case ast.KIND:
  1384. val := strings.ToLower(lit3)
  1385. opts.KIND = val
  1386. default:
  1387. f := v.Elem().FieldByName(lit1)
  1388. if f.IsValid() {
  1389. f.SetString(lit3)
  1390. } else { // should not happen
  1391. return nil, fmt.Errorf("invalid field %s.", lit1)
  1392. }
  1393. }
  1394. } else {
  1395. return nil, fmt.Errorf("found %q, expect string value in option.", lit3)
  1396. }
  1397. } else {
  1398. return nil, fmt.Errorf("found %q, expect equals(=) in options.", lit2)
  1399. }
  1400. } else if tok1 == ast.COMMA {
  1401. continue
  1402. } else if tok1 == ast.RPAREN {
  1403. if lStack.Pop(); lStack.Len() == 0 {
  1404. break
  1405. }
  1406. return nil, fmt.Errorf("Parenthesis is not matched in options definition.")
  1407. } else {
  1408. return nil, fmt.Errorf("found %q, unknown option keys(DATASOURCE|FORMAT|KEY|CONF_KEY|SHARED|STRICT_VALIDATION|TYPE|TIMESTAMP|TIMESTAMP_FORMAT|RETAIN_SIZE|SCHEMAID).", lit1)
  1409. }
  1410. }
  1411. } else {
  1412. return nil, fmt.Errorf("found %q, expect stream options.", lit)
  1413. }
  1414. if opts.KIND == ast.StreamKindLookup && opts.TYPE == "memory" && opts.KEY == "" {
  1415. return nil, fmt.Errorf("Option \"key\" is required for memory lookup table.")
  1416. }
  1417. return opts, nil
  1418. }
  1419. // Only support filter on window now
  1420. func (p *Parser) parseFilter() (ast.Expr, error) {
  1421. if tok, _ := p.scanIgnoreWhitespace(); tok != ast.FILTER {
  1422. p.unscan()
  1423. return nil, nil
  1424. }
  1425. if tok, lit := p.scanIgnoreWhitespace(); tok != ast.LPAREN {
  1426. return nil, fmt.Errorf("Found %q after FILTER, expect parentheses.", lit)
  1427. }
  1428. if tok, lit := p.scanIgnoreWhitespace(); tok != ast.WHERE {
  1429. return nil, fmt.Errorf("Found %q after FILTER(, expect WHERE.", lit)
  1430. }
  1431. expr, err := p.ParseExpr()
  1432. if err != nil {
  1433. return nil, err
  1434. }
  1435. if tok, lit := p.scanIgnoreWhitespace(); tok != ast.RPAREN {
  1436. return nil, fmt.Errorf("Found %q after FILTER, expect right parentheses.", lit)
  1437. }
  1438. return expr, nil
  1439. }
  1440. func (p *Parser) parseAsterisk() (ast.Expr, error) {
  1441. switch p.inFunc {
  1442. case "mqtt", "meta":
  1443. return &ast.MetaRef{StreamName: ast.DefaultStream, Name: "*"}, nil
  1444. default:
  1445. return &ast.Wildcard{Token: ast.ASTERISK}, nil
  1446. }
  1447. }
  1448. func (p *Parser) inmeta() bool {
  1449. return p.inFunc == "meta" || p.inFunc == "mqtt"
  1450. }
  1451. func (p *Parser) parseOver(c *ast.Call) error {
  1452. if tok, _ := p.scanIgnoreWhitespace(); tok != ast.OVER {
  1453. p.unscan()
  1454. return nil
  1455. } else if function.IsAnalyticFunc(c.Name) {
  1456. if tok1, _ := p.scanIgnoreWhitespace(); tok1 == ast.LPAREN {
  1457. if t, _ := p.scanIgnoreWhitespace(); t == ast.PARTITION {
  1458. if t1, l1 := p.scanIgnoreWhitespace(); t1 == ast.BY {
  1459. pe := &ast.PartitionExpr{}
  1460. for {
  1461. if exp, err := p.ParseExpr(); err != nil {
  1462. return err
  1463. } else {
  1464. pe.Exprs = append(pe.Exprs, exp)
  1465. }
  1466. if tok, _ := p.scanIgnoreWhitespace(); tok == ast.COMMA {
  1467. continue
  1468. }
  1469. p.unscan()
  1470. break
  1471. }
  1472. if len(pe.Exprs) == 0 {
  1473. return fmt.Errorf("PARTITION BY must have at least one expression.")
  1474. }
  1475. c.Partition = pe
  1476. } else {
  1477. return fmt.Errorf("found %q, expected by after partition.", l1)
  1478. }
  1479. } else {
  1480. p.unscan()
  1481. }
  1482. if t, _ := p.scanIgnoreWhitespace(); t == ast.WHEN {
  1483. if exp, err := p.ParseExpr(); err != nil {
  1484. return err
  1485. } else {
  1486. c.WhenExpr = exp
  1487. }
  1488. } else {
  1489. p.unscan()
  1490. }
  1491. if c.Partition != nil || c.WhenExpr != nil {
  1492. if ttt, _ := p.scanIgnoreWhitespace(); ttt != ast.RPAREN {
  1493. return fmt.Errorf("Found %q, expect right parentheses after OVER ", ttt)
  1494. }
  1495. }
  1496. if c.Partition == nil && c.WhenExpr == nil {
  1497. ttt, _ := p.scanIgnoreWhitespace()
  1498. return fmt.Errorf("Found %q after OVER (, expect partition by or when.", ttt)
  1499. }
  1500. return nil
  1501. } else {
  1502. return fmt.Errorf("Found %q after OVER, expect parentheses.", tok1)
  1503. }
  1504. } else {
  1505. return fmt.Errorf("Found OVER after non analytic function %s", c.Name)
  1506. }
  1507. }