krotik
/
eliasdb


			
				
					
						
						
							123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203
							/*
 * EliasDB
 *
 * Copyright 2016 Matthias Ladkau. All rights reserved.
 *
 * This Source Code Form is subject to the terms of the Mozilla Public
 * License, v. 2.0. If a copy of the MPL was not distributed with this
 * file, You can obtain one at http://mozilla.org/MPL/2.0/.
 */

/*
Package parser contains the EQL parser.

Lexer

Lex() is a lexer function to convert a given search query into a list of tokens.

Based on a talk by Rob Pike: Lexical Scanning in Go

https://www.youtube.com/watch?v=HxaD_trXwRE

Parser

Parse() is a parser which produces a parse tree from a given set of lexer tokens.

Based on an article by Douglas Crockford: Top Down Operator Precedence

http://crockford.com/javascript/tdop/tdop.html

which is based on the ideas of Vaughan Pratt and his paper: Top Down Operator Precedence

http://portal.acm.org/citation.cfm?id=512931
https://tdop.github.io/

ParseWithRuntime() parses a given input and decorates the resulting parse tree
with runtime components which can be used to interpret the parsed query.
*/
package parser

/*
LexTokenID represents a unique lexer token ID
*/
type LexTokenID int

/*
Available lexer token types
*/
const (
	TokenError LexTokenID = iota // Lexing error token with a message as val
	TokenEOF                     // End-of-file token

	TokenVALUE    // Simple value
	TokenNODEKIND // Node kind value

	TokenGeneral // General token used for plain ASTs

	TOKENodeSYMBOLS // Used to separate symbols from other tokens in this list

	TokenGEQ
	TokenLEQ
	TokenNEQ
	TokenEQ
	TokenGT
	TokenLT
	TokenLPAREN
	TokenRPAREN
	TokenLBRACK
	TokenRBRACK
	TokenCOMMA
	TokenAT
	TokenPLUS
	TokenMINUS
	TokenTIMES
	TokenDIV
	TokenDIVINT
	TokenMODINT

	// The colon ':' has a context specific meaning and is not processed by the parser

	TOKENodeKEYWORDS // Used to separate keywords from other tokens in this list

	TokenGET
	TokenLOOKUP
	TokenFROM
	TokenGROUP
	TokenWITH
	TokenLIST
	TokenNULLTRAVERSAL
	TokenFILTERING
	TokenORDERING
	TokenWHERE
	TokenTRAVERSE
	TokenEND
	TokenPRIMARY
	TokenSHOW
	TokenAS
	TokenFORMAT
	TokenAND
	TokenOR
	TokenLIKE
	TokenIN
	TokenCONTAINS
	TokenBEGINSWITH
	TokenENDSWITH
	TokenCONTAINSNOT
	TokenNOT
	TokenNOTIN
	TokenFALSE
	TokenTRUE
	TokenUNIQUE
	TokenUNIQUECOUNT
	TokenNULL
	TokenISNULL
	TokenISNOTNULL
	TokenASCENDING
	TokenDESCENDING
)

/*
Available parser AST node types
*/
const (
	NodeEOF = "EOF"

	NodeVALUE         = "value"
	NodeTRUE          = "true"
	NodeFALSE         = "false"
	NodeNULL          = "null"
	NodeFUNC          = "func"
	NodeORDERING      = "ordering"
	NodeFILTERING     = "filtering"
	NodeNULLTRAVERSAL = "nulltraversal"

	// Special tokens - always handled in a denotation function

	NodeCOMMA  = "comma"
	NodeGROUP  = "group"
	NodeEND    = "end"
	NodeAS     = "as"
	NodeFORMAT = "format"

	// Keywords

	NodeGET    = "get"
	NodeLOOKUP = "lookup"
	NodeFROM   = "from"
	NodeWHERE  = "where"

	NodeUNIQUE      = "unique"
	NodeUNIQUECOUNT = "uniquecount"
	NodeISNOTNULL   = "isnotnull"
	NodeASCENDING   = "asc"
	NodeDESCENDING  = "desc"

	NodeTRAVERSE = "traverse"
	NodePRIMARY  = "primary"
	NodeSHOW     = "show"
	NodeSHOWTERM = "showterm"
	NodeWITH     = "with"
	NodeLIST     = "list"

	// Boolean operations

	NodeOR  = "or"
	NodeAND = "and"
	NodeNOT = "not"

	NodeGEQ = ">="
	NodeLEQ = "<="
	NodeNEQ = "!="
	NodeEQ  = "="
	NodeGT  = ">"
	NodeLT  = "<"

	// List operations

	NodeIN    = "in"
	NodeNOTIN = "notin"

	// String operations

	NodeLIKE        = "like"
	NodeCONTAINS    = "contains"
	NodeBEGINSWITH  = "beginswith"
	NodeENDSWITH    = "endswith"
	NodeCONTAINSNOT = "containsnot"

	// Simple arithmetic expressions

	NodePLUS   = "plus"
	NodeMINUS  = "minus"
	NodeTIMES  = "times"
	NodeDIV    = "div"
	NodeMODINT = "modint"
	NodeDIVINT = "divint"

	// Brackets

	NodeLPAREN = "("
	NodeRPAREN = ")"
	NodeLBRACK = "["
	NodeRBRACK = "]"
)