improve error messages
This commit is contained in:
parent
2cad424379
commit
247c7a26b7
|
@ -22,6 +22,7 @@
|
||||||
> import qualified Text.Parsec as P (ParseError)
|
> import qualified Text.Parsec as P (ParseError)
|
||||||
> import Text.Parsec.Perm (permute,(<$?>), (<|?>))
|
> import Text.Parsec.Perm (permute,(<$?>), (<|?>))
|
||||||
> import qualified Text.Parsec.Expr as E
|
> import qualified Text.Parsec.Expr as E
|
||||||
|
> import Data.List (intercalate)
|
||||||
|
|
||||||
> import Language.SQL.SimpleSQL.Syntax
|
> import Language.SQL.SimpleSQL.Syntax
|
||||||
|
|
||||||
|
@ -132,7 +133,7 @@ which parses as a typed literal
|
||||||
> [(:[]) <$> oneOf "nNbBxX"
|
> [(:[]) <$> oneOf "nNbBxX"
|
||||||
> ,string "u&"
|
> ,string "u&"
|
||||||
> ,string "U&"
|
> ,string "U&"
|
||||||
> ] <* lookAhead (char '\'')
|
> ] <* lookAhead quote
|
||||||
|
|
||||||
> literal :: Parser ValueExpr
|
> literal :: Parser ValueExpr
|
||||||
> literal = number <|> stringValue <|> interval <|> try characterSetLiteral
|
> literal = number <|> stringValue <|> interval <|> try characterSetLiteral
|
||||||
|
@ -187,6 +188,9 @@ The parsing for the aggregate extensions is here as well:
|
||||||
|
|
||||||
aggregate([all|distinct] args [order by orderitems])
|
aggregate([all|distinct] args [order by orderitems])
|
||||||
|
|
||||||
|
TODO: try to refactor the parser to not allow distinct/all or order by
|
||||||
|
if there are no value exprs
|
||||||
|
|
||||||
> aggOrApp :: [Name] -> Parser ValueExpr
|
> aggOrApp :: [Name] -> Parser ValueExpr
|
||||||
> aggOrApp n =
|
> aggOrApp n =
|
||||||
> makeApp n
|
> makeApp n
|
||||||
|
@ -220,8 +224,7 @@ always used with the optionSuffix combinator.
|
||||||
> <*> option [] orderBy
|
> <*> option [] orderBy
|
||||||
> <*> optionMaybe frameClause)
|
> <*> optionMaybe frameClause)
|
||||||
> where
|
> where
|
||||||
> partitionBy = keyword_ "partition" >>
|
> partitionBy = keywords_ ["partition","by"] >> commaSep1 valueExpr
|
||||||
> keyword_ "by" >> commaSep1 valueExpr
|
|
||||||
> frameClause =
|
> frameClause =
|
||||||
> mkFrame <$> choice [FrameRows <$ keyword_ "rows"
|
> mkFrame <$> choice [FrameRows <$ keyword_ "rows"
|
||||||
> ,FrameRange <$ keyword_ "range"]
|
> ,FrameRange <$ keyword_ "range"]
|
||||||
|
@ -235,7 +238,9 @@ always used with the optionSuffix combinator.
|
||||||
> -- use the bexpression style from the between parsing for frame between
|
> -- use the bexpression style from the between parsing for frame between
|
||||||
> frameLimit useB =
|
> frameLimit useB =
|
||||||
> choice
|
> choice
|
||||||
> [Current <$ keyword_ "current" <* keyword_ "row"
|
> [Current <$ keywords_ ["current", "row"]
|
||||||
|
> -- todo: create an automatic left factor for stuff like
|
||||||
|
> -- this
|
||||||
> ,keyword_ "unbounded" >>
|
> ,keyword_ "unbounded" >>
|
||||||
> choice [UnboundedPreceding <$ keyword_ "preceding"
|
> choice [UnboundedPreceding <$ keyword_ "preceding"
|
||||||
> ,UnboundedFollowing <$ keyword_ "following"]
|
> ,UnboundedFollowing <$ keyword_ "following"]
|
||||||
|
@ -413,7 +418,7 @@ this is parsed as a postfix operator which is why it is in this form
|
||||||
> ,InList <$> commaSep1 valueExpr])
|
> ,InList <$> commaSep1 valueExpr])
|
||||||
> where
|
> where
|
||||||
> inty = choice [True <$ keyword_ "in"
|
> inty = choice [True <$ keyword_ "in"
|
||||||
> ,False <$ keyword_ "not" <* keyword_ "in"]
|
> ,False <$ keywords_ ["not","in"]]
|
||||||
> mkIn i v = \e -> In i e v
|
> mkIn i v = \e -> In i e v
|
||||||
|
|
||||||
|
|
||||||
|
@ -438,7 +443,7 @@ and operator. This is the call to valueExprB.
|
||||||
> where
|
> where
|
||||||
> opName = choice
|
> opName = choice
|
||||||
> ["between" <$ keyword_ "between"
|
> ["between" <$ keyword_ "between"
|
||||||
> ,"not between" <$ try (keyword_ "not" <* keyword_ "between")]
|
> ,"not between" <$ try (keywords_ ["not","between"])]
|
||||||
> makeOp n b c = \a -> SpecialOp [n] [a,b,c]
|
> makeOp n b c = \a -> SpecialOp [n] [a,b,c]
|
||||||
|
|
||||||
subquery expression:
|
subquery expression:
|
||||||
|
@ -508,13 +513,14 @@ typename: used in casts. Special cases for the multi keyword typenames
|
||||||
that SQL supports.
|
that SQL supports.
|
||||||
|
|
||||||
> typeName :: Parser TypeName
|
> typeName :: Parser TypeName
|
||||||
> typeName = choice (multiWordParsers
|
> typeName = (choice (multiWordParsers
|
||||||
> ++ [TypeName <$> identifierBlacklist blacklist])
|
> ++ [TypeName <$> identifierBlacklist blacklist])
|
||||||
> >>= optionSuffix precision
|
> >>= optionSuffix precision
|
||||||
|
> ) <?> "typename"
|
||||||
> where
|
> where
|
||||||
> multiWordParsers =
|
> multiWordParsers =
|
||||||
> flip map multiWordTypeNames
|
> flip map multiWordTypeNames
|
||||||
> $ \ks -> (TypeName . unwords) <$> try (mapM keyword ks)
|
> $ \ks -> (TypeName . unwords) <$> try (keywords ks)
|
||||||
> multiWordTypeNames = map words
|
> multiWordTypeNames = map words
|
||||||
> ["double precision"
|
> ["double precision"
|
||||||
> ,"character varying"
|
> ,"character varying"
|
||||||
|
@ -628,13 +634,13 @@ TODO: carefully review the precedences and associativities.
|
||||||
> -- use try with the multi keywords because of shared
|
> -- use try with the multi keywords because of shared
|
||||||
> -- prefixes to the sets of keywords. Should left factor
|
> -- prefixes to the sets of keywords. Should left factor
|
||||||
> -- somehow
|
> -- somehow
|
||||||
> binaryKeywords nm assoc = binary (try $ mapM_ keyword_ (words nm)) nm assoc
|
> binaryKeywords nm assoc = binary (try $ keywords_ (words nm)) nm assoc
|
||||||
> binary p nm assoc =
|
> binary p nm assoc =
|
||||||
> E.Infix (p >> return (\a b -> BinOp a [Name nm] b)) assoc
|
> E.Infix (p >> return (\a b -> BinOp a [Name nm] b)) assoc
|
||||||
> prefixKeyword nm = prefix (keyword_ nm) nm
|
> prefixKeyword nm = prefix (keyword_ nm) nm
|
||||||
> prefixSym nm = prefix (symbol_ nm) nm
|
> prefixSym nm = prefix (symbol_ nm) nm
|
||||||
> prefix p nm = prefix' (p >> return (PrefixOp [Name nm]))
|
> prefix p nm = prefix' (p >> return (PrefixOp [Name nm]))
|
||||||
> postfixKeywords nm = postfix (try $ mapM_ keyword_ (words nm)) nm
|
> postfixKeywords nm = postfix (try $ keywords_ (words nm)) nm
|
||||||
> postfix p nm = postfix' (p >> return (PostfixOp [Name nm]))
|
> postfix p nm = postfix' (p >> return (PostfixOp [Name nm]))
|
||||||
> -- hack from here
|
> -- hack from here
|
||||||
> -- http://stackoverflow.com/questions/10475337/parsec-expr-repeated-prefix-postfix-operator-not-supported
|
> -- http://stackoverflow.com/questions/10475337/parsec-expr-repeated-prefix-postfix-operator-not-supported
|
||||||
|
@ -724,6 +730,8 @@ tref
|
||||||
> <*> optionMaybe (joinCondition nat))
|
> <*> optionMaybe (joinCondition nat))
|
||||||
> >>= optionSuffix joinTrefSuffix
|
> >>= optionSuffix joinTrefSuffix
|
||||||
|
|
||||||
|
TODO: factor the join stuff to produce better error messages
|
||||||
|
|
||||||
> joinType :: Parser JoinType
|
> joinType :: Parser JoinType
|
||||||
> joinType = choice
|
> joinType = choice
|
||||||
> [JCross <$ keyword_ "cross" <* keyword_ "join"
|
> [JCross <$ keyword_ "cross" <* keyword_ "join"
|
||||||
|
@ -761,7 +769,7 @@ pretty trivial.
|
||||||
> whereClause = keyword_ "where" *> valueExpr
|
> whereClause = keyword_ "where" *> valueExpr
|
||||||
|
|
||||||
> groupByClause :: Parser [GroupingExpr]
|
> groupByClause :: Parser [GroupingExpr]
|
||||||
> groupByClause = keyword_ "group" *> keyword_ "by"
|
> groupByClause = keywords_ ["group","by"]
|
||||||
> *> commaSep1 groupingExpression
|
> *> commaSep1 groupingExpression
|
||||||
> where
|
> where
|
||||||
> groupingExpression =
|
> groupingExpression =
|
||||||
|
@ -771,7 +779,7 @@ pretty trivial.
|
||||||
> ,keyword_ "rollup" >>
|
> ,keyword_ "rollup" >>
|
||||||
> Rollup <$> parens (commaSep groupingExpression)
|
> Rollup <$> parens (commaSep groupingExpression)
|
||||||
> ,GroupingParens <$> parens (commaSep groupingExpression)
|
> ,GroupingParens <$> parens (commaSep groupingExpression)
|
||||||
> ,keyword_ "grouping" >> keyword_ "sets" >>
|
> ,keywords_ ["grouping", "sets"] >>
|
||||||
> GroupingSets <$> parens (commaSep groupingExpression)
|
> GroupingSets <$> parens (commaSep groupingExpression)
|
||||||
> ,SimpleGroup <$> valueExpr
|
> ,SimpleGroup <$> valueExpr
|
||||||
> ]
|
> ]
|
||||||
|
@ -780,13 +788,14 @@ pretty trivial.
|
||||||
> having = keyword_ "having" *> valueExpr
|
> having = keyword_ "having" *> valueExpr
|
||||||
|
|
||||||
> orderBy :: Parser [SortSpec]
|
> orderBy :: Parser [SortSpec]
|
||||||
> orderBy = keyword_ "order" *> keyword_ "by" *> commaSep1 ob
|
> orderBy = keywords_ ["order","by"] *> commaSep1 ob
|
||||||
> where
|
> where
|
||||||
> ob = SortSpec
|
> ob = SortSpec
|
||||||
> <$> valueExpr
|
> <$> valueExpr
|
||||||
> <*> option DirDefault (choice [Asc <$ keyword_ "asc"
|
> <*> option DirDefault (choice [Asc <$ keyword_ "asc"
|
||||||
> ,Desc <$ keyword_ "desc"])
|
> ,Desc <$ keyword_ "desc"])
|
||||||
> <*> option NullsOrderDefault
|
> <*> option NullsOrderDefault
|
||||||
|
> -- todo: left factor better
|
||||||
> (keyword_ "nulls" >>
|
> (keyword_ "nulls" >>
|
||||||
> choice [NullsFirst <$ keyword "first"
|
> choice [NullsFirst <$ keyword "first"
|
||||||
> ,NullsLast <$ keyword "last"])
|
> ,NullsLast <$ keyword "last"])
|
||||||
|
@ -805,7 +814,7 @@ allows offset and fetch in either order
|
||||||
|
|
||||||
> fetch :: Parser ValueExpr
|
> fetch :: Parser ValueExpr
|
||||||
> fetch = choice [ansiFetch, limit]
|
> fetch = choice [ansiFetch, limit]
|
||||||
> where
|
> where --todo: better left factoring
|
||||||
> ansiFetch = keyword_ "fetch" >>
|
> ansiFetch = keyword_ "fetch" >>
|
||||||
> choice [keyword_ "first",keyword_ "next"]
|
> choice [keyword_ "first",keyword_ "next"]
|
||||||
> *> valueExpr
|
> *> valueExpr
|
||||||
|
@ -971,8 +980,8 @@ make this choice.
|
||||||
> identifier = lexeme ((:) <$> firstChar <*> many nonFirstChar)
|
> identifier = lexeme ((:) <$> firstChar <*> many nonFirstChar)
|
||||||
> <?> "identifier"
|
> <?> "identifier"
|
||||||
> where
|
> where
|
||||||
> firstChar = letter <|> char '_'
|
> firstChar = letter <|> char '_' <?> "identifier"
|
||||||
> nonFirstChar = digit <|> firstChar
|
> nonFirstChar = digit <|> firstChar <?> ""
|
||||||
|
|
||||||
> quotedIdentifier :: Parser String
|
> quotedIdentifier :: Parser String
|
||||||
> quotedIdentifier = char '"' *> manyTill anyChar doubleQuote
|
> quotedIdentifier = char '"' *> manyTill anyChar doubleQuote
|
||||||
|
@ -998,7 +1007,7 @@ todo: work out the symbol parsing better
|
||||||
> <?> s
|
> <?> s
|
||||||
|
|
||||||
> questionMark :: Parser Char
|
> questionMark :: Parser Char
|
||||||
> questionMark = lexeme $ char '?'
|
> questionMark = lexeme (char '?') <?> "question mark"
|
||||||
|
|
||||||
> openParen :: Parser Char
|
> openParen :: Parser Char
|
||||||
> openParen = lexeme $ char '('
|
> openParen = lexeme $ char '('
|
||||||
|
@ -1014,13 +1023,16 @@ todo: work out the symbol parsing better
|
||||||
|
|
||||||
|
|
||||||
> comma :: Parser Char
|
> comma :: Parser Char
|
||||||
> comma = lexeme $ char ','
|
> comma = lexeme (char ',') <?> "comma"
|
||||||
|
|
||||||
> semi :: Parser Char
|
> semi :: Parser Char
|
||||||
> semi = lexeme $ char ';'
|
> semi = lexeme (char ';') <?> "semicolon"
|
||||||
|
|
||||||
> doubleQuote :: Parser Char
|
> doubleQuote :: Parser Char
|
||||||
> doubleQuote = lexeme $ char '"'
|
> doubleQuote = lexeme (char '"') <?> "double quotes"
|
||||||
|
|
||||||
|
> quote :: Parser Char
|
||||||
|
> quote = lexeme (char '\'') <?> "single quote"
|
||||||
|
|
||||||
> --stringToken :: Parser String
|
> --stringToken :: Parser String
|
||||||
> --stringToken = lexeme (char '\'' *> manyTill anyChar (char '\''))
|
> --stringToken = lexeme (char '\'' *> manyTill anyChar (char '\''))
|
||||||
|
@ -1028,23 +1040,25 @@ todo: work out the symbol parsing better
|
||||||
> -- string stuff
|
> -- string stuff
|
||||||
> stringToken :: Parser String
|
> stringToken :: Parser String
|
||||||
> stringToken =
|
> stringToken =
|
||||||
> lexeme (char '\'' *> manyTill anyChar (char '\'')
|
> lexeme (nlquote *> manyTill anyChar nlquote
|
||||||
> >>= optionSuffix moreString)
|
> >>= optionSuffix moreString)
|
||||||
> <?> "string"
|
> <?> "string"
|
||||||
> where
|
> where
|
||||||
> moreString s0 = choice
|
> moreString s0 = choice
|
||||||
> [-- handle two adjacent quotes
|
> [-- handle two adjacent quotes
|
||||||
> do
|
> do
|
||||||
> void $ char '\''
|
> void nlquote
|
||||||
> s <- manyTill anyChar (char '\'')
|
> s <- manyTill anyChar nlquote
|
||||||
> optionSuffix moreString (s0 ++ "'" ++ s)
|
> optionSuffix moreString (s0 ++ "'" ++ s)
|
||||||
> ,-- handle string in separate parts
|
> ,-- handle string in separate parts
|
||||||
> -- e.g. 'part 1' 'part 2'
|
> -- e.g. 'part 1' 'part 2'
|
||||||
> do
|
> do
|
||||||
> try (whitespace <* char '\'')
|
> try (whitespace <* nlquote)
|
||||||
> s <- manyTill anyChar (char '\'')
|
> s <- manyTill anyChar nlquote
|
||||||
> optionSuffix moreString (s0 ++ s)
|
> optionSuffix moreString (s0 ++ s)
|
||||||
> ]
|
> ]
|
||||||
|
> -- non lexeme quote
|
||||||
|
> nlquote = char '\'' <?> "single quote"
|
||||||
|
|
||||||
= helper functions
|
= helper functions
|
||||||
|
|
||||||
|
@ -1054,6 +1068,15 @@ todo: work out the symbol parsing better
|
||||||
> guard (map toLower i == k)
|
> guard (map toLower i == k)
|
||||||
> return k) <?> k
|
> return k) <?> k
|
||||||
|
|
||||||
|
helper function to improve error messages
|
||||||
|
|
||||||
|
> keywords :: [String] -> Parser [String]
|
||||||
|
> keywords ks = mapM keyword ks <?> intercalate " " ks
|
||||||
|
|
||||||
|
> keywords_ :: [String] -> Parser ()
|
||||||
|
> keywords_ ks = mapM_ keyword_ ks <?> intercalate " " ks
|
||||||
|
|
||||||
|
|
||||||
> parens :: Parser a -> Parser a
|
> parens :: Parser a -> Parser a
|
||||||
> parens = between openParen closeParen
|
> parens = between openParen closeParen
|
||||||
|
|
||||||
|
|
6
TODO
6
TODO
|
@ -115,7 +115,11 @@ quantified comparison: left factor with normal comparison
|
||||||
multi word operator names in expressions
|
multi word operator names in expressions
|
||||||
hardcode all the symbols in the symbol parser/split?
|
hardcode all the symbols in the symbol parser/split?
|
||||||
left factor the not in 'not in' and 'not between', maybe others
|
left factor the not in 'not in' and 'not between', maybe others
|
||||||
|
rules for changing the multi keyword parsing:
|
||||||
|
if a keyword must be followed by another
|
||||||
|
e.g. left join, want to refactor to produce 'expected "left join"'
|
||||||
|
if the keyword is optionally followed by another, e.g. with
|
||||||
|
recursive, then don't do this.
|
||||||
|
|
||||||
future big feature summary:
|
future big feature summary:
|
||||||
all ansi sql queries
|
all ansi sql queries
|
||||||
|
|
Loading…
Reference in a new issue