1
Fork 0

improve error messages

This commit is contained in:
Jake Wheat 2014-04-18 12:28:05 +03:00
parent 2cad424379
commit 247c7a26b7
2 changed files with 54 additions and 27 deletions

View file

@ -22,6 +22,7 @@
> import qualified Text.Parsec as P (ParseError) > import qualified Text.Parsec as P (ParseError)
> import Text.Parsec.Perm (permute,(<$?>), (<|?>)) > import Text.Parsec.Perm (permute,(<$?>), (<|?>))
> import qualified Text.Parsec.Expr as E > import qualified Text.Parsec.Expr as E
> import Data.List (intercalate)
> import Language.SQL.SimpleSQL.Syntax > import Language.SQL.SimpleSQL.Syntax
@ -132,7 +133,7 @@ which parses as a typed literal
> [(:[]) <$> oneOf "nNbBxX" > [(:[]) <$> oneOf "nNbBxX"
> ,string "u&" > ,string "u&"
> ,string "U&" > ,string "U&"
> ] <* lookAhead (char '\'') > ] <* lookAhead quote
> literal :: Parser ValueExpr > literal :: Parser ValueExpr
> literal = number <|> stringValue <|> interval <|> try characterSetLiteral > literal = number <|> stringValue <|> interval <|> try characterSetLiteral
@ -187,6 +188,9 @@ The parsing for the aggregate extensions is here as well:
aggregate([all|distinct] args [order by orderitems]) aggregate([all|distinct] args [order by orderitems])
TODO: try to refactor the parser to not allow distinct/all or order by
if there are no value exprs
> aggOrApp :: [Name] -> Parser ValueExpr > aggOrApp :: [Name] -> Parser ValueExpr
> aggOrApp n = > aggOrApp n =
> makeApp n > makeApp n
@ -220,8 +224,7 @@ always used with the optionSuffix combinator.
> <*> option [] orderBy > <*> option [] orderBy
> <*> optionMaybe frameClause) > <*> optionMaybe frameClause)
> where > where
> partitionBy = keyword_ "partition" >> > partitionBy = keywords_ ["partition","by"] >> commaSep1 valueExpr
> keyword_ "by" >> commaSep1 valueExpr
> frameClause = > frameClause =
> mkFrame <$> choice [FrameRows <$ keyword_ "rows" > mkFrame <$> choice [FrameRows <$ keyword_ "rows"
> ,FrameRange <$ keyword_ "range"] > ,FrameRange <$ keyword_ "range"]
@ -235,7 +238,9 @@ always used with the optionSuffix combinator.
> -- use the bexpression style from the between parsing for frame between > -- use the bexpression style from the between parsing for frame between
> frameLimit useB = > frameLimit useB =
> choice > choice
> [Current <$ keyword_ "current" <* keyword_ "row" > [Current <$ keywords_ ["current", "row"]
> -- todo: create an automatic left factor for stuff like
> -- this
> ,keyword_ "unbounded" >> > ,keyword_ "unbounded" >>
> choice [UnboundedPreceding <$ keyword_ "preceding" > choice [UnboundedPreceding <$ keyword_ "preceding"
> ,UnboundedFollowing <$ keyword_ "following"] > ,UnboundedFollowing <$ keyword_ "following"]
@ -413,7 +418,7 @@ this is parsed as a postfix operator which is why it is in this form
> ,InList <$> commaSep1 valueExpr]) > ,InList <$> commaSep1 valueExpr])
> where > where
> inty = choice [True <$ keyword_ "in" > inty = choice [True <$ keyword_ "in"
> ,False <$ keyword_ "not" <* keyword_ "in"] > ,False <$ keywords_ ["not","in"]]
> mkIn i v = \e -> In i e v > mkIn i v = \e -> In i e v
@ -438,7 +443,7 @@ and operator. This is the call to valueExprB.
> where > where
> opName = choice > opName = choice
> ["between" <$ keyword_ "between" > ["between" <$ keyword_ "between"
> ,"not between" <$ try (keyword_ "not" <* keyword_ "between")] > ,"not between" <$ try (keywords_ ["not","between"])]
> makeOp n b c = \a -> SpecialOp [n] [a,b,c] > makeOp n b c = \a -> SpecialOp [n] [a,b,c]
subquery expression: subquery expression:
@ -508,13 +513,14 @@ typename: used in casts. Special cases for the multi keyword typenames
that SQL supports. that SQL supports.
> typeName :: Parser TypeName > typeName :: Parser TypeName
> typeName = choice (multiWordParsers > typeName = (choice (multiWordParsers
> ++ [TypeName <$> identifierBlacklist blacklist]) > ++ [TypeName <$> identifierBlacklist blacklist])
> >>= optionSuffix precision > >>= optionSuffix precision
> ) <?> "typename"
> where > where
> multiWordParsers = > multiWordParsers =
> flip map multiWordTypeNames > flip map multiWordTypeNames
> $ \ks -> (TypeName . unwords) <$> try (mapM keyword ks) > $ \ks -> (TypeName . unwords) <$> try (keywords ks)
> multiWordTypeNames = map words > multiWordTypeNames = map words
> ["double precision" > ["double precision"
> ,"character varying" > ,"character varying"
@ -628,13 +634,13 @@ TODO: carefully review the precedences and associativities.
> -- use try with the multi keywords because of shared > -- use try with the multi keywords because of shared
> -- prefixes to the sets of keywords. Should left factor > -- prefixes to the sets of keywords. Should left factor
> -- somehow > -- somehow
> binaryKeywords nm assoc = binary (try $ mapM_ keyword_ (words nm)) nm assoc > binaryKeywords nm assoc = binary (try $ keywords_ (words nm)) nm assoc
> binary p nm assoc = > binary p nm assoc =
> E.Infix (p >> return (\a b -> BinOp a [Name nm] b)) assoc > E.Infix (p >> return (\a b -> BinOp a [Name nm] b)) assoc
> prefixKeyword nm = prefix (keyword_ nm) nm > prefixKeyword nm = prefix (keyword_ nm) nm
> prefixSym nm = prefix (symbol_ nm) nm > prefixSym nm = prefix (symbol_ nm) nm
> prefix p nm = prefix' (p >> return (PrefixOp [Name nm])) > prefix p nm = prefix' (p >> return (PrefixOp [Name nm]))
> postfixKeywords nm = postfix (try $ mapM_ keyword_ (words nm)) nm > postfixKeywords nm = postfix (try $ keywords_ (words nm)) nm
> postfix p nm = postfix' (p >> return (PostfixOp [Name nm])) > postfix p nm = postfix' (p >> return (PostfixOp [Name nm]))
> -- hack from here > -- hack from here
> -- http://stackoverflow.com/questions/10475337/parsec-expr-repeated-prefix-postfix-operator-not-supported > -- http://stackoverflow.com/questions/10475337/parsec-expr-repeated-prefix-postfix-operator-not-supported
@ -724,6 +730,8 @@ tref
> <*> optionMaybe (joinCondition nat)) > <*> optionMaybe (joinCondition nat))
> >>= optionSuffix joinTrefSuffix > >>= optionSuffix joinTrefSuffix
TODO: factor the join stuff to produce better error messages
> joinType :: Parser JoinType > joinType :: Parser JoinType
> joinType = choice > joinType = choice
> [JCross <$ keyword_ "cross" <* keyword_ "join" > [JCross <$ keyword_ "cross" <* keyword_ "join"
@ -761,7 +769,7 @@ pretty trivial.
> whereClause = keyword_ "where" *> valueExpr > whereClause = keyword_ "where" *> valueExpr
> groupByClause :: Parser [GroupingExpr] > groupByClause :: Parser [GroupingExpr]
> groupByClause = keyword_ "group" *> keyword_ "by" > groupByClause = keywords_ ["group","by"]
> *> commaSep1 groupingExpression > *> commaSep1 groupingExpression
> where > where
> groupingExpression = > groupingExpression =
@ -771,7 +779,7 @@ pretty trivial.
> ,keyword_ "rollup" >> > ,keyword_ "rollup" >>
> Rollup <$> parens (commaSep groupingExpression) > Rollup <$> parens (commaSep groupingExpression)
> ,GroupingParens <$> parens (commaSep groupingExpression) > ,GroupingParens <$> parens (commaSep groupingExpression)
> ,keyword_ "grouping" >> keyword_ "sets" >> > ,keywords_ ["grouping", "sets"] >>
> GroupingSets <$> parens (commaSep groupingExpression) > GroupingSets <$> parens (commaSep groupingExpression)
> ,SimpleGroup <$> valueExpr > ,SimpleGroup <$> valueExpr
> ] > ]
@ -780,13 +788,14 @@ pretty trivial.
> having = keyword_ "having" *> valueExpr > having = keyword_ "having" *> valueExpr
> orderBy :: Parser [SortSpec] > orderBy :: Parser [SortSpec]
> orderBy = keyword_ "order" *> keyword_ "by" *> commaSep1 ob > orderBy = keywords_ ["order","by"] *> commaSep1 ob
> where > where
> ob = SortSpec > ob = SortSpec
> <$> valueExpr > <$> valueExpr
> <*> option DirDefault (choice [Asc <$ keyword_ "asc" > <*> option DirDefault (choice [Asc <$ keyword_ "asc"
> ,Desc <$ keyword_ "desc"]) > ,Desc <$ keyword_ "desc"])
> <*> option NullsOrderDefault > <*> option NullsOrderDefault
> -- todo: left factor better
> (keyword_ "nulls" >> > (keyword_ "nulls" >>
> choice [NullsFirst <$ keyword "first" > choice [NullsFirst <$ keyword "first"
> ,NullsLast <$ keyword "last"]) > ,NullsLast <$ keyword "last"])
@ -805,7 +814,7 @@ allows offset and fetch in either order
> fetch :: Parser ValueExpr > fetch :: Parser ValueExpr
> fetch = choice [ansiFetch, limit] > fetch = choice [ansiFetch, limit]
> where > where --todo: better left factoring
> ansiFetch = keyword_ "fetch" >> > ansiFetch = keyword_ "fetch" >>
> choice [keyword_ "first",keyword_ "next"] > choice [keyword_ "first",keyword_ "next"]
> *> valueExpr > *> valueExpr
@ -971,8 +980,8 @@ make this choice.
> identifier = lexeme ((:) <$> firstChar <*> many nonFirstChar) > identifier = lexeme ((:) <$> firstChar <*> many nonFirstChar)
> <?> "identifier" > <?> "identifier"
> where > where
> firstChar = letter <|> char '_' > firstChar = letter <|> char '_' <?> "identifier"
> nonFirstChar = digit <|> firstChar > nonFirstChar = digit <|> firstChar <?> ""
> quotedIdentifier :: Parser String > quotedIdentifier :: Parser String
> quotedIdentifier = char '"' *> manyTill anyChar doubleQuote > quotedIdentifier = char '"' *> manyTill anyChar doubleQuote
@ -998,7 +1007,7 @@ todo: work out the symbol parsing better
> <?> s > <?> s
> questionMark :: Parser Char > questionMark :: Parser Char
> questionMark = lexeme $ char '?' > questionMark = lexeme (char '?') <?> "question mark"
> openParen :: Parser Char > openParen :: Parser Char
> openParen = lexeme $ char '(' > openParen = lexeme $ char '('
@ -1014,13 +1023,16 @@ todo: work out the symbol parsing better
> comma :: Parser Char > comma :: Parser Char
> comma = lexeme $ char ',' > comma = lexeme (char ',') <?> "comma"
> semi :: Parser Char > semi :: Parser Char
> semi = lexeme $ char ';' > semi = lexeme (char ';') <?> "semicolon"
> doubleQuote :: Parser Char > doubleQuote :: Parser Char
> doubleQuote = lexeme $ char '"' > doubleQuote = lexeme (char '"') <?> "double quotes"
> quote :: Parser Char
> quote = lexeme (char '\'') <?> "single quote"
> --stringToken :: Parser String > --stringToken :: Parser String
> --stringToken = lexeme (char '\'' *> manyTill anyChar (char '\'')) > --stringToken = lexeme (char '\'' *> manyTill anyChar (char '\''))
@ -1028,23 +1040,25 @@ todo: work out the symbol parsing better
> -- string stuff > -- string stuff
> stringToken :: Parser String > stringToken :: Parser String
> stringToken = > stringToken =
> lexeme (char '\'' *> manyTill anyChar (char '\'') > lexeme (nlquote *> manyTill anyChar nlquote
> >>= optionSuffix moreString) > >>= optionSuffix moreString)
> <?> "string" > <?> "string"
> where > where
> moreString s0 = choice > moreString s0 = choice
> [-- handle two adjacent quotes > [-- handle two adjacent quotes
> do > do
> void $ char '\'' > void nlquote
> s <- manyTill anyChar (char '\'') > s <- manyTill anyChar nlquote
> optionSuffix moreString (s0 ++ "'" ++ s) > optionSuffix moreString (s0 ++ "'" ++ s)
> ,-- handle string in separate parts > ,-- handle string in separate parts
> -- e.g. 'part 1' 'part 2' > -- e.g. 'part 1' 'part 2'
> do > do
> try (whitespace <* char '\'') > try (whitespace <* nlquote)
> s <- manyTill anyChar (char '\'') > s <- manyTill anyChar nlquote
> optionSuffix moreString (s0 ++ s) > optionSuffix moreString (s0 ++ s)
> ] > ]
> -- non lexeme quote
> nlquote = char '\'' <?> "single quote"
= helper functions = helper functions
@ -1054,6 +1068,15 @@ todo: work out the symbol parsing better
> guard (map toLower i == k) > guard (map toLower i == k)
> return k) <?> k > return k) <?> k
helper function to improve error messages
> keywords :: [String] -> Parser [String]
> keywords ks = mapM keyword ks <?> intercalate " " ks
> keywords_ :: [String] -> Parser ()
> keywords_ ks = mapM_ keyword_ ks <?> intercalate " " ks
> parens :: Parser a -> Parser a > parens :: Parser a -> Parser a
> parens = between openParen closeParen > parens = between openParen closeParen

6
TODO
View file

@ -115,7 +115,11 @@ quantified comparison: left factor with normal comparison
multi word operator names in expressions multi word operator names in expressions
hardcode all the symbols in the symbol parser/split? hardcode all the symbols in the symbol parser/split?
left factor the not in 'not in' and 'not between', maybe others left factor the not in 'not in' and 'not between', maybe others
rules for changing the multi keyword parsing:
if a keyword must be followed by another
e.g. left join, want to refactor to produce 'expected "left join"'
if the keyword is optionally followed by another, e.g. with
recursive, then don't do this.
future big feature summary: future big feature summary:
all ansi sql queries all ansi sql queries