simple-sql-parser/tools/Language/SQL/SimpleSQL/LexerTests.lhs



Tests for the lexer.

> module Language.SQL.SimpleSQL.LexerTests (lexerTests) where

> import Language.SQL.SimpleSQL.TestTypes
> import Language.SQL.SimpleSQL.Lex (Token(..))
> --import Debug.Trace
> import Data.Char (isAlpha)

> -- Top level test item for the lexer: a single "lexer token tests"
> -- group holding the per-dialect test groups.
> lexerTests :: TestItem
> lexerTests = Group "lexerTests" [tokenTests]
>   where
>     tokenTests = Group "lexer token tests" dialectGroups
>     dialectGroups = [ansiLexerTests, postgresLexerTests]

> -- Table of (source text, expected tokens) pairs used for the ansi
> -- dialect. Every entry here lexes to a single token; the table is
> -- used both directly and to generate pairwise combination tests.
> ansiLexerTable :: [(String,[Token])]
> ansiLexerTable = concat
>     [-- single char symbols
>      [([c], [Symbol [c]]) | c <- "+-^*/%~&|?<>[]=,;()"]
>      -- multi char symbols
>     ,[(s, [Symbol s]) | s <- [">=","<=","!=","<>","||"]]
>      -- simple identifiers
>     ,[(i, [Identifier Nothing i]) | i <- idens]
>      -- double quoted identifiers
>     ,[("\"" ++ i ++ "\"", [Identifier (Just ("\"","\"")) i]) | i <- idens]
>      -- u&"..." quoted identifiers
>      -- todo: in order to make lex . pretty id, need to
>      -- preserve the case of the u
>     ,[("u&\"" ++ i ++ "\"", [Identifier (Just ("u&\"","\"")) i]) | i <- idens]
>      -- host param
>     ,[(':':i, [HostParam i]) | i <- idens]
>      -- quoted identifiers with embedded double quotes
>      -- the lexer doesn't unescape the quotes
>     ,[("\"normal \"\" iden\"", [Identifier (Just ("\"","\"")) "normal \"\" iden"])]
>      -- strings
>      -- the lexer doesn't apply escapes at all
>     ,[("'string'", [SqlString "'" "'" "string"])
>      ,("'normal '' quote'", [SqlString "'" "'" "normal '' quote"])
>      ,("'normalendquote '''", [SqlString "'" "'" "normalendquote ''"])]
>      -- csstrings
>     ,[(c ++ "'test'", [SqlString (c ++ "'") "'" "test"])
>      | c <- ["n", "N","b", "B","x", "X", "u&"]]
>      -- numbers: the token carries the source text unchanged
>     ,[(n, [SqlNumber n])
>      | n <- ["10", ".1", "5e3", "5e+3", "5e-3", "10.2", "10.2e7"]]
>      -- whitespace: each single whitespace char exactly once, then
>      -- every ordered pair of whitespace chars
>     ,[([a], [Whitespace [a]]) | a <- wsChars]
>     ,[([a,b], [Whitespace [a,b]]) | a <- wsChars, b <- wsChars]
>      -- line comment
>     ,[(c, [LineComment c])
>      | c <- ["--", "-- ", "-- this is a comment", "-- line com\n"]]
>      -- block comment
>     ,[(c, [BlockComment c])
>      | c <- ["/**/", "/* */","/* this is a comment */"
>             ,"/* this *is/ a comment */"]]
>     ]
>   where
>     -- identifier texts reused for plain, quoted and host param forms
>     idens = ["a", "_a", "test", "table", "Stuff", "STUFF"]
>     wsChars = " \n\t"

> -- Lexer tests for the ansi dialect: the table entries on their own,
> -- generated pairwise concatenations of table entries, and a few
> -- hand written cases.
> ansiLexerTests :: TestItem
> ansiLexerTests = Group "ansiLexerTests" $
>     [Group "ansi lexer token tests" $
>      map (uncurry $ LexerTest ansi2011) ansiLexerTable
>     ,Group "ansi generated combination lexer tests" $
>     [ LexerTest ansi2011 (s ++ s1) (t ++ t1)
>     | (s,t) <- ansiLexerTable
>     , (s1,t1) <- ansiLexerTable

Which combinations won't work (these are filtered out by isGood):
<> <= >= || two single symbols which make a double char symbol
identifier + identifier if both are quoted or unquoted
string string
csstring string
line comment anything (can add newline?)
number number (todo: double check more carefully)

>     , isGood $ t ++ t1
>     ]
>     ,Group "adhoc lexer tests" $
>        map (uncurry $ LexerTest ansi2011)
>        [("", [])
>        ,("-- line com\nstuff", [LineComment "-- line com\n",Identifier Nothing "stuff"])
>        ]
>      ]

>  where
>    -- a token list is good when no two adjacent tokens match any of
>    -- the bad combinations
>    isGood :: [Token] -> Bool
>    isGood l = not $ any (\combo -> listPred combo l) badCombos
>    -- pairs of predicates (first token, following token) describing
>    -- adjacent tokens which are left out of the generated
>    -- combination tests
>    badCombos :: [((Token -> Bool),(Token -> Bool))]
>    badCombos = [symbolPair "<" ">"
>                ,symbolPair "<" "="
>                ,symbolPair ">" "="
>                ,symbolPair "!" "="
>                ,symbolPair "|" "|"
>                ,symbolPair "||" "|"
>                ,symbolPair "|" "||"
>                ,symbolPair "||" "||"
>                ,symbolPair "<" ">="

>                ,symbolPair "-" "-"
>                ,symbolPair "/" "*"
>                ,symbolPair "*" "/"

>                ,(isIdentifier, isIdentifier)
>                ,(isDQIdentifier, isDQIdentifier)
>                ,(isCQIdentifier, isDQIdentifier)
>                ,(isString, isNonCsString)
>                ,(isEofLineComment, const True)
>                ,(isNumber, isNumber)
>                ,(isHostParam,isIdentifier)
>                ,(isHostParam,isCsString)
>                ,(isHostParam,isCQIdentifier)
>                ,(isIdentifier,isCsString)
>                ,(isIdentifier,isCQIdentifier)
>                ,(isWhitespace, isWhitespace)
>                ,(isIdentifier, isNumber)
>                ,(isHostParam, isNumber)
>                ,(isMinus, isLineComment)
>                ]
>    -- unquoted identifier
>    isIdentifier :: Token -> Bool
>    isIdentifier (Identifier Nothing _) = True
>    isIdentifier _ = False
>    -- identifier whose opening quote is exactly a double quote
>    isDQIdentifier :: Token -> Bool
>    isDQIdentifier (Identifier (Just ("\"",_)) _) = True
>    isDQIdentifier _ = False
>    -- quoted identifier whose opening quote starts with a letter
>    -- (e.g. u&")
>    isCQIdentifier :: Token -> Bool
>    isCQIdentifier (Identifier (Just ((x:_),_)) _) | isAlpha x = True
>    isCQIdentifier _ = False
>    -- string whose opening quote starts with a letter (e.g. n')
>    isCsString :: Token -> Bool
>    isCsString (SqlString (x:_) _ _) | isAlpha x = True
>    isCsString _ = False
>    isString :: Token -> Bool
>    isString (SqlString _ _ _) = True
>    isString _ = False
>    -- string whose opening quote is empty or doesn't start with a
>    -- letter
>    isNonCsString :: Token -> Bool
>    isNonCsString (SqlString [] _ _) = True
>    isNonCsString (SqlString (x:_) _ _) | not (isAlpha x) = True
>    isNonCsString _ = False
>    -- line comment which isn't terminated by a newline; written
>    -- without 'last' so that it is total (empty text counts as
>    -- unterminated)
>    isEofLineComment :: Token -> Bool
>    isEofLineComment (LineComment s) = take 1 (reverse s) /= "\n"
>    isEofLineComment _ = False
>    isLineComment :: Token -> Bool
>    isLineComment (LineComment {}) = True
>    isLineComment _ = False
>    isNumber :: Token -> Bool
>    isNumber (SqlNumber{}) = True
>    isNumber _ = False
>    isHostParam :: Token -> Bool
>    isHostParam (HostParam{}) = True
>    isHostParam _ = False
>    isWhitespace :: Token -> Bool
>    isWhitespace (Whitespace{}) = True
>    isWhitespace _ = False
>    isMinus :: Token -> Bool
>    isMinus (Symbol "-") = True
>    isMinus _ = False
>    -- predicate pair matching exactly symbol a followed by symbol b
>    symbolPair :: String -> String -> ((Token -> Bool),(Token -> Bool))
>    symbolPair a b = ((==Symbol a), (==Symbol b))
>    -- True when some pair of adjacent tokens in the list satisfies
>    -- the two predicates in order; False for lists with fewer than
>    -- two tokens
>    listPred :: ((Token -> Bool),(Token -> Bool)) -> [Token] -> Bool
>    listPred (p,p1) ts = or $ zipWith (\a b -> p a && p1 b) ts (drop 1 ts)

todo: lexing tests
do quickcheck testing:
can try to generate valid tokens, then check that they parse

same as above: can also try to pair tokens, create an accurate
function to say which ones can appear adjacent, and test those pairs

I think this, plus the explicit lists of tokens like the ones above
(which do basic sanity checks) and explicit edge cases, will provide
a high level of assurance.


> -- Table of (source text, expected tokens) pairs used for the
> -- postgres dialect. Most entries lex to a single token; the
> -- unterminated-looking plain string case lexes to three.
> postgresLexerTable :: [(String,[Token])]
> postgresLexerTable = concat
>     [-- single char symbols
>      [([c], [Symbol [c]]) | c <- "+-^*/%~&|?<>[]=,;():"]
>      -- multi char symbols
>     ,[(s, [Symbol s]) | s <- [">=","<=","!=","<>","||", "::","..",":="]]
>      -- todo: add many examples of generic symbols
>      -- also: do the testing for the ansi compatibility special cases
>      -- simple identifiers
>     ,[(i, [Identifier Nothing i]) | i <- idens]
>      -- double quoted identifiers
>     ,[("\"" ++ i ++ "\"", [Identifier (Just ("\"","\"")) i]) | i <- idens]
>      -- u&"..." quoted identifiers
>      -- todo: in order to make lex . pretty id, need to
>      -- preserve the case of the u
>     ,[("u&\"" ++ i ++ "\"", [Identifier (Just ("u&\"","\"")) i]) | i <- idens]
>      -- host param
>     ,[(':':i, [HostParam i]) | i <- idens]
>      -- positional var
>     ,[("$1", [PositionalArg 1])]
>      -- quoted identifiers with embedded double quotes
>     ,[("\"normal \"\" iden\"", [Identifier (Just ("\"","\"")) "normal \"\" iden"])]
>      -- strings
>     ,[("'string'", [SqlString "'" "'" "string"])
>      ,("'normal '' quote'", [SqlString "'" "'" "normal '' quote"])
>      ,("'normalendquote '''", [SqlString "'" "'" "normalendquote ''"])
>       -- in e' strings both '' and \' stay inside the string
>      ,("e'this '' quote'", [SqlString "e'" "'" "this '' quote"])
>      ,("e'this \\' quote'", [SqlString "e'" "'" "this \\' quote"])
>       -- in a plain string the backslash doesn't escape the quote:
>       -- the string ends at the quote and the rest lexes separately
>      ,("'not this \\' quote", [SqlString "'" "'" "not this \\"
>                               ,Whitespace " "
>                               ,Identifier Nothing "quote"])
>       -- dollar quoted strings, with and without a tag
>      ,("$$ string 1 $$", [SqlString "$$" "$$" " string 1 "])
>      ,("$$ string $ 2 $$", [SqlString "$$" "$$" " string $ 2 "])
>      ,("$a$ $$string 3$$ $a$", [SqlString "$a$" "$a$" " $$string 3$$ "])
>      ]
>      -- csstrings
>     ,[(c ++ "'test'", [SqlString (c ++ "'") "'" "test"])
>      | c <- ["n", "N","b", "B","x", "X", "u&", "e", "E"]]
>      -- numbers: the token carries the source text unchanged
>     ,[(n, [SqlNumber n])
>      | n <- ["10", ".1", "5e3", "5e+3", "5e-3", "10.2", "10.2e7"]]
>      -- whitespace: each single whitespace char exactly once, then
>      -- every ordered pair of whitespace chars
>     ,[([a], [Whitespace [a]]) | a <- wsChars]
>     ,[([a,b], [Whitespace [a,b]]) | a <- wsChars, b <- wsChars]
>      -- line comment
>     ,[(c, [LineComment c])
>      | c <- ["--", "-- ", "-- this is a comment", "-- line com\n"]]
>      -- block comment
>     ,[(c, [BlockComment c])
>      | c <- ["/**/", "/* */","/* this is a comment */"
>             ,"/* this *is/ a comment */"]]
>     ]
>   where
>     -- identifier texts reused for plain, quoted and host param forms
>     idens = ["a", "_a", "test", "table", "Stuff", "STUFF"]
>     wsChars = " \n\t"

> -- Lexer tests for the postgres dialect: one LexerTest per entry in
> -- postgresLexerTable.
> postgresLexerTests :: TestItem
> postgresLexerTests = Group "postgresLexerTests" [tokenGroup]
>   where
>     tokenGroup = Group "postgres lexer token tests" $
>                  map (uncurry $ LexerTest postgres) postgresLexerTable
add separate lexer 2015-07-31 23:04:18 +02:00

			`Test for the lexer`

			`> module Language.SQL.SimpleSQL.LexerTests (lexerTests) where`

			`> import Language.SQL.SimpleSQL.TestTypes`
rename modules lexer->lex, parser->parse 2016-02-12 11:22:19 +01:00			`> import Language.SQL.SimpleSQL.Lex (Token(..))`
add separate lexer 2015-07-31 23:04:18 +02:00			`> --import Debug.Trace`
new syntax for names and string literals 2016-02-12 12:09:58 +01:00			`> import Data.Char (isAlpha)`
add separate lexer 2015-07-31 23:04:18 +02:00
don't unescape quotes in string literals and identifiers 2016-02-13 14:54:40 +01:00			`> lexerTests :: TestItem`
			`> lexerTests = Group "lexerTests" $`
work on postgresql lexing add positional arg add e' quoted strings add \' escaping in strings (not finished) add ::, :=, : symbols 2016-02-13 15:31:20 +01:00			`> [Group "lexer token tests" [ansiLexerTests`
			`> ,postgresLexerTests]]`
don't unescape quotes in string literals and identifiers 2016-02-13 14:54:40 +01:00
new syntax for names and string literals 2016-02-12 12:09:58 +01:00			`> ansiLexerTable :: [(String,[Token])]`
			`> ansiLexerTable =`
add separate lexer 2015-07-31 23:04:18 +02:00			`> -- single char symbols`
			`> map (\s -> ([s],[Symbol [s]])) "+-^*/%~&\|?<>[]=,;()"`
			`> -- multi char symbols`
			`> ++ map (\s -> (s,[Symbol s])) [">=","<=","!=","<>","\|\|"]`
			`> ++ (let idens = ["a", "_a", "test", "table", "Stuff", "STUFF"]`
			`> -- simple identifiers`
refactor the identifier syntax 2016-02-12 13:13:47 +01:00			`> in map (\i -> (i, [Identifier Nothing i])) idens`
			`> ++ map (\i -> ("\"" ++ i ++ "\"", [Identifier (Just ("\"","\"")) i])) idens`
add separate lexer 2015-07-31 23:04:18 +02:00			`> -- todo: in order to make lex . pretty id, need to`
			`> -- preserve the case of the u`
refactor the identifier syntax 2016-02-12 13:13:47 +01:00			`> ++ map (\i -> ("u&\"" ++ i ++ "\"", [Identifier (Just ("u&\"","\"")) i])) idens`
add separate lexer 2015-07-31 23:04:18 +02:00			`> -- host param`
			`> ++ map (\i -> (':':i, [HostParam i])) idens`
			`> )`
			`> -- quoted identifiers with embedded double quotes`
don't unescape quotes in string literals and identifiers 2016-02-13 14:54:40 +01:00			`> -- the lexer doesn't unescape the quotes`
			`> ++ [("\"normal \"\" iden\"", [Identifier (Just ("\"","\"")) "normal \"\" iden"])]`
add separate lexer 2015-07-31 23:04:18 +02:00			`> -- strings`
don't unescape quotes in string literals and identifiers 2016-02-13 14:54:40 +01:00			`> -- the lexer doesn't apply escapes at all`
new syntax for names and string literals 2016-02-12 12:09:58 +01:00			`> ++ [("'string'", [SqlString "'" "'" "string"])`
don't unescape quotes in string literals and identifiers 2016-02-13 14:54:40 +01:00			`> ,("'normal '' quote'", [SqlString "'" "'" "normal '' quote"])`
			`> ,("'normalendquote '''", [SqlString "'" "'" "normalendquote ''"])]`
add separate lexer 2015-07-31 23:04:18 +02:00			`> -- csstrings`
new syntax for names and string literals 2016-02-12 12:09:58 +01:00			`> ++ map (\c -> (c ++ "'test'", [SqlString (c ++ "'") "'" "test"]))`
add separate lexer 2015-07-31 23:04:18 +02:00			`> ["n", "N","b", "B","x", "X", "u&"]`
			`> -- numbers`
			`> ++ [("10", [SqlNumber "10"])`
			`> ,(".1", [SqlNumber ".1"])`
			`> ,("5e3", [SqlNumber "5e3"])`
			`> ,("5e+3", [SqlNumber "5e+3"])`
			`> ,("5e-3", [SqlNumber "5e-3"])`
			`> ,("10.2", [SqlNumber "10.2"])`
			`> ,("10.2e7", [SqlNumber "10.2e7"])]`
			`> -- whitespace`
			`> ++ concat [[([a],[Whitespace [a]])`
			`> ,([a,b], [Whitespace [a,b]])]`
			`> \| a <- " \n\t", b <- " \n\t"]`
			`> -- line comment`
			`> ++ map (\c -> (c, [LineComment c]))`
tweak lexer tests 2015-08-02 14:58:09 +02:00			`> ["--", "-- ", "-- this is a comment", "-- line com\n"]`
add separate lexer 2015-07-31 23:04:18 +02:00			`> -- block comment`
			`> ++ map (\c -> (c, [BlockComment c]))`
			`> ["/*/", "/ /","/ this is a comment */"`
small fixes fix positions? small fixes to haddock add notes to top of lexer module simplify line comment lexer remove some trys from lexer fix the block comment parser to return all the comment text when there are embedded / * in the comment refactor the symbol, keyword and identifier blacklist checking into the low level token parsers instead of a separate step using guard 2015-08-01 12:22:07 +02:00			`> ,"/* this is/ a comment /"`
add separate lexer 2015-07-31 23:04:18 +02:00			`> ]`

new syntax for names and string literals 2016-02-12 12:09:58 +01:00			`> ansiLexerTests :: TestItem`
			`> ansiLexerTests = Group "ansiLexerTests" $`
			`> [Group "ansi lexer token tests" $ [LexerTest ansi2011 s t \| (s,t) <- ansiLexerTable]`
			`> ,Group "ansi generated combination lexer tests" $`
refactor dialect into a non enum and separate to own file 2016-02-12 11:51:06 +01:00			`> [ LexerTest ansi2011 (s ++ s1) (t ++ t1)`
new syntax for names and string literals 2016-02-12 12:09:58 +01:00			`> \| (s,t) <- ansiLexerTable`
			`> , (s1,t1) <- ansiLexerTable`
add separate lexer 2015-07-31 23:04:18 +02:00
			`which combinations won't work:`
			`<> <= >= \|\| two single symbols which make a double char symbol`
			`identifier + identifier if both are quoted or unquoted`
			`string string`
			`csstring string`
			`line comment anything (can add newline?)`
			`number number (todo: double check more carefully)`

			`> , isGood $ t ++ t1`

			`> ]`
rearrange tests slightly and hide/show tests in the website a bit better 2015-08-15 18:04:29 +02:00			`> ,Group "adhoc lexer tests" $`
refactor dialect into a non enum and separate to own file 2016-02-12 11:51:06 +01:00			`> map (uncurry $ LexerTest ansi2011)`
add separate lexer 2015-07-31 23:04:18 +02:00			`> [("", [])`
refactor the identifier syntax 2016-02-12 13:13:47 +01:00			`> ,("-- line com\nstuff", [LineComment "-- line com\n",Identifier Nothing "stuff"])`
add separate lexer 2015-07-31 23:04:18 +02:00			`> ]`
rearrange tests slightly and hide/show tests in the website a bit better 2015-08-15 18:04:29 +02:00			`> ]`
add separate lexer 2015-07-31 23:04:18 +02:00
			`> where`
			`> isGood :: [Token] -> Bool`
			`> isGood l = {-let b =-} and $ map not [p l \| p <- map listPred badCombos]`
			`> -- in trace ("isGood " ++ show (l,b)) b`
			`> badCombos :: [((Token -> Bool),(Token -> Bool))]`
			`> badCombos = [symbolPair "<" ">"`
			`> ,symbolPair "<" "="`
			`> ,symbolPair ">" "="`
			`> ,symbolPair "!" "="`
			`> ,symbolPair "\|" "\|"`
			`> ,symbolPair "\|\|" "\|"`
			`> ,symbolPair "\|" "\|\|"`
			`> ,symbolPair "\|\|" "\|\|"`
			`> ,symbolPair "<" ">="`

			`> ,symbolPair "-" "-"`
			`> ,symbolPair "/" "*"`
			`> ,symbolPair "*" "/"`

			`> ,(isIdentifier, isIdentifier)`
new syntax for names and string literals 2016-02-12 12:09:58 +01:00			`> ,(isDQIdentifier, isDQIdentifier)`
			`> ,(isCQIdentifier, isDQIdentifier)`
			`> ,(isString, isNonCsString)`
tweak lexer tests 2015-08-02 14:58:09 +02:00			`> ,(isEofLineComment, const True)`
add separate lexer 2015-07-31 23:04:18 +02:00			`> ,(isNumber, isNumber)`
			`> ,(isHostParam,isIdentifier)`
			`> ,(isHostParam,isCsString)`
new syntax for names and string literals 2016-02-12 12:09:58 +01:00			`> ,(isHostParam,isCQIdentifier)`
add separate lexer 2015-07-31 23:04:18 +02:00			`> ,(isIdentifier,isCsString)`
new syntax for names and string literals 2016-02-12 12:09:58 +01:00			`> ,(isIdentifier,isCQIdentifier)`
add separate lexer 2015-07-31 23:04:18 +02:00			`> ,(isWhitespace, isWhitespace)`
			`> ,(isIdentifier, isNumber)`
			`> ,(isHostParam, isNumber)`
			`> ,(isMinus, isLineComment)`
			`> ]`
refactor the identifier syntax 2016-02-12 13:13:47 +01:00			`> isIdentifier (Identifier Nothing _) = True`
add separate lexer 2015-07-31 23:04:18 +02:00			`> isIdentifier _ = False`
refactor the identifier syntax 2016-02-12 13:13:47 +01:00			`> isDQIdentifier (Identifier (Just ("\"",_)) _) = True`
new syntax for names and string literals 2016-02-12 12:09:58 +01:00			`> isDQIdentifier _ = False`
refactor the identifier syntax 2016-02-12 13:13:47 +01:00			`> isCQIdentifier (Identifier (Just ((x:_),_)) _) \| isAlpha x = True`
new syntax for names and string literals 2016-02-12 12:09:58 +01:00			`> isCQIdentifier _ = False`
			`> isCsString (SqlString (x:_) _ _) \| isAlpha x = True`
add separate lexer 2015-07-31 23:04:18 +02:00			`> isCsString _ = False`
new syntax for names and string literals 2016-02-12 12:09:58 +01:00			`> isString (SqlString _ _ _) = True`
			`> isString _ = False`
			`> isNonCsString (SqlString [] _ _) = True`
			`> isNonCsString (SqlString (x:_) _ _) \| not (isAlpha x) = True`
			`> isNonCsString _ = False`
tweak lexer tests 2015-08-02 14:58:09 +02:00			`> isEofLineComment (LineComment s) = last s /= '\n'`
			`> isEofLineComment _ = False`
			`> isLineComment (LineComment {}) = True`
add separate lexer 2015-07-31 23:04:18 +02:00			`> isLineComment _ = False`
			`> isNumber (SqlNumber{}) = True`
			`> isNumber _ = False`
			`> isHostParam (HostParam{}) = True`
			`> isHostParam _ = False`
			`> isWhitespace (Whitespace{}) = True`
			`> isWhitespace _ = False`
			`> isMinus (Symbol "-") = True`
			`> isMinus _ = False`
			`> symbolPair a b = ((==Symbol a), (==Symbol b))`
			`> listPred :: ((Token -> Bool),(Token -> Bool)) -> [Token] -> Bool`
			`> listPred _ [] = False`
			`> listPred _ [_] = False`
			`> listPred (p,p1) (t:t1:ts) \| p t && p1 t1 = True`
			`> \| otherwise = listPred (p,p1) (t1:ts)`
don't unescape quotes in string literals and identifiers 2016-02-13 14:54:40 +01:00
			`todo: lexing tests`
			`do quickcheck testing:`
			`can try to generate valid tokens then check they parse`

			`same as above: can also try to pair tokens, create an accurate`
			`function to say which ones can appear adjacent, and test`

			`I think this plus the explicit lists of tokens like above which do`
			`basic sanity + explicit edge casts will provide a high level of`
			`assurance.`



			`> postgresLexerTable :: [(String,[Token])]`
			`> postgresLexerTable =`
			`> -- single char symbols`
work on postgresql lexing add positional arg add e' quoted strings add \' escaping in strings (not finished) add ::, :=, : symbols 2016-02-13 15:31:20 +01:00			`> map (\s -> ([s],[Symbol [s]])) "+-^*/%~&\|?<>[]=,;():"`
don't unescape quotes in string literals and identifiers 2016-02-13 14:54:40 +01:00			`> -- multi char symbols`
work on postgresql lexing add positional arg add e' quoted strings add \' escaping in strings (not finished) add ::, :=, : symbols 2016-02-13 15:31:20 +01:00			`> ++ map (\s -> (s,[Symbol s])) [">=","<=","!=","<>","\|\|", "::","..",":="]`
			`> -- todo: add many examples of generic symbols`
			`> -- also: do the testing for the ansi compatibility special cases`
don't unescape quotes in string literals and identifiers 2016-02-13 14:54:40 +01:00			`> ++ (let idens = ["a", "_a", "test", "table", "Stuff", "STUFF"]`
			`> -- simple identifiers`
			`> in map (\i -> (i, [Identifier Nothing i])) idens`
			`> ++ map (\i -> ("\"" ++ i ++ "\"", [Identifier (Just ("\"","\"")) i])) idens`
			`> -- todo: in order to make lex . pretty id, need to`
			`> -- preserve the case of the u`
			`> ++ map (\i -> ("u&\"" ++ i ++ "\"", [Identifier (Just ("u&\"","\"")) i])) idens`
			`> -- host param`
			`> ++ map (\i -> (':':i, [HostParam i])) idens`
			`> )`
			`> -- positional var`
work on postgresql lexing add positional arg add e' quoted strings add \' escaping in strings (not finished) add ::, :=, : symbols 2016-02-13 15:31:20 +01:00			`> ++ [("$1", [PositionalArg 1])]`
don't unescape quotes in string literals and identifiers 2016-02-13 14:54:40 +01:00			`> -- quoted identifiers with embedded double quotes`
work on postgresql lexing add positional arg add e' quoted strings add \' escaping in strings (not finished) add ::, :=, : symbols 2016-02-13 15:31:20 +01:00			`> ++ [("\"normal \"\" iden\"", [Identifier (Just ("\"","\"")) "normal \"\" iden"])]`
don't unescape quotes in string literals and identifiers 2016-02-13 14:54:40 +01:00			`> -- strings`
			`> ++ [("'string'", [SqlString "'" "'" "string"])`
			`> ,("'normal '' quote'", [SqlString "'" "'" "normal '' quote"])`
work on postgresql lexing add positional arg add e' quoted strings add \' escaping in strings (not finished) add ::, :=, : symbols 2016-02-13 15:31:20 +01:00			`> ,("'normalendquote '''", [SqlString "'" "'" "normalendquote ''"])`
			`> ,("e'this '' quote'", [SqlString "e'" "'" "this '' quote"])`
			`> ,("e'this \\' quote'", [SqlString "e'" "'" "this \\' quote"])`
add lexing for \' only in e' strings and dollar strings in pg dialect 2016-02-13 16:07:27 +01:00			`> ,("'not this \\' quote", [SqlString "'" "'" "not this \\"`
			`> ,Whitespace " "`
			`> ,Identifier Nothing "quote"])`
			`> ,("$$ string 1 $$", [SqlString "$$" "$$" " string 1 "])`
			`> ,("$$ string $ 2 $$", [SqlString "$$" "$$" " string $ 2 "])`
			`> ,("$a$ $$string 3$$ $a$", [SqlString "$a$" "$a$" " $$string 3$$ "])`
don't unescape quotes in string literals and identifiers 2016-02-13 14:54:40 +01:00			`> ]`
			`> -- csstrings`
			`> ++ map (\c -> (c ++ "'test'", [SqlString (c ++ "'") "'" "test"]))`
			`> ["n", "N","b", "B","x", "X", "u&", "e", "E"]`
			`> -- numbers`
			`> ++ [("10", [SqlNumber "10"])`
			`> ,(".1", [SqlNumber ".1"])`
			`> ,("5e3", [SqlNumber "5e3"])`
			`> ,("5e+3", [SqlNumber "5e+3"])`
			`> ,("5e-3", [SqlNumber "5e-3"])`
			`> ,("10.2", [SqlNumber "10.2"])`
			`> ,("10.2e7", [SqlNumber "10.2e7"])]`
			`> -- whitespace`
			`> ++ concat [[([a],[Whitespace [a]])`
			`> ,([a,b], [Whitespace [a,b]])]`
			`> \| a <- " \n\t", b <- " \n\t"]`
			`> -- line comment`
			`> ++ map (\c -> (c, [LineComment c]))`
			`> ["--", "-- ", "-- this is a comment", "-- line com\n"]`
			`> -- block comment`
			`> ++ map (\c -> (c, [BlockComment c]))`
			`> ["/*/", "/ /","/ this is a comment */"`
			`> ,"/* this is/ a comment /"`
			`> ]`
work on postgresql lexing add positional arg add e' quoted strings add \' escaping in strings (not finished) add ::, :=, : symbols 2016-02-13 15:31:20 +01:00
			`> postgresLexerTests :: TestItem`
			`> postgresLexerTests = Group "postgresLexerTests" $`
			`> [Group "postgres lexer token tests" $ [LexerTest postgres s t \| (s,t) <- postgresLexerTable]`
			`> ]`