我正在尝试为简单语言编写解析器;现在基本上它有文字,ifs,函数应用程序,而不是其他。
这是我得到的代码:
import Text.ParserCombinators.Parsec
import Control.Monad (liftM)
data Expr = Term Term
| Apply Expr Expr
| If Expr Expr Expr
deriving (Show)
data Term = Bool Bool
| Num Double
| String String
| Identifier String
| Parens Expr
deriving (Show)
sstring s = spaces >> string s
schar c = spaces >> char c
keyword k = do
kw <- try (sstring k)
notFollowedBy alphaNum
return kw
pBool :: Parser Bool
pBool = do
bool <- keyword "True" <|> keyword "False"
case bool of
"True" -> return True
"False" -> return False
pDouble :: Parser Double
pDouble = do
ds <- many1 digit
dot <- optionMaybe $ char '.'
case dot of
Nothing -> return $ read ds
_ -> do
ds' <- many1 digit
return $ read (ds ++ "." ++ ds')
pString :: Parser String
pString = do
char '"'
str <- many1 $ noneOf "\""
char '"'
return str
pIdentifier :: Parser String
pIdentifier = spaces >> many1 letter
pParens :: Parser Expr
pParens = do
schar '('
expr <- pExpr
schar ')'
return expr
pTerm :: Parser Term
pTerm = try (liftM Bool pBool)
<|> try (liftM Num pDouble)
<|> try (liftM String pString)
<|> try (liftM Identifier pIdentifier)
<|> try (liftM Parens pParens)
-- TODO: make this left-associative
pApply :: Parser Expr
pApply = do
term <- pTerm'
mApp <- spaces >> optionMaybe pApply
return $ case mApp of
Just app -> Apply term app
Nothing -> term
-- pulls "parens" expressions out of terms
pTerm' :: Parser Expr
pTerm' = do
term <- pTerm
case term of
Parens expr -> return expr
otherwise -> return $ Term term
pIf :: Parser Expr
pIf = do
keyword "if"
cond <- pExpr
keyword "then"
ifTrue <- pExpr
keyword "else"
ifFalse <- pExpr
return $ If cond ifTrue ifFalse
pExpr :: Parser Expr
pExpr = try pIf <|> pApply
test parser = parse parser ""
现在,如果我尝试解析ghci中的单个数字表达式,那么一切都很好:
> test pExpr "1"
Right (Term (Num 1.0))
大!许多其他事情也有效:
> test pExpr "1.234"
Right (Term (Num 1.234))
> test pApply "neg 1"
Right (Apply (Term (Identifier "neg")) (Term (Num 1.0)))
> test pExpr "f g 1"
Right (Apply (Term (Identifier "f")) (Apply (Term (Identifier "g")) (Term (Num 1.0))))
但是现在,如果我尝试解析if
语句,我会收到错误:
> test pIf "if 1 then 2 else 3"
Left (line 1, column 4):
unexpected "1"
expecting space, "if", "True", "False", letter or "("
这对我来说没有意义!让我们一步一步,查看解析if语句的规则:
我们解析"if"
关键字(没问题)。然后,对于下一个解析(1
),我们需要解析pExpr
,它本身可以是pIf
或pApply
。好吧,这不是if,所以我们尝试apply,它本身尝试pTerm'
,尝试pTerm
,尝试pBool
,失败,然后是pNum
,哪个成功了!然后pTerm
成功Num 1.0
,pTerm'
成功Term (Num 1.0)
,这意味着pExpr
成功Term (Num 1.0)
,然后通过cond
进入{{1}}变量......对吗?嗯,显然不是,因为它失败了!我不明白为什么它会在这里失败。
答案 0 :(得分:3)
您没有吃掉所有空格,而then
和else
被解释为标识符。 lexeme
规则可以在任何令牌之后占用空间。您的pIdentifier
需要明确检查它是否没有吞噬一个保留字。我解决了这些问题,并冒昧地使用了一些现有的组合器,并改为应用风格......
import Text.ParserCombinators.Parsec
import Control.Applicative hiding ((<|>))
data Expr = Term Term
| Apply Expr Expr
| If Expr Expr Expr
deriving (Show)
data Term = Bool Bool
| Num Double
| String String
| Identifier String
| Parens Expr
deriving (Show)
keywords = ["if", "then", "else", "True", "False"]
lexeme p = p <* spaces
schar = lexeme . char
keyword k = lexeme . try $
string k <* notFollowedBy alphaNum
pBool :: Parser Bool
pBool = (True <$ keyword "True") <|> (False <$ keyword "False")
pDouble :: Parser Double
pDouble = lexeme $ do
ds <- many1 digit
option (read ds) $ do
char '.'
ds' <- many1 digit
return $ read (ds ++ "." ++ ds')
pString :: Parser String
pString = lexeme . between (char '"') (char '"') . many1 $ noneOf "\""
pIdentifier :: Parser String
pIdentifier = lexeme . try $ do
ident <- many1 letter
if ident `elem` keywords
then unexpected $ "reserved word " ++ show ident
else return ident
pParens :: Parser Expr
pParens = between (schar '(') (schar ')') pExpr
pTerm :: Parser Term
pTerm = choice [ Bool <$> pBool
, Num <$> pDouble
, String <$> pString
, Identifier <$> pIdentifier
, Parens <$> pParens
]
-- TODO: make this left-associative
pApply :: Parser Expr
pApply = do
term <- pTerm'
option term $
Apply term <$> pApply
-- pulls "parens" expressions out of terms
pTerm' :: Parser Expr
pTerm' = do
term <- pTerm
case term of
Parens expr -> return expr
_ -> return $ Term term
pIf :: Parser Expr
pIf = If <$ keyword "if" <*> pExpr
<* keyword "then" <*> pExpr
<* keyword "else" <*> pExpr
pExpr :: Parser Expr
pExpr = pIf <|> pApply
test parser = parse (spaces *> parser <* eof) ""
答案 1 :(得分:1)
您需要进行一些更改。
pExpr :: Parser Expr
pExpr = try pIf <|> pTerm'
pIf :: Parser Expr
pIf = do
keyword "if"
spaces
cond <- pExpr
keyword "then"
spaces
ifTrue <- pExpr
keyword "else"
spaces
ifFalse <- pExpr
return $ If cond ifTrue ifFalse