Cleaned up the parsing code
This commit is contained in:
parent
8158557bb9
commit
52bfdd126b
170
Nix/Parser.hs
170
Nix/Parser.hs
|
@ -25,27 +25,43 @@ nixApp = go <$> some (whiteSpace *> nixTerm True)
|
||||||
|
|
||||||
nixTerm :: Bool -> Parser NExpr
|
nixTerm :: Bool -> Parser NExpr
|
||||||
nixTerm allowLambdas = choice
|
nixTerm allowLambdas = choice
|
||||||
[ mkInt <$> decimal <?> "integer"
|
[ nixInt
|
||||||
|
, nixBool
|
||||||
, (string "true" *> pure (mkBool True)) <?> "bool"
|
, nixNull
|
||||||
, (string "false" *> pure (mkBool False)) <?> "bool"
|
, nixParens
|
||||||
, (string "null" *> pure mkNull) <?> "null"
|
, nixList
|
||||||
|
, nixPath
|
||||||
, between (symbolic '(') (symbolic ')') nixApp
|
|
||||||
<?> "parens"
|
|
||||||
|
|
||||||
, between (symbolic '[') (symbolic ']')
|
|
||||||
(Fix . NList <$> many (nixTerm False))
|
|
||||||
<?> "list"
|
|
||||||
|
|
||||||
, try (do chars <- some (satisfy isPathChar)
|
|
||||||
trace ("Path chars: " ++ show chars) $ return ()
|
|
||||||
guard ('/' `elem` chars)
|
|
||||||
return $ mkPath chars)
|
|
||||||
|
|
||||||
, maybeSetOrLambda allowLambdas
|
, maybeSetOrLambda allowLambdas
|
||||||
]
|
]
|
||||||
|
|
||||||
|
nixInt :: Parser NExpr
|
||||||
|
nixInt = mkInt <$> decimal <?> "integer"
|
||||||
|
|
||||||
|
nixBool :: Parser NExpr
|
||||||
|
nixBool = (string "true" *> pure (mkBool True))
|
||||||
|
<|> (string "false" *> pure (mkBool False))
|
||||||
|
<?> "bool"
|
||||||
|
|
||||||
|
nixNull :: Parser NExpr
|
||||||
|
nixNull = string "null" *> pure mkNull <?> "null"
|
||||||
|
|
||||||
|
nixParens :: Parser NExpr
|
||||||
|
nixParens = between (symbolic '(') (symbolic ')') nixApp <?> "parens"
|
||||||
|
|
||||||
|
nixList :: Parser NExpr
|
||||||
|
nixList = between (symbolic '[') (symbolic ']')
|
||||||
|
(Fix . NList <$> many (nixTerm False))
|
||||||
|
<?> "list"
|
||||||
|
|
||||||
|
nixPath :: Parser NExpr
|
||||||
|
nixPath = try $ do
|
||||||
|
chars <- some (satisfy isPathChar)
|
||||||
|
trace ("Path chars: " ++ show chars) $ return ()
|
||||||
|
guard ('/' `elem` chars)
|
||||||
|
return $ mkPath chars
|
||||||
|
where
|
||||||
|
isPathChar c = isAlpha c || c `Prelude.elem` ".:/"
|
||||||
|
|
||||||
maybeSetOrLambda :: Bool -> Parser NExpr
|
maybeSetOrLambda :: Bool -> Parser NExpr
|
||||||
maybeSetOrLambda allowLambdas = do
|
maybeSetOrLambda allowLambdas = do
|
||||||
trace "maybeSetOrLambda" $ return ()
|
trace "maybeSetOrLambda" $ return ()
|
||||||
|
@ -66,17 +82,6 @@ maybeSetOrLambda allowLambdas = do
|
||||||
else error "Unexpected lambda"
|
else error "Unexpected lambda"
|
||||||
else keyName <?> "string"
|
else keyName <?> "string"
|
||||||
|
|
||||||
isPathChar :: Char -> Bool
|
|
||||||
isPathChar c = isAlpha c || c `Prelude.elem` ".:/"
|
|
||||||
|
|
||||||
oneChar :: Parser NExpr
|
|
||||||
oneChar = mkStr . singleton <$> anyChar
|
|
||||||
|
|
||||||
stringChar :: Parser NExpr
|
|
||||||
stringChar = char '\\' *> oneChar
|
|
||||||
<|> (string "${" *> nixApp <* char '}')
|
|
||||||
<|> (mkStr . pack <$> many (noneOf "\"\\"))
|
|
||||||
|
|
||||||
symName :: Parser Text
|
symName :: Parser Text
|
||||||
symName = do
|
symName = do
|
||||||
chars <- some (satisfy (\c -> isAlpha c || c == '.'))
|
chars <- some (satisfy (\c -> isAlpha c || c == '.'))
|
||||||
|
@ -89,38 +94,30 @@ stringish
|
||||||
= (char '"' *>
|
= (char '"' *>
|
||||||
(Fix . NConcat <$> manyTill stringChar (char '"')))
|
(Fix . NConcat <$> manyTill stringChar (char '"')))
|
||||||
<|> (char '$' *> between (symbolic '{') (symbolic '}') nixApp)
|
<|> (char '$' *> between (symbolic '{') (symbolic '}') nixApp)
|
||||||
|
where
|
||||||
keyName :: Parser NExpr
|
stringChar :: Parser NExpr
|
||||||
keyName = (stringish <|> (mkSym <$> symName)) <* whiteSpace
|
stringChar = char '\\' *> oneChar
|
||||||
|
<|> (string "${" *> nixApp <* char '}')
|
||||||
nvPair :: Parser (NExpr, NExpr)
|
<|> (mkStr . pack <$> many (noneOf "\"\\"))
|
||||||
nvPair = (,) <$> keyName
|
where
|
||||||
<*> (symbolic '=' *> nixApp)
|
oneChar = mkStr . singleton <$> anyChar
|
||||||
|
|
||||||
argExpr :: Parser NExpr
|
argExpr :: Parser NExpr
|
||||||
argExpr = (Fix . NArgSet . Map.fromList <$> argList)
|
argExpr = (Fix . NArgSet . Map.fromList <$> argList)
|
||||||
<|> ((mkSym <$> symName) <?> "argname")
|
<|> ((mkSym <$> symName) <?> "argname")
|
||||||
|
where
|
||||||
|
argList = between (symbolic '{') (symbolic '}')
|
||||||
|
((argName <* whiteSpace) `sepBy` symbolic ',')
|
||||||
|
<?> "arglist"
|
||||||
|
|
||||||
argList :: Parser [(Text, Maybe NExpr)]
|
argName = (,) <$> (symName <* whiteSpace)
|
||||||
argList = between (symbolic '{') (symbolic '}')
|
<*> optional (try (symbolic '?' *> nixApp))
|
||||||
((argName <* whiteSpace) `sepBy` symbolic ',')
|
1
|
||||||
<?> "arglist"
|
nvPair :: Parser (NExpr, NExpr)
|
||||||
|
nvPair = (,) <$> keyName <*> (symbolic '=' *> nixApp)
|
||||||
|
|
||||||
argName :: Parser (Text, Maybe NExpr)
|
keyName :: Parser NExpr
|
||||||
argName = (,) <$> (symName <* whiteSpace)
|
keyName = (stringish <|> (mkSym <$> symName)) <* whiteSpace
|
||||||
<*> optional (try (symbolic '?' *> nixApp))
|
|
||||||
|
|
||||||
-- whiteSymbolic :: Char -> Parser Char
|
|
||||||
-- whiteSymbolic c = whiteSpace *> symbolic c
|
|
||||||
|
|
||||||
lookaheadForSet :: Parser Bool
|
|
||||||
lookaheadForSet = do
|
|
||||||
trace "lookaheadForSet" $ return ()
|
|
||||||
x <- (symbolic '{' *> return True) <|> return False
|
|
||||||
if not x then return x else do
|
|
||||||
y <- (keyName *> return True) <|> return False
|
|
||||||
if not y then return y else
|
|
||||||
(symbolic '=' *> return True) <|> return False
|
|
||||||
|
|
||||||
setOrArgs :: Parser NExpr
|
setOrArgs :: Parser NExpr
|
||||||
setOrArgs = do
|
setOrArgs = do
|
||||||
|
@ -143,5 +140,68 @@ setOrArgs = do
|
||||||
symbolic ':' *> ((Fix .) . NAbs <$> pure args <*> nixApp)
|
symbolic ':' *> ((Fix .) . NAbs <$> pure args <*> nixApp)
|
||||||
<|> pure args
|
<|> pure args
|
||||||
|
|
||||||
|
lookaheadForSet :: Parser Bool
|
||||||
|
lookaheadForSet = do
|
||||||
|
trace "lookaheadForSet" $ return ()
|
||||||
|
x <- (symbolic '{' *> return True) <|> return False
|
||||||
|
if not x then return x else do
|
||||||
|
y <- (keyName *> return True) <|> return False
|
||||||
|
if not y then return y else
|
||||||
|
(symbolic '=' *> return True) <|> return False
|
||||||
|
|
||||||
parseNixFile :: MonadIO m => FilePath -> m (Result NExpr)
|
parseNixFile :: MonadIO m => FilePath -> m (Result NExpr)
|
||||||
parseNixFile = parseFromFileEx nixApp
|
parseNixFile = parseFromFileEx nixApp
|
||||||
|
|
||||||
|
{-
|
||||||
|
|
||||||
|
Grammar of the Nix language (LL(n)). I conditionalize terms in the grammar
|
||||||
|
with a predicate suffix in square brackets. If the predicate fails, we
|
||||||
|
back-track. WS is used to indicate where arbitrary whitespace is allowed.
|
||||||
|
|
||||||
|
top ::= app
|
||||||
|
|
||||||
|
Applied expressions, or "expr expr", express function application. Since they
|
||||||
|
do not mean this within lists, we must call it out as a separate grammar rule so
|
||||||
|
that we can make clear when it is allowed.
|
||||||
|
|
||||||
|
app ::= expr WS+ app | (epsilon)
|
||||||
|
|
||||||
|
expr ::= atom
|
||||||
|
| '(' app ')'
|
||||||
|
| '[' list_members ']'
|
||||||
|
| "rec"[opt] '{' set_members[one kv_pair exists] '}'
|
||||||
|
| argspec ':' app
|
||||||
|
|
||||||
|
atom ::= INTEGER
|
||||||
|
| "true" | "false"
|
||||||
|
| "null"
|
||||||
|
| CHAR(0-9A-Za-z_./)+[elem '/']
|
||||||
|
| '"' string '"'
|
||||||
|
|
||||||
|
Strings are a bit special in that not only do they observe escaping conventions,
|
||||||
|
but they allow for interpolation of arbitrary Nix expressions. This means
|
||||||
|
they form a sub-grammar, so we assume a lexical context switch here.
|
||||||
|
|
||||||
|
string ::= string_elem string | (epsilon)
|
||||||
|
|
||||||
|
string_elem ::= '\' ANYCHAR | subexpr | ANYCHAR+
|
||||||
|
|
||||||
|
subexpr ::= "${" WS* app "}"
|
||||||
|
|
||||||
|
list_members ::= expr WS+ list_members | (epsilon)
|
||||||
|
|
||||||
|
set_members ::= kv_pair WS* ';' WS* set_members | (epsilon)
|
||||||
|
|
||||||
|
kv_pair ::= stringish WS* '=' WS* app
|
||||||
|
|
||||||
|
stringish ::= string | CHAR(0-9A-Za-z_.)+ | subexpr
|
||||||
|
|
||||||
|
argspec ::= CHAR(0-9A-Za-z_)+ | '{' arg_list '}'
|
||||||
|
|
||||||
|
arg_list ::= arg_specifier | arg_specifier ',' arg_list
|
||||||
|
|
||||||
|
arg_specifier ::= CHAR(0-9A-Za-z_)+ default_value[opt]
|
||||||
|
|
||||||
|
default_value ::= '?' app
|
||||||
|
|
||||||
|
-}
|
||||||
|
|
Loading…
Reference in a new issue