2022-05-02 11:13:13 -04:00
|
|
|
|
module Quox.Lexer
|
|
|
|
|
|
|
|
|
|
import Quox.Error
|
|
|
|
|
|
|
|
|
|
import Data.String
|
|
|
|
|
import public Text.Lexer
|
2022-05-02 16:40:28 -04:00
|
|
|
|
import Generics.Derive
|
2022-05-02 11:13:13 -04:00
|
|
|
|
|
2022-05-02 16:38:37 -04:00
|
|
|
|
%default total
|
2022-05-02 16:40:28 -04:00
|
|
|
|
%language ElabReflection
|
2022-05-02 16:38:37 -04:00
|
|
|
|
|
2022-05-02 11:13:13 -04:00
|
|
|
|
|
|
|
|
|
public export
|
|
|
|
|
record Error where
|
|
|
|
|
constructor Err
|
|
|
|
|
line, col : Int
|
|
|
|
|
char : Char
|
|
|
|
|
|
|
|
|
|
public export
|
|
|
|
|
data Punc
|
|
|
|
|
= LParen | RParen
|
|
|
|
|
| LSquare | RSquare
|
|
|
|
|
| LBrace | RBrace
|
|
|
|
|
| Comma
|
|
|
|
|
| Colon | DblColon
|
|
|
|
|
| Arrow | DblArrow
|
|
|
|
|
| Times | Triangle
|
|
|
|
|
| Wild
|
|
|
|
|
|
2022-05-02 16:40:28 -04:00
|
|
|
|
%runElab derive "Punc" [Generic, Meta, Eq, Ord, DecEq, Show]
|
2022-05-02 11:13:13 -04:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
public export
|
|
|
|
|
data Kind
|
|
|
|
|
= P Punc
|
|
|
|
|
| Name | Symbol
|
|
|
|
|
|
2022-05-02 16:40:28 -04:00
|
|
|
|
%runElab derive "Kind" [Generic, Meta, Eq, Ord, DecEq, Show]
|
2022-05-02 11:13:13 -04:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
export
|
|
|
|
|
TokenKind Kind where
|
|
|
|
|
TokType (P _) = ()
|
|
|
|
|
TokType Name = String
|
|
|
|
|
TokType Symbol = String
|
|
|
|
|
|
|
|
|
|
tokValue (P _) _ = ()
|
|
|
|
|
tokValue Name x = x
|
|
|
|
|
tokValue Symbol x = assert_total strTail x
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
Token' = Token (Maybe Kind)
|
|
|
|
|
Token = Token Kind
|
|
|
|
|
|
|
|
|
|
TokenMap' = TokenMap Token'
|
|
|
|
|
TokenMap = TokenMap Token
|
|
|
|
|
|
|
|
|
|
nameStart = pred $ \c => isAlpha c || c == '_'
|
|
|
|
|
nameCont = pred $ \c => isAlphaNum c || c == '_' || c == '\''
|
|
|
|
|
|
|
|
|
|
name = nameStart <+> many nameCont <+> reject nameCont
|
|
|
|
|
|
|
|
|
|
wild = exact "_" <+> reject nameCont
|
|
|
|
|
|
|
|
|
|
%hide Text.Lexer.symbol
|
|
|
|
|
symbol = exact "'" <+> name
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
tokens = toTokenMap [
|
|
|
|
|
(lineComment (exact "--"), Nothing),
|
|
|
|
|
(blockComment (exact "{-") (exact "-}"), Nothing),
|
|
|
|
|
(spaces, Nothing),
|
|
|
|
|
|
|
|
|
|
(exact "(", Just $ P LParen), (exact ")", Just $ P RParen),
|
|
|
|
|
(exact "[", Just $ P LSquare), (exact "]", Just $ P RSquare),
|
|
|
|
|
(exact "{", Just $ P LBrace), (exact "}", Just $ P RBrace),
|
|
|
|
|
(exact ",", Just $ P Comma),
|
|
|
|
|
(exact "::" <|> exact "∷", Just $ P DblColon),
|
|
|
|
|
(exact ":", Just $ P Colon),
|
|
|
|
|
|
|
|
|
|
(exact "->" <|> exact "→", Just $ P Arrow),
|
|
|
|
|
(exact "=>" <|> exact "⇒", Just $ P DblArrow),
|
|
|
|
|
(exact "**" <|> exact "×", Just $ P Times),
|
|
|
|
|
(exact "<<" <|> exact "⊲", Just $ P Triangle),
|
|
|
|
|
(wild, Just $ P Wild),
|
|
|
|
|
|
|
|
|
|
(name, Just Name), (symbol, Just Symbol)
|
|
|
|
|
]
|
|
|
|
|
|
|
|
|
|
sequenceT : Token (Maybe Kind) -> Maybe (Token Kind)
|
|
|
|
|
sequenceT tok =
|
|
|
|
|
case tok.kind of
|
|
|
|
|
Just k => Just $ {kind := k} tok
|
|
|
|
|
Nothing => Nothing
|
|
|
|
|
|
|
|
|
|
export
|
|
|
|
|
lex : MonadThrow Error m => String -> m (List (WithBounds Token))
|
|
|
|
|
lex str =
|
|
|
|
|
let (res, (line, col, str)) = lex tokens str in
|
|
|
|
|
case asList str of
|
|
|
|
|
[] => pure $ mapMaybe (traverse sequenceT) res
|
|
|
|
|
c :: _ => throw $ Err {line, col, char = c}
|