Compare commits

...

4 commits

Author SHA1 Message Date
e13cd50175 pokes in TAP 2022-05-04 00:49:18 +02:00
fa5beb4e2b decimal numbers 2022-05-04 00:49:09 +02:00
699c6a5ca1 token stuff 2022-05-03 02:03:22 +02:00
a510737462 .gitignore 2022-05-03 02:02:25 +02:00
4 changed files with 124 additions and 78 deletions

2
.gitignore vendored
View file

@ -3,3 +3,5 @@ build
depends depends
*.ipkg *.ipkg
*~ *~
quox
quox-tests

View file

@ -4,6 +4,7 @@ import Quox.Error
import Data.String import Data.String
import public Text.Lexer import public Text.Lexer
import public Text.Lexer.Tokenizer
import Generics.Derive import Generics.Derive
%default total %default total
@ -13,6 +14,7 @@ import Generics.Derive
public export public export
record Error where record Error where
constructor Err constructor Err
reason : StopReason
line, col : Int line, col : Int
char : Char char : Char
@ -30,32 +32,23 @@ data Punc
%runElab derive "Punc" [Generic, Meta, Eq, Ord, DecEq, Show] %runElab derive "Punc" [Generic, Meta, Eq, Ord, DecEq, Show]
||| zero and one are separate because they are
||| quantity & dimension constants
public export
data Number = Zero | One | Other Nat
%runElab derive "Number" [Generic, Meta, Eq, Ord, DecEq, Show]
public export public export
data Kind data Token
= P Punc = P Punc
| Name | Symbol | Name String | Symbol String
| N Number
%runElab derive "Kind" [Generic, Meta, Eq, Ord, DecEq, Show] %runElab derive "Token" [Generic, Meta, Eq, Ord, DecEq, Show]
export
TokenKind Kind where
TokType (P _) = ()
TokType Name = String
TokType Symbol = String
tokValue (P _) _ = ()
tokValue Name x = x
tokValue Symbol x = assert_total strTail x
Token' = Token (Maybe Kind)
Token = Token Kind
TokenMap' = TokenMap Token'
TokenMap = TokenMap Token
nameStart = pred $ \c => isAlpha c || c == '_' nameStart = pred $ \c => isAlpha c || c == '_'
nameCont = pred $ \c => isAlphaNum c || c == '_' || c == '\'' nameCont = pred $ \c => isAlphaNum c || c == '_' || c == '\''
@ -67,37 +60,70 @@ wild = exact "_" <+> reject nameCont
symbol = exact "'" <+> name symbol = exact "'" <+> name
tokens = toTokenMap [ decimal : Lexer
(lineComment (exact "--"), Nothing), decimal =
(blockComment (exact "{-") (exact "-}"), Nothing), digit <+> opt (many (digit <|> is '_') <+> digit)
(spaces, Nothing),
(exact "(", Just $ P LParen), (exact ")", Just $ P RParen), natToNumber : Nat -> Number
(exact "[", Just $ P LSquare), (exact "]", Just $ P RSquare), natToNumber 0 = Zero
(exact "{", Just $ P LBrace), (exact "}", Just $ P RBrace), natToNumber 1 = One
(exact ",", Just $ P Comma), natToNumber k = Other k
(exact "::" <|> exact "", Just $ P DblColon),
(exact ":", Just $ P Colon),
(exact "->" <|> exact "", Just $ P Arrow), toDigit : Char -> Nat
(exact "=>" <|> exact "", Just $ P DblArrow), toDigit c = cast $ ord c - ord '0'
(exact "**" <|> exact "×", Just $ P Times),
(exact "<<" <|> exact "", Just $ P Triangle),
(wild, Just $ P Wild),
(name, Just Name), (symbol, Just Symbol) makeDec' : Nat -> String -> Maybe Nat
makeDec' acc x with (asList x)
makeDec' acc "" | [] = pure acc
makeDec' acc (strCons '_' str) | '_' :: lst = makeDec' acc str | lst
makeDec' acc (strCons d str) | d :: lst =
if d >= '0' && d <= '9' then
makeDec' (acc * 10 + toDigit d) str | lst
else
Nothing
makeDec = fromMaybe 0 . makeDec' 0
skip : Lexer -> Tokenizer (Maybe a)
skip lex = match lex $ const Nothing
simple : List String -> a -> Tokenizer (Maybe a)
simple str x = match (choice $ map exact str) $ const $ Just x
choice : (xs : List (Tokenizer a)) -> {auto 0 _ : So (isCons xs)} -> Tokenizer a
choice (t :: ts) = foldl (\a, b => a <|> b) t ts
tokens : Tokenizer (Maybe Token)
tokens = choice [
skip $ lineComment $ exact "--",
skip $ blockComment (exact "{-") (exact "-}"),
skip spaces,
simple ["("] $ P LParen, simple [")"] $ P RParen,
simple ["["] $ P LSquare, simple ["]"] $ P RSquare,
simple ["{"] $ P LBrace, simple ["}"] $ P RBrace,
simple [","] $ P Comma,
simple ["::", ""] $ P DblColon,
simple [":"] $ P Colon,
simple ["->", ""] $ P Arrow,
simple ["=>", ""] $ P DblArrow,
simple ["**", "×"] $ P Times,
simple ["<<", ""] $ P Triangle,
match wild $ const $ Just $ P Wild,
match name $ Just . Name,
match symbol $ Just . Symbol . assert_total strTail,
-- [todo] other bases?
match (some $ digit <|> exact "_") $ Just . N . natToNumber . makeDec
] ]
sequenceT : Token (Maybe Kind) -> Maybe (Token Kind)
sequenceT tok =
case tok.kind of
Just k => Just $ {kind := k} tok
Nothing => Nothing
export export
lex : MonadThrow Error m => String -> m (List (WithBounds Token)) lex : MonadThrow Error m => String -> m (List (WithBounds Token))
lex str = lex str =
let (res, (line, col, str)) = lex tokens str in let (res, (reason, line, col, str)) = lex tokens str in
case asList str of case reason of
[] => pure $ mapMaybe (traverse sequenceT) res EndInput => pure $ mapMaybe sequence res
c :: _ => throw $ Err {line, col, char = c} _ => let char = assert_total strIndex str 0 in
throw $ Err {reason, line, col, char}

View file

@ -1,4 +1,5 @@
module TAP module TAP
-- [todo] extract this and Quox.Error to their own packages
import public Quox.Error import public Quox.Error
@ -45,7 +46,7 @@ All ToInfo es => ToInfo (OneOf es) where
export %inline ToInfo () where toInfo () = [] export %inline ToInfo () where toInfo () = []
export Show a => ToInfo (List (String, a)) where toInfo = map (map show) export %inline Show a => ToInfo (List (String, a)) where toInfo = map (map show)
export export
@ -121,15 +122,17 @@ export %inline
header : List a -> String header : List a -> String
header tests = "1..\{show $ length tests}" header tests = "1..\{show $ length tests}"
private
makePrefix : SnocList String -> String makePrefix : SnocList String -> String
makePrefix [<] = "" makePrefix [<] = ""
makePrefix (xs :< x) = foldr (\a, b => "\{a}/\{b}") x xs makePrefix (xs :< x) = foldr (\a, b => "\{a}/\{b}") x xs
private %inline
withPrefix : SnocList String -> TestBase -> Test withPrefix : SnocList String -> TestBase -> Test
withPrefix pfx b = One $ {label := "[\{makePrefix pfx}] \{b.label}"} b withPrefix pfx b = One $ {label := "[\{makePrefix pfx}] \{b.label}"} b
mutual mutual
export export %inline
flattenWith : SnocList String -> List Test -> List Test flattenWith : SnocList String -> List Test -> List Test
flattenWith pfx = concatMap (flatten1With pfx) flattenWith pfx = concatMap (flatten1With pfx)
@ -138,11 +141,11 @@ mutual
flatten1With pfx (One t) = [withPrefix pfx t] flatten1With pfx (One t) = [withPrefix pfx t]
flatten1With pfx (Group x ts) = flattenWith (pfx :< x) ts flatten1With pfx (Group x ts) = flattenWith (pfx :< x) ts
export export %inline
flatten : List Test -> List Test flatten : List Test -> List Test
flatten = flattenWith [<] flatten = flattenWith [<]
export export %inline
flatten1 : Test -> List Test flatten1 : Test -> List Test
flatten1 = flatten1With [<] flatten1 = flatten1With [<]

View file

@ -6,32 +6,36 @@ import TAP
export export
ToInfo Error where ToInfo Error where
toInfo (Err line col char) = toInfo (Err reason line col char) =
[("line", show line), ("col", show col), ("char", show char)] [("reason", show reason),
("line", show line),
("col", show col),
("char", show char)]
data ExtraError data ExtraError
= WrongAnswer (List Kind) (List Kind) = WrongAnswer (List Token) (List Token)
| TestFailed (List Kind) | TestFailed (List Token)
ToInfo ExtraError where ToInfo ExtraError where
toInfo (WrongAnswer exp got) = toInfo (WrongAnswer exp got) =
[("expected", show exp), ("received", show got)] [("expected", show exp), ("received", show got)]
toInfo (TestFailed got) = [("failed", show got)] toInfo (TestFailed got) =
[("failed", show got)]
parameters (label : String) (input : String) parameters (label : String) (input : String)
acceptsSuchThat' : (List Kind -> Maybe ExtraError) -> Test acceptsSuchThat' : (List Token -> Maybe ExtraError) -> Test
acceptsSuchThat' p = test {es = [Lexer.Error, ExtraError]} label $ do acceptsSuchThat' p = test {es = [Lexer.Error, ExtraError]} label $ do
res <- map (kind . val) <$> lex input res <- map val <$> lex input
case p res of case p res of
Just err => throw err Just err => throw err
Nothing => pure () Nothing => pure ()
acceptsSuchThat : (List Kind -> Bool) -> Test acceptsSuchThat : (List Token -> Bool) -> Test
acceptsSuchThat p = acceptsSuchThat' $ \res => acceptsSuchThat p = acceptsSuchThat' $ \res =>
if p res then Nothing else Just $ TestFailed res if p res then Nothing else Just $ TestFailed res
acceptsWith : List Kind -> Test acceptsWith : List Token -> Test
acceptsWith expect = acceptsSuchThat' $ \res => acceptsWith expect = acceptsSuchThat' $ \res =>
if res == expect then Nothing else Just $ WrongAnswer expect res if res == expect then Nothing else Just $ WrongAnswer expect res
@ -40,13 +44,13 @@ parameters (label : String) (input : String)
rejects : Test rejects : Test
rejects = testThrows {es = [Lexer.Error]} label $ delay $ rejects = testThrows {es = [Lexer.Error]} label $ delay $
map (kind . val) <$> lex input map val <$> lex input
parameters (input : String) {default False esc : Bool} parameters (input : String) {default False esc : Bool}
show' : String -> String show' : String -> String
show' s = if esc then show s else "\"\{s}\"" show' s = if esc then show s else "\"\{s}\""
acceptsWith' : List Kind -> Test acceptsWith' : List Token -> Test
acceptsWith' = acceptsWith (show' input) input acceptsWith' = acceptsWith (show' input) input
accepts' : Test accepts' : Test
@ -73,12 +77,12 @@ tests = "lexer" :- [
"punctuation" :- [ "punctuation" :- [
acceptsWith' "({[:,::]})" acceptsWith' "({[:,::]})"
[P LParen, P LBrace, P LSquare, [P LParen, P LBrace, P LSquare,
P Colon, P Comma, P DblColon, P Colon, P Comma, P DblColon,
P RSquare, P RBrace, P RParen], P RSquare, P RBrace, P RParen],
acceptsWith' " ( { [ : , :: ] } ) " acceptsWith' " ( { [ : , :: ] } ) "
[P LParen, P LBrace, P LSquare, [P LParen, P LBrace, P LSquare,
P Colon, P Comma, P DblColon, P Colon, P Comma, P DblColon,
P RSquare, P RBrace, P RParen], P RSquare, P RBrace, P RParen],
acceptsWith' "-> → => ⇒ ** × << ⊲ ∷" acceptsWith' "-> → => ⇒ ** × << ⊲ ∷"
[P Arrow, P Arrow, P DblArrow, P DblArrow, [P Arrow, P Arrow, P DblArrow, P DblArrow,
@ -87,19 +91,30 @@ tests = "lexer" :- [
], ],
"names & symbols" :- [ "names & symbols" :- [
acceptsWith' "a" [Name], acceptsWith' "a" [Name "a"],
acceptsWith' "abc" [Name], acceptsWith' "abc" [Name "abc"],
acceptsWith' "_a" [Name], acceptsWith' "_a" [Name "_a"],
acceptsWith' "a_" [Name], acceptsWith' "a_" [Name "a_"],
acceptsWith' "a_b" [Name], acceptsWith' "a_b" [Name "a_b"],
acceptsWith' "abc'" [Name], acceptsWith' "abc'" [Name "abc'"],
acceptsWith' "a'b'c''" [Name], acceptsWith' "a'b'c''" [Name "a'b'c''"],
acceptsWith' "abc123" [Name], acceptsWith' "abc123" [Name "abc123"],
acceptsWith' "ab cd" [Name, Name], acceptsWith' "_1" [Name "_1"],
acceptsWith' "ab{--}cd" [Name, Name], acceptsWith' "ab cd" [Name "ab", Name "cd"],
acceptsWith' "'a" [Symbol], acceptsWith' "ab{--}cd" [Name "ab", Name "cd"],
acceptsWith' "'ab" [Symbol], acceptsWith' "'a" [Symbol "a"],
acceptsWith' "'_b" [Symbol], acceptsWith' "'ab" [Symbol "ab"],
acceptsWith' "'_b" [Symbol "_b"],
rejects' "'" rejects' "'"
],
"numbers" :- [
acceptsWith' "0" [N Zero],
acceptsWith' "1" [N One],
acceptsWith' "2" [N $ Other 2],
acceptsWith' "69" [N $ Other 69],
acceptsWith' "1_000" [N $ Other 1000],
todo "octal",
todo "hex"
] ]
] ]