Compare commits
5 Commits
named-core
...
test-synta
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
a6ff46e2bf | ||
|
|
d3a25742f1 | ||
|
|
650a4cf22f | ||
|
|
baf9d79285 | ||
|
|
c7aed71db5 |
18
.ghci
18
.ghci
@@ -1,18 +0,0 @@
|
|||||||
:set -XOverloadedStrings
|
|
||||||
|
|
||||||
:set -package process
|
|
||||||
|
|
||||||
:{
|
|
||||||
import System.Exit qualified
|
|
||||||
import System.Process qualified
|
|
||||||
|
|
||||||
_reload_and_make _ = do
|
|
||||||
p <- System.Process.spawnCommand "make -f Makefile_happysrcs"
|
|
||||||
r <- System.Process.waitForProcess p
|
|
||||||
case r of
|
|
||||||
System.Exit.ExitSuccess -> pure ":reload"
|
|
||||||
_ -> pure ""
|
|
||||||
:}
|
|
||||||
|
|
||||||
:def! r _reload_and_make
|
|
||||||
|
|
||||||
17
CHANGELOG.md
17
CHANGELOG.md
@@ -1,17 +0,0 @@
|
|||||||
# unreleased
|
|
||||||
|
|
||||||
* New tag syntax:
|
|
||||||
```hs
|
|
||||||
case x of
|
|
||||||
{ 1 -> something
|
|
||||||
; 2 -> another
|
|
||||||
}
|
|
||||||
```
|
|
||||||
is now written as
|
|
||||||
```hs
|
|
||||||
case x of
|
|
||||||
{ <1> -> something
|
|
||||||
; <2> -> another
|
|
||||||
}
|
|
||||||
```
|
|
||||||
|
|
||||||
@@ -1,25 +0,0 @@
|
|||||||
HAPPY = happy
|
|
||||||
HAPPY_OPTS = -a -g -c
|
|
||||||
ALEX = alex
|
|
||||||
ALEX_OPTS = -g
|
|
||||||
|
|
||||||
SRC = src
|
|
||||||
CABAL_BUILD = dist-newstyle/build/x86_64-osx/ghc-9.6.2/rlp-0.1.0.0/build
|
|
||||||
|
|
||||||
all: parsers lexers
|
|
||||||
|
|
||||||
parsers: $(CABAL_BUILD)/Rlp/Parse.hs $(CABAL_BUILD)/Core/Parse.hs
|
|
||||||
lexers: $(CABAL_BUILD)/Rlp/Lex.hs $(CABAL_BUILD)/Core/Lex.hs
|
|
||||||
|
|
||||||
$(CABAL_BUILD)/Rlp/Parse.hs: $(SRC)/Rlp/Parse.y
|
|
||||||
$(HAPPY) $(HAPPY_OPTS) $< -o $@
|
|
||||||
|
|
||||||
$(CABAL_BUILD)/Rlp/Lex.hs: $(SRC)/Rlp/Lex.x
|
|
||||||
$(ALEX) $(ALEX_OPTS) $< -o $@
|
|
||||||
|
|
||||||
$(CABAL_BUILD)/Core/Parse.hs: $(SRC)/Core/Parse.y
|
|
||||||
$(HAPPY) $(HAPPY_OPTS) $< -o $@
|
|
||||||
|
|
||||||
$(CABAL_BUILD)/Core/Lex.hs: $(SRC)/Core/Lex.x
|
|
||||||
$(ALEX) $(ALEX_OPTS) $< -o $@
|
|
||||||
|
|
||||||
61
README.md
61
README.md
@@ -30,12 +30,12 @@ $ rlpc -ddump-opts t.hs
|
|||||||
|
|
||||||
### Potential Features
|
### Potential Features
|
||||||
Listed in order of importance.
|
Listed in order of importance.
|
||||||
- [x] ADTs
|
- [ ] ADTs
|
||||||
- [x] First-class functions
|
- [ ] First-class functions
|
||||||
- [ ] Higher-kinded types
|
- [ ] Higher-kinded types
|
||||||
- [ ] Typeclasses
|
- [ ] Typeclasses
|
||||||
- [x] Parametric polymorphism
|
- [ ] Parametric polymorphism
|
||||||
- [x] Hindley-Milner type inference
|
- [ ] Hindley-Milner type inference
|
||||||
- [ ] Newtype coercion
|
- [ ] Newtype coercion
|
||||||
- [ ] Parallelism
|
- [ ] Parallelism
|
||||||
|
|
||||||
@@ -66,59 +66,32 @@ Listed in order of importance.
|
|||||||
- [ ] TCO
|
- [ ] TCO
|
||||||
- [ ] DCE
|
- [ ] DCE
|
||||||
- [ ] Frontend
|
- [ ] Frontend
|
||||||
- [x] High-level language
|
- [ ] High-level language
|
||||||
- [x] AST
|
- [ ] AST
|
||||||
- [x] Lexer
|
- [ ] Lexer
|
||||||
- [x] Parser
|
- [ ] Parser
|
||||||
- [ ] Translation to the core language
|
- [ ] Translation to the core language
|
||||||
- [ ] Constraint solver
|
- [ ] Constraint solver
|
||||||
- [ ] `do`-notation
|
- [ ] `do`-notation
|
||||||
- [x] CLI
|
- [x] CLI
|
||||||
- [ ] Documentation
|
- [ ] Documentation
|
||||||
- [x] State transition rules
|
- [ ] State transition rules
|
||||||
- [ ] How does the evaluation model work?
|
- [ ] How does the evaluation model work?
|
||||||
- [ ] The Hindley-Milner type system
|
|
||||||
- [ ] CLI usage
|
- [ ] CLI usage
|
||||||
- [ ] Tail call optimisation
|
- [ ] Tail call optimisation
|
||||||
- [ ] Parsing rlp
|
- [x] Parsing rlp
|
||||||
- [ ] Tests
|
- [ ] Tests
|
||||||
- [x] Generic example programs
|
- [x] Generic example programs
|
||||||
- [ ] Parser
|
- [ ] Parser
|
||||||
|
|
||||||
### ~~December Release Plan~~
|
### December Release Plan
|
||||||
- [x] Tests
|
- [ ] Tests
|
||||||
- [ ] Core lexer
|
- [ ] Core lexer
|
||||||
- [ ] Core parser
|
- [ ] Core parser
|
||||||
- [x] Evaluation model
|
- [ ] Evaluation model
|
||||||
- [ ] Benchmarks
|
- [ ] Benchmarks
|
||||||
- [x] Stable Core lexer
|
- [ ] Stable Core lexer
|
||||||
- [x] Stable Core parser
|
- [ ] Stable Core parser
|
||||||
- [x] Stable evaluation model
|
- [ ] Stable evaluation model
|
||||||
- [x] Garbage Collection
|
- [ ] Garbage Collection
|
||||||
- [ ] Stable documentation for the evaluation model
|
- [ ] Stable documentation for the evaluation model
|
||||||
|
|
||||||
### January Release Plan
|
|
||||||
- [ ] Beta rl' to Core
|
|
||||||
- [ ] UX improvements
|
|
||||||
- [ ] Actual compiler errors -- no more unexceptional `error` calls
|
|
||||||
- [ ] Better CLI dump flags
|
|
||||||
- [ ] Annotate the AST with token positions for errors
|
|
||||||
|
|
||||||
### March Release Plan
|
|
||||||
- [ ] Tests
|
|
||||||
- [ ] rl' parser
|
|
||||||
- [ ] rl' lexer
|
|
||||||
|
|
||||||
### Indefinite Release Plan
|
|
||||||
|
|
||||||
This list is more concrete than the milestones, but likely further in the future
|
|
||||||
than the other release plans.
|
|
||||||
|
|
||||||
- [ ] Stable rl' to Core
|
|
||||||
- [ ] Core polish
|
|
||||||
- [ ] Better, stable parser
|
|
||||||
- [ ] Better, stable lexer
|
|
||||||
- [ ] Less hacky handling of named data
|
|
||||||
- [ ] Less hacky pragmas
|
|
||||||
- [ ] GM to LLVM
|
|
||||||
|
|
||||||
|
|||||||
@@ -112,3 +112,5 @@ The way around this is quite simple: simply offset the stack when w
|
|||||||
:end-before: -- << [ref/compileC]
|
:end-before: -- << [ref/compileC]
|
||||||
:caption: src/GM.hs
|
:caption: src/GM.hs
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
@@ -2,21 +2,16 @@ Lexing, Parsing, and Layouts
|
|||||||
============================
|
============================
|
||||||
|
|
||||||
The C-style languages of my previous experiences have all had quite trivial
|
The C-style languages of my previous experiences have all had quite trivial
|
||||||
lexical analysis stages: you ignore all whitespace and point out the symbols you
|
lexical analysis stages, peaking in complexity when I streamed tokens lazily in
|
||||||
recognise. If you don't recognise something, check if it's a literal or an
|
C. The task of tokenising a C-style language is very simple in description: you
|
||||||
identifier. Should it be neither, return an error.
|
ignore all whitespace and point out what you recognise. If you don't recognise
|
||||||
|
something, check if it's a literal or an identifier. Should it be neither,
|
||||||
|
return an error.
|
||||||
|
|
||||||
In contrast, both lexing and parsing a Haskell-like language poses a number of
|
On paper, both lexing and parsing a Haskell-like language seem to pose a few
|
||||||
greater challenges. Listed by ascending intimidation factor, some of the
|
greater challenges. Listed by ascending intimidation factor, some of the
|
||||||
potential roadblocks on my mind before making an attempt were:
|
potential roadblocks on my mind before making an attempt were:
|
||||||
|
|
||||||
* Context-sensitive keywords; Haskell allows for some words to be used as
|
|
||||||
identifiers in appropriate contexts, such as :code:`family`, :code:`role`,
|
|
||||||
:code:`as`. Reading a note_ found in `GHC's lexer`_, it appears that keywords
|
|
||||||
are only considered in bodies for which their use is relevant, e.g.
|
|
||||||
:code:`family` and :code:`role` in type declarations, :code:`as` after
|
|
||||||
:code:`case`; :code:`if`, :code:`then`, and :code:`else` in expressions, etc.
|
|
||||||
|
|
||||||
* Operators; Haskell has not only user-defined infix operators, but user-defined
|
* Operators; Haskell has not only user-defined infix operators, but user-defined
|
||||||
precedence levels and associativities. I recall using an algorithm that looked
|
precedence levels and associativities. I recall using an algorithm that looked
|
||||||
up infix, prefix, postfix, and even mixfix operators up in a global table to
|
up infix, prefix, postfix, and even mixfix operators up in a global table to
|
||||||
@@ -24,9 +19,17 @@ potential roadblocks on my mind before making an attempt were:
|
|||||||
stored in the table). I never modified the table at runtime, however this
|
stored in the table). I never modified the table at runtime, however this
|
||||||
could be a very nice solution for Haskell.
|
could be a very nice solution for Haskell.
|
||||||
|
|
||||||
|
* Context-sensitive keywords; Haskell allows for some words to be used as identifiers in
|
||||||
|
appropriate contexts, such as :code:`family`, :code:`role`, :code:`as`.
|
||||||
|
Reading a note_ found in `GHC's lexer`_,
|
||||||
|
it appears that keywords are only considered in bodies for which their use is
|
||||||
|
relevant, e.g. :code:`family` and :code:`role` in type declarations,
|
||||||
|
:code:`as` after :code:`case`; :code:`if`, :code:`then`, and :code:`else` in
|
||||||
|
expressions, etc.
|
||||||
|
|
||||||
* Whitespace sensitivity; While I was comfortable with the idea of a system
|
* Whitespace sensitivity; While I was comfortable with the idea of a system
|
||||||
similar to Python's INDENT/DEDENT tokens, Haskell's layout system is based on
|
similar to Python's INDENT/DEDENT tokens, Haskell seemed to use whitespace to
|
||||||
alignment and is very generous with line-folding.
|
section code in a way that *felt* different.
|
||||||
|
|
||||||
.. _note: https://gitlab.haskell.org/ghc/ghc/-/wikis/commentary/coding-style#2-using-notes
|
.. _note: https://gitlab.haskell.org/ghc/ghc/-/wikis/commentary/coding-style#2-using-notes
|
||||||
.. _GHC's lexer: https://gitlab.haskell.org/ghc/ghc/-/blob/master/compiler/GHC/Parser/Lexer.x#L1133
|
.. _GHC's lexer: https://gitlab.haskell.org/ghc/ghc/-/blob/master/compiler/GHC/Parser/Lexer.x#L1133
|
||||||
@@ -42,9 +45,9 @@ We will compare and contrast with Python's lexical analysis. Much to my dismay,
|
|||||||
Python uses newlines and indentation to separate statements and resolve scope
|
Python uses newlines and indentation to separate statements and resolve scope
|
||||||
instead of the traditional semicolons and braces found in C-style languages (we
|
instead of the traditional semicolons and braces found in C-style languages (we
|
||||||
may generally refer to these C-style languages as *explicitly-sectioned*).
|
may generally refer to these C-style languages as *explicitly-sectioned*).
|
||||||
Internally during tokenisation, when the Python lexer encounters a new line, the
|
Internally during tokenisation, when the Python lexer begins a new line, they
|
||||||
indentation of the new line is compared with that of the previous and the
|
compare the indentation of the new line with that of the previous and apply the
|
||||||
following rules are applied:
|
following rules:
|
||||||
|
|
||||||
1. If the new line has greater indentation than the previous, insert an INDENT
|
1. If the new line has greater indentation than the previous, insert an INDENT
|
||||||
token and push the new line's indentation level onto the indentation stack
|
token and push the new line's indentation level onto the indentation stack
|
||||||
@@ -57,37 +60,44 @@ following rules are applied:
|
|||||||
3. If the indentation is equal, insert a NEWLINE token to terminate the previous
|
3. If the indentation is equal, insert a NEWLINE token to terminate the previous
|
||||||
line, and leave it at that!
|
line, and leave it at that!
|
||||||
|
|
||||||
On the parser's end, the INDENT, DEDENT, and NEWLINE tokens are identical to
|
Parsing Python with the INDENT, DEDENT, and NEWLINE tokens is identical to
|
||||||
braces and semicolons. In developing our *layout* rules, we will follow in the
|
parsing a language with braces and semicolons. This is a solution pretty in line
|
||||||
pattern of translating the whitespace-sensitive source language to an explicitly
|
with Python's philosophy of the "one correct answer" (TODO: this needs a
|
||||||
sectioned language.
|
source). In developing our *layout* rules, we will follow in the pattern of
|
||||||
|
translating the whitespace-sensitive source language to an explicitly sectioned
|
||||||
|
language.
|
||||||
|
|
||||||
But What About Haskell?
|
But What About Haskell?
|
||||||
***********************
|
***********************
|
||||||
|
|
||||||
Parsing Haskell -- and thus rl' -- is only slightly more complex than Python,
|
We saw that Python, the most notable example of an implicitly sectioned
|
||||||
but the design is certainly more sensitive.
|
language, is pretty simple to lex. Why then am I so afraid of Haskell's layouts?
|
||||||
|
To be frank, I'm far less scared after asking myself this -- however there are
|
||||||
|
certainly some new complexities that Python needn't concern. Haskell has
|
||||||
|
implicit line *continuation*: forms written over multiple lines; indentation
|
||||||
|
styles often seen in Haskell are somewhat esoteric compared to Python's
|
||||||
|
"s/[{};]//".
|
||||||
|
|
||||||
.. code-block:: haskell
|
.. code-block:: haskell
|
||||||
|
|
||||||
-- line folds
|
-- line continuation
|
||||||
something = this is a
|
something = this is a
|
||||||
single expression
|
single expression
|
||||||
|
|
||||||
-- an extremely common style found in haskell
|
-- an extremely common style found in haskell
|
||||||
data Some = Data
|
data Python = Users
|
||||||
{ is :: Presented
|
{ are :: Crying
|
||||||
, in :: This
|
, right :: About
|
||||||
, silly :: Style
|
, now :: Sorry
|
||||||
}
|
}
|
||||||
|
|
||||||
-- another style oddity
|
-- another formatting oddity
|
||||||
-- note that this is not a single
|
-- note that this is not a single
|
||||||
-- continued line! `look at`,
|
-- continued line! `look at`,
|
||||||
-- `this odd`, and `alignment` are all
|
-- `this`, and `alignment` are all
|
||||||
-- discrete items!
|
-- separate expressions!
|
||||||
anotherThing = do look at
|
anotherThing = do look at
|
||||||
this odd
|
this
|
||||||
alignment
|
alignment
|
||||||
|
|
||||||
But enough fear, lets actually think about implementation. Firstly, some
|
But enough fear, lets actually think about implementation. Firstly, some
|
||||||
@@ -223,4 +233,3 @@ References
|
|||||||
|
|
||||||
* `Haskell syntax reference
|
* `Haskell syntax reference
|
||||||
<https://www.haskell.org/onlinereport/haskell2010/haskellch10.html>`_
|
<https://www.haskell.org/onlinereport/haskell2010/haskellch10.html>`_
|
||||||
|
|
||||||
|
|||||||
@@ -1,5 +0,0 @@
|
|||||||
Type Inference in rl'
|
|
||||||
=====================
|
|
||||||
|
|
||||||
rl' implements type inference via the Hindley-Milner type system.
|
|
||||||
|
|
||||||
@@ -32,7 +32,6 @@ html_theme = 'alabaster'
|
|||||||
imgmath_latex_preamble = r'''
|
imgmath_latex_preamble = r'''
|
||||||
\usepackage{amsmath}
|
\usepackage{amsmath}
|
||||||
\usepackage{tabularray}
|
\usepackage{tabularray}
|
||||||
\usepackage{syntax}
|
|
||||||
|
|
||||||
\newcommand{\transrule}[2]
|
\newcommand{\transrule}[2]
|
||||||
{\begin{tblr}{|rrrlc|}
|
{\begin{tblr}{|rrrlc|}
|
||||||
|
|||||||
@@ -1,67 +0,0 @@
|
|||||||
The Complete Syntax of rl'
|
|
||||||
==========================
|
|
||||||
|
|
||||||
WIP.
|
|
||||||
|
|
||||||
Provided is the complete syntax of rl' in (pseudo) EBNF. {A} represents zero or
|
|
||||||
more A's, [A] means optional A, and terminals are wrapped in 'single-quotes'.
|
|
||||||
|
|
||||||
.. math
|
|
||||||
:nowrap:
|
|
||||||
|
|
||||||
\setlength{\grammarparsep}{20pt plus 1pt minus 1pt}
|
|
||||||
\setlength{\grammarindent}{12em}
|
|
||||||
\begin{grammar}
|
|
||||||
<Decl> ::= <InfixDecl>
|
|
||||||
\alt <DataDecl>
|
|
||||||
\alt <TypeSig>
|
|
||||||
\alt <FunDef>
|
|
||||||
|
|
||||||
<InfixDecl> ::= <InfixWord> `litint' <Name>
|
|
||||||
<InfixWord> ::= `infix'
|
|
||||||
\alt `infixl'
|
|
||||||
\alt `infixr'
|
|
||||||
|
|
||||||
<DataDecl> ::= `data' `conname' {}
|
|
||||||
|
|
||||||
\end{grammar}
|
|
||||||
|
|
||||||
.. code-block:: bnf
|
|
||||||
|
|
||||||
Decl ::= InfixDecl
|
|
||||||
| DataDecl
|
|
||||||
| TypeSig
|
|
||||||
| FunDef
|
|
||||||
|
|
||||||
InfixDecl ::= InfixWord 'litint' Operator
|
|
||||||
InfixWord ::= 'infix'
|
|
||||||
| 'infixl'
|
|
||||||
| 'infixr'
|
|
||||||
|
|
||||||
DataDecl ::= 'data' 'conname' {'name'} '=' Data
|
|
||||||
DataCons ::= 'conname' {Type1} ['|' DataCons]
|
|
||||||
|
|
||||||
TypeSig ::= Var '::' Type
|
|
||||||
FunDef ::= Var {Pat1} '=' Expr
|
|
||||||
|
|
||||||
Type ::= Type1 {Type1}
|
|
||||||
-- note that (->) is right-associative,
|
|
||||||
-- and extends as far as possible
|
|
||||||
| Type '->' Type
|
|
||||||
Type1 ::= '(' Type ')'
|
|
||||||
| 'conname'
|
|
||||||
|
|
||||||
Pat ::= 'conname' Pat1 {Pat1}
|
|
||||||
| Pat 'consym' Pat
|
|
||||||
|
|
||||||
Pat1 ::= Literal
|
|
||||||
| 'conname'
|
|
||||||
| '(' Pat ')'
|
|
||||||
|
|
||||||
Literal ::= 'litint'
|
|
||||||
|
|
||||||
Var ::= 'varname'
|
|
||||||
| '(' 'varsym' ')'
|
|
||||||
Con ::= 'conname'
|
|
||||||
| '(' 'consym' ')'
|
|
||||||
|
|
||||||
@@ -1,17 +0,0 @@
|
|||||||
rl' Inference Rules
|
|
||||||
===================
|
|
||||||
|
|
||||||
.. rubric::
|
|
||||||
[Var]
|
|
||||||
|
|
||||||
.. math::
|
|
||||||
\frac{x : \tau \in \Gamma}
|
|
||||||
{\Gamma \vdash x : \tau}
|
|
||||||
|
|
||||||
.. rubric::
|
|
||||||
[App]
|
|
||||||
|
|
||||||
.. math::
|
|
||||||
\frac{\Gamma \vdash f : \alpha \to \beta \qquad \Gamma \vdash x : \alpha}
|
|
||||||
{\Gamma \vdash f x : \beta}
|
|
||||||
|
|
||||||
@@ -1,6 +1,6 @@
|
|||||||
fac n = case (==#) n 0 of
|
fac n = case (==#) n 0 of
|
||||||
{ <1> -> 1
|
{ 1 -> 1
|
||||||
; <0> -> (*#) n (fac ((-#) n 1))
|
; 0 -> (*#) n (fac ((-#) n 1))
|
||||||
};
|
};
|
||||||
|
|
||||||
main = fac 3;
|
main = fac 3;
|
||||||
|
|||||||
@@ -2,8 +2,8 @@ nil = Pack{0 0};
|
|||||||
cons x y = Pack{1 2} x y;
|
cons x y = Pack{1 2} x y;
|
||||||
list = cons 1 (cons 2 (cons 3 nil));
|
list = cons 1 (cons 2 (cons 3 nil));
|
||||||
sum l = case l of
|
sum l = case l of
|
||||||
{ <0> -> 0
|
{ 0 -> 0
|
||||||
; <1> x xs -> (+#) x (sum xs)
|
; 1 x xs -> (+#) x (sum xs)
|
||||||
};
|
};
|
||||||
main = sum list;
|
main = sum list;
|
||||||
|
|
||||||
|
|||||||
@@ -1,105 +0,0 @@
|
|||||||
Programming Language Checklist
|
|
||||||
by Colin McMillen, Jason Reed, and Elly Fong-Jones, 2011-10-10.
|
|
||||||
|
|
||||||
You appear to be advocating a new:
|
|
||||||
[x] functional [ ] imperative [ ] object-oriented [ ] procedural [ ] stack-based
|
|
||||||
[ ] "multi-paradigm" [x] lazy [ ] eager [x] statically-typed [ ] dynamically-typed
|
|
||||||
[x] pure [ ] impure [ ] non-hygienic [ ] visual [x] beginner-friendly
|
|
||||||
[ ] non-programmer-friendly [ ] completely incomprehensible
|
|
||||||
programming language. Your language will not work. Here is why it will not work.
|
|
||||||
|
|
||||||
You appear to believe that:
|
|
||||||
[ ] Syntax is what makes programming difficult
|
|
||||||
[x] Garbage collection is free [x] Computers have infinite memory
|
|
||||||
[x] Nobody really needs:
|
|
||||||
[x] concurrency [x] a REPL [x] debugger support [x] IDE support [x] I/O
|
|
||||||
[x] to interact with code not written in your language
|
|
||||||
[ ] The entire world speaks 7-bit ASCII
|
|
||||||
[ ] Scaling up to large software projects will be easy
|
|
||||||
[ ] Convincing programmers to adopt a new language will be easy
|
|
||||||
[ ] Convincing programmers to adopt a language-specific IDE will be easy
|
|
||||||
[ ] Programmers love writing lots of boilerplate
|
|
||||||
[ ] Specifying behaviors as "undefined" means that programmers won't rely on them
|
|
||||||
[ ] "Spooky action at a distance" makes programming more fun
|
|
||||||
|
|
||||||
Unfortunately, your language (has/lacks):
|
|
||||||
[x] comprehensible syntax [ ] semicolons [x] significant whitespace [ ] macros
|
|
||||||
[ ] implicit type conversion [ ] explicit casting [x] type inference
|
|
||||||
[ ] goto [ ] exceptions [x] closures [x] tail recursion [ ] coroutines
|
|
||||||
[ ] reflection [ ] subtyping [ ] multiple inheritance [x] operator overloading
|
|
||||||
[x] algebraic datatypes [x] recursive types [x] polymorphic types
|
|
||||||
[ ] covariant array typing [x] monads [ ] dependent types
|
|
||||||
[x] infix operators [x] nested comments [ ] multi-line strings [ ] regexes
|
|
||||||
[ ] call-by-value [x] call-by-name [ ] call-by-reference [ ] call-cc
|
|
||||||
|
|
||||||
The following philosophical objections apply:
|
|
||||||
[ ] Programmers should not need to understand category theory to write "Hello, World!"
|
|
||||||
[ ] Programmers should not develop RSI from writing "Hello, World!"
|
|
||||||
[ ] The most significant program written in your language is its own compiler
|
|
||||||
[x] The most significant program written in your language isn't even its own compiler
|
|
||||||
[x] No language spec
|
|
||||||
[x] "The implementation is the spec"
|
|
||||||
[ ] The implementation is closed-source [ ] covered by patents [ ] not owned by you
|
|
||||||
[ ] Your type system is unsound [ ] Your language cannot be unambiguously parsed
|
|
||||||
[ ] a proof of same is attached
|
|
||||||
[ ] invoking this proof crashes the compiler
|
|
||||||
[x] The name of your language makes it impossible to find on Google
|
|
||||||
[x] Interpreted languages will never be as fast as C
|
|
||||||
[ ] Compiled languages will never be "extensible"
|
|
||||||
[ ] Writing a compiler that understands English is AI-complete
|
|
||||||
[ ] Your language relies on an optimization which has never been shown possible
|
|
||||||
[ ] There are less than 100 programmers on Earth smart enough to use your language
|
|
||||||
[ ] ____________________________ takes exponential time
|
|
||||||
[ ] ____________________________ is known to be undecidable
|
|
||||||
|
|
||||||
Your implementation has the following flaws:
|
|
||||||
[ ] CPUs do not work that way
|
|
||||||
[ ] RAM does not work that way
|
|
||||||
[ ] VMs do not work that way
|
|
||||||
[ ] Compilers do not work that way
|
|
||||||
[ ] Compilers cannot work that way
|
|
||||||
[ ] Shift-reduce conflicts in parsing seem to be resolved using rand()
|
|
||||||
[ ] You require the compiler to be present at runtime
|
|
||||||
[ ] You require the language runtime to be present at compile-time
|
|
||||||
[ ] Your compiler errors are completely inscrutable
|
|
||||||
[ ] Dangerous behavior is only a warning
|
|
||||||
[ ] The compiler crashes if you look at it funny
|
|
||||||
[x] The VM crashes if you look at it funny
|
|
||||||
[x] You don't seem to understand basic optimization techniques
|
|
||||||
[x] You don't seem to understand basic systems programming
|
|
||||||
[ ] You don't seem to understand pointers
|
|
||||||
[ ] You don't seem to understand functions
|
|
||||||
|
|
||||||
Additionally, your marketing has the following problems:
|
|
||||||
[x] Unsupported claims of increased productivity
|
|
||||||
[x] Unsupported claims of greater "ease of use"
|
|
||||||
[ ] Obviously rigged benchmarks
|
|
||||||
[ ] Graphics, simulation, or crypto benchmarks where your code just calls
|
|
||||||
handwritten assembly through your FFI
|
|
||||||
[ ] String-processing benchmarks where you just call PCRE
|
|
||||||
[ ] Matrix-math benchmarks where you just call BLAS
|
|
||||||
[x] Noone really believes that your language is faster than:
|
|
||||||
[x] assembly [x] C [x] FORTRAN [x] Java [x] Ruby [ ] Prolog
|
|
||||||
[ ] Rejection of orthodox programming-language theory without justification
|
|
||||||
[x] Rejection of orthodox systems programming without justification
|
|
||||||
[ ] Rejection of orthodox algorithmic theory without justification
|
|
||||||
[ ] Rejection of basic computer science without justification
|
|
||||||
|
|
||||||
Taking the wider ecosystem into account, I would like to note that:
|
|
||||||
[x] Your complex sample code would be one line in: examples/
|
|
||||||
[ ] We already have an unsafe imperative language
|
|
||||||
[ ] We already have a safe imperative OO language
|
|
||||||
[x] We already have a safe statically-typed eager functional language
|
|
||||||
[ ] You have reinvented Lisp but worse
|
|
||||||
[ ] You have reinvented Javascript but worse
|
|
||||||
[ ] You have reinvented Java but worse
|
|
||||||
[ ] You have reinvented C++ but worse
|
|
||||||
[ ] You have reinvented PHP but worse
|
|
||||||
[ ] You have reinvented PHP better, but that's still no justification
|
|
||||||
[ ] You have reinvented Brainfuck but non-ironically
|
|
||||||
|
|
||||||
In conclusion, this is what I think of you:
|
|
||||||
[ ] You have some interesting ideas, but this won't fly.
|
|
||||||
[x] This is a bad language, and you should feel bad for inventing it.
|
|
||||||
[ ] Programming in this language is an adequate punishment for inventing it.
|
|
||||||
|
|
||||||
67
rlp.cabal
67
rlp.cabal
@@ -12,7 +12,6 @@ category: Language
|
|||||||
build-type: Simple
|
build-type: Simple
|
||||||
extra-doc-files: README.md
|
extra-doc-files: README.md
|
||||||
-- extra-source-files:
|
-- extra-source-files:
|
||||||
tested-with: GHC==9.6.2
|
|
||||||
|
|
||||||
common warnings
|
common warnings
|
||||||
-- ghc-options: -Wall -Wno-incomplete-uni-patterns -Wno-unused-top-binds
|
-- ghc-options: -Wall -Wno-incomplete-uni-patterns -Wno-unused-top-binds
|
||||||
@@ -31,12 +30,6 @@ library
|
|||||||
, Core.TH
|
, Core.TH
|
||||||
, Core.HindleyMilner
|
, Core.HindleyMilner
|
||||||
, Control.Monad.Errorful
|
, Control.Monad.Errorful
|
||||||
, Rlp.Syntax
|
|
||||||
-- , Rlp.Parse.Decls
|
|
||||||
, Rlp.Parse
|
|
||||||
, Rlp.Parse.Associate
|
|
||||||
, Rlp.Lex
|
|
||||||
, Rlp.Parse.Types
|
|
||||||
|
|
||||||
other-modules: Data.Heap
|
other-modules: Data.Heap
|
||||||
, Data.Pretty
|
, Data.Pretty
|
||||||
@@ -44,38 +37,34 @@ library
|
|||||||
, Core.Lex
|
, Core.Lex
|
||||||
, Core2Core
|
, Core2Core
|
||||||
, Control.Monad.Utils
|
, Control.Monad.Utils
|
||||||
|
, RLP.Syntax
|
||||||
|
|
||||||
build-tool-depends: happy:happy, alex:alex
|
build-tool-depends: happy:happy, alex:alex
|
||||||
|
|
||||||
-- other-extensions:
|
-- other-extensions:
|
||||||
build-depends: base ^>=4.18.0.0
|
build-depends: base ^>=4.18.0.0
|
||||||
|
, containers
|
||||||
|
, microlens
|
||||||
|
, microlens-mtl
|
||||||
|
, microlens-th
|
||||||
|
, microlens-platform
|
||||||
|
, mtl
|
||||||
|
, template-haskell
|
||||||
-- required for happy
|
-- required for happy
|
||||||
, array >= 0.5.5 && < 0.6
|
, array
|
||||||
, containers >= 0.6.7 && < 0.7
|
, data-default-class
|
||||||
, template-haskell >= 2.20.0 && < 2.21
|
, unordered-containers
|
||||||
, pretty >= 1.1.3 && < 1.2
|
, hashable
|
||||||
, data-default >= 0.7.1 && < 0.8
|
, pretty
|
||||||
, data-default-class >= 0.1.2 && < 0.2
|
-- TODO: either learn recursion-schemes, or stop depending
|
||||||
, hashable >= 1.4.3 && < 1.5
|
-- on it.
|
||||||
, mtl >= 2.3.1 && < 2.4
|
, recursion-schemes
|
||||||
, text >= 2.0.2 && < 2.1
|
, megaparsec
|
||||||
, megaparsec >= 9.6.1 && < 9.7
|
, text
|
||||||
, microlens >= 0.4.13 && < 0.5
|
|
||||||
, microlens-mtl >= 0.2.0 && < 0.3
|
|
||||||
, microlens-platform >= 0.4.3 && < 0.5
|
|
||||||
, microlens-th >= 0.4.3 && < 0.5
|
|
||||||
, unordered-containers >= 0.2.20 && < 0.3
|
|
||||||
, recursion-schemes >= 5.2.2 && < 5.3
|
|
||||||
, data-fix >= 0.3.2 && < 0.4
|
|
||||||
, utf8-string >= 1.0.2 && < 1.1
|
|
||||||
, extra >= 1.7.0 && < 2
|
|
||||||
|
|
||||||
hs-source-dirs: src
|
hs-source-dirs: src
|
||||||
default-language: GHC2021
|
default-language: GHC2021
|
||||||
|
|
||||||
default-extensions:
|
|
||||||
OverloadedStrings
|
|
||||||
|
|
||||||
executable rlpc
|
executable rlpc
|
||||||
import: warnings
|
import: warnings
|
||||||
main-is: Main.hs
|
main-is: Main.hs
|
||||||
@@ -83,12 +72,12 @@ executable rlpc
|
|||||||
-- other-extensions:
|
-- other-extensions:
|
||||||
build-depends: base ^>=4.18.0.0
|
build-depends: base ^>=4.18.0.0
|
||||||
, rlp
|
, rlp
|
||||||
, optparse-applicative >= 0.18.1 && < 0.19
|
, optparse-applicative
|
||||||
, microlens >= 0.4.13 && < 0.5
|
, microlens
|
||||||
, microlens-mtl >= 0.2.0 && < 0.3
|
, microlens-mtl
|
||||||
, mtl >= 2.3.1 && < 2.4
|
, mtl
|
||||||
, unordered-containers >= 0.2.20 && < 0.3
|
, unordered-containers
|
||||||
, text >= 2.0.2 && < 2.1
|
, text
|
||||||
|
|
||||||
hs-source-dirs: app
|
hs-source-dirs: app
|
||||||
default-language: GHC2021
|
default-language: GHC2021
|
||||||
@@ -101,12 +90,20 @@ test-suite rlp-test
|
|||||||
hs-source-dirs: tst
|
hs-source-dirs: tst
|
||||||
main-is: Main.hs
|
main-is: Main.hs
|
||||||
build-depends: base ^>=4.18.0.0
|
build-depends: base ^>=4.18.0.0
|
||||||
|
, unordered-containers
|
||||||
, rlp
|
, rlp
|
||||||
, QuickCheck
|
, QuickCheck
|
||||||
, hspec ==2.*
|
, hspec ==2.*
|
||||||
, microlens
|
, microlens
|
||||||
|
, text
|
||||||
|
, pretty
|
||||||
|
, microlens-platform
|
||||||
|
|
||||||
other-modules: Arith
|
other-modules: Arith
|
||||||
, GMSpec
|
, GMSpec
|
||||||
|
, CoreSyntax
|
||||||
, Core.HindleyMilnerSpec
|
, Core.HindleyMilnerSpec
|
||||||
|
, Core.ParseSpec
|
||||||
|
|
||||||
build-tool-depends: hspec-discover:hspec-discover
|
build-tool-depends: hspec-discover:hspec-discover
|
||||||
|
|
||||||
|
|||||||
@@ -11,6 +11,8 @@ module Compiler.JustRun
|
|||||||
( justLexSrc
|
( justLexSrc
|
||||||
, justParseSrc
|
, justParseSrc
|
||||||
, justTypeCheckSrc
|
, justTypeCheckSrc
|
||||||
|
, RlpcError
|
||||||
|
, Program'
|
||||||
)
|
)
|
||||||
where
|
where
|
||||||
----------------------------------------------------------------------------------
|
----------------------------------------------------------------------------------
|
||||||
@@ -26,23 +28,21 @@ import Data.Function ((&))
|
|||||||
import GM
|
import GM
|
||||||
----------------------------------------------------------------------------------
|
----------------------------------------------------------------------------------
|
||||||
|
|
||||||
justLexSrc :: String -> Either [MsgEnvelope RlpcError] [CoreToken]
|
justLexSrc :: String -> Either RlpcError [CoreToken]
|
||||||
justLexSrc s = lexCoreR (T.pack s)
|
justLexSrc s = lexCoreR (T.pack s)
|
||||||
& fmap (map $ \ (Located _ _ _ t) -> t)
|
& fmap (map $ \ (Located _ _ _ t) -> t)
|
||||||
& rlpcToEither
|
& rlpcToEither
|
||||||
|
|
||||||
justParseSrc :: String -> Either [MsgEnvelope RlpcError] Program'
|
justParseSrc :: String -> Either RlpcError Program'
|
||||||
justParseSrc s = parse (T.pack s)
|
justParseSrc s = parse (T.pack s)
|
||||||
& rlpcToEither
|
& rlpcToEither
|
||||||
where parse = lexCoreR >=> parseCoreProgR
|
where parse = lexCoreR >=> parseCoreProgR
|
||||||
|
|
||||||
justTypeCheckSrc :: String -> Either [MsgEnvelope RlpcError] Program'
|
justTypeCheckSrc :: String -> Either RlpcError Program'
|
||||||
justTypeCheckSrc s = typechk (T.pack s)
|
justTypeCheckSrc s = typechk (T.pack s)
|
||||||
& rlpcToEither
|
& rlpcToEither
|
||||||
where typechk = lexCoreR >=> parseCoreProgR >=> checkCoreProgR
|
where typechk = lexCoreR >=> parseCoreProgR >=> checkCoreProgR
|
||||||
|
|
||||||
rlpcToEither :: RLPC a -> Either [MsgEnvelope RlpcError] a
|
rlpcToEither :: RLPC e a -> Either e a
|
||||||
rlpcToEither r = case evalRLPC def r of
|
rlpcToEither = evalRLPC def >>> fmap fst
|
||||||
(Just a, _) -> Right a
|
|
||||||
(Nothing, es) -> Left es
|
|
||||||
|
|
||||||
|
|||||||
@@ -16,9 +16,9 @@ module Compiler.RLPC
|
|||||||
, RLPCT(..)
|
, RLPCT(..)
|
||||||
, RLPCIO
|
, RLPCIO
|
||||||
, RLPCOptions(RLPCOptions)
|
, RLPCOptions(RLPCOptions)
|
||||||
, IsRlpcError(..)
|
|
||||||
, RlpcError(..)
|
, RlpcError(..)
|
||||||
, MsgEnvelope(..)
|
, IsRlpcError(..)
|
||||||
|
, rlpc
|
||||||
, addFatal
|
, addFatal
|
||||||
, addWound
|
, addWound
|
||||||
, MonadErrorful
|
, MonadErrorful
|
||||||
@@ -27,6 +27,9 @@ module Compiler.RLPC
|
|||||||
, evalRLPCT
|
, evalRLPCT
|
||||||
, evalRLPCIO
|
, evalRLPCIO
|
||||||
, evalRLPC
|
, evalRLPC
|
||||||
|
, addRlpcWound
|
||||||
|
, addRlpcFatal
|
||||||
|
, liftRlpcErrs
|
||||||
, rlpcLogFile
|
, rlpcLogFile
|
||||||
, rlpcDebugOpts
|
, rlpcDebugOpts
|
||||||
, rlpcEvaluator
|
, rlpcEvaluator
|
||||||
@@ -37,7 +40,6 @@ module Compiler.RLPC
|
|||||||
, flagDDumpOpts
|
, flagDDumpOpts
|
||||||
, flagDDumpAST
|
, flagDDumpAST
|
||||||
, def
|
, def
|
||||||
, liftErrorful
|
|
||||||
)
|
)
|
||||||
where
|
where
|
||||||
----------------------------------------------------------------------------------
|
----------------------------------------------------------------------------------
|
||||||
@@ -49,7 +51,6 @@ import Control.Monad.Errorful
|
|||||||
import Compiler.RlpcError
|
import Compiler.RlpcError
|
||||||
import Data.Functor.Identity
|
import Data.Functor.Identity
|
||||||
import Data.Default.Class
|
import Data.Default.Class
|
||||||
import Data.Foldable
|
|
||||||
import GHC.Generics (Generic)
|
import GHC.Generics (Generic)
|
||||||
import Data.Hashable (Hashable)
|
import Data.Hashable (Hashable)
|
||||||
import Data.HashSet (HashSet)
|
import Data.HashSet (HashSet)
|
||||||
@@ -57,44 +58,48 @@ import Data.HashSet qualified as S
|
|||||||
import Data.Coerce
|
import Data.Coerce
|
||||||
import Lens.Micro
|
import Lens.Micro
|
||||||
import Lens.Micro.TH
|
import Lens.Micro.TH
|
||||||
import System.Exit
|
|
||||||
----------------------------------------------------------------------------------
|
----------------------------------------------------------------------------------
|
||||||
|
|
||||||
newtype RLPCT m a = RLPCT {
|
-- TODO: fancy errors
|
||||||
runRLPCT :: ReaderT RLPCOptions (ErrorfulT (MsgEnvelope RlpcError) m) a
|
newtype RLPCT e m a = RLPCT {
|
||||||
|
runRLPCT :: ReaderT RLPCOptions (ErrorfulT e m) a
|
||||||
}
|
}
|
||||||
deriving (Functor, Applicative, Monad)
|
-- TODO: incorrect ussage of MonadReader. RLPC should have its own
|
||||||
|
-- environment access functions
|
||||||
|
deriving (Functor, Applicative, Monad, MonadReader RLPCOptions)
|
||||||
|
|
||||||
type RLPC = RLPCT Identity
|
deriving instance (MonadIO m) => MonadIO (RLPCT e m)
|
||||||
|
|
||||||
type RLPCIO = RLPCT IO
|
instance MonadTrans (RLPCT e) where
|
||||||
|
lift = RLPCT . lift . lift
|
||||||
|
|
||||||
|
instance (MonadState s m) => MonadState s (RLPCT e m) where
|
||||||
|
state = lift . state
|
||||||
|
|
||||||
|
type RLPC e = RLPCT e Identity
|
||||||
|
|
||||||
|
type RLPCIO e = RLPCT e IO
|
||||||
|
|
||||||
|
evalRLPCT :: RLPCOptions
|
||||||
|
-> RLPCT e m a
|
||||||
|
-> m (Either e (a, [e]))
|
||||||
|
evalRLPCT o = runRLPCT >>> flip runReaderT o >>> runErrorfulT
|
||||||
|
|
||||||
evalRLPC :: RLPCOptions
|
evalRLPC :: RLPCOptions
|
||||||
-> RLPC a
|
-> RLPC e a
|
||||||
-> (Maybe a, [MsgEnvelope RlpcError])
|
-> Either e (a, [e])
|
||||||
evalRLPC opt r = runRLPCT r
|
evalRLPC o m = coerce $ evalRLPCT o m
|
||||||
& flip runReaderT opt
|
|
||||||
& runErrorful
|
|
||||||
|
|
||||||
evalRLPCT :: (Monad m)
|
evalRLPCIO :: (Exception e)
|
||||||
=> RLPCOptions
|
=> RLPCOptions
|
||||||
-> RLPCT m a
|
-> RLPCIO e a
|
||||||
-> m (Maybe a, [MsgEnvelope RlpcError])
|
-> IO (a, [e])
|
||||||
evalRLPCT = undefined
|
evalRLPCIO o m = do
|
||||||
|
m' <- evalRLPCT o m
|
||||||
evalRLPCIO :: RLPCOptions -> RLPCIO a -> IO a
|
case m' of
|
||||||
evalRLPCIO opt r = do
|
-- TODO: errors
|
||||||
(ma,es) <- evalRLPCT opt r
|
Left e -> throwIO e
|
||||||
putRlpcErrs es
|
Right a -> pure a
|
||||||
case ma of
|
|
||||||
Just x -> pure x
|
|
||||||
Nothing -> die "Failed, no code compiled."
|
|
||||||
|
|
||||||
putRlpcErrs :: [MsgEnvelope RlpcError] -> IO ()
|
|
||||||
putRlpcErrs = traverse_ print
|
|
||||||
|
|
||||||
liftErrorful :: (Monad m, IsRlpcError e) => ErrorfulT (MsgEnvelope e) m a -> RLPCT m a
|
|
||||||
liftErrorful e = RLPCT $ lift (fmap liftRlpcError `mapErrorful` e)
|
|
||||||
|
|
||||||
data RLPCOptions = RLPCOptions
|
data RLPCOptions = RLPCOptions
|
||||||
{ _rlpcLogFile :: Maybe FilePath
|
{ _rlpcLogFile :: Maybe FilePath
|
||||||
@@ -108,6 +113,32 @@ data RLPCOptions = RLPCOptions
|
|||||||
data Evaluator = EvaluatorGM | EvaluatorTI
|
data Evaluator = EvaluatorGM | EvaluatorTI
|
||||||
deriving Show
|
deriving Show
|
||||||
|
|
||||||
|
data Severity = Error
|
||||||
|
| Warning
|
||||||
|
| Debug
|
||||||
|
deriving Show
|
||||||
|
|
||||||
|
-- temporary until we have a new doc building system
|
||||||
|
type ErrorDoc = String
|
||||||
|
|
||||||
|
instance (Monad m) => MonadErrorful e (RLPCT e m) where
|
||||||
|
addWound = RLPCT . lift . addWound
|
||||||
|
addFatal = RLPCT . lift . addFatal
|
||||||
|
|
||||||
|
liftRlpcErrs :: (IsRlpcError e, Monad m)
|
||||||
|
=> RLPCT e m a -> RLPCT RlpcError m a
|
||||||
|
liftRlpcErrs m = RLPCT . ReaderT $ \r ->
|
||||||
|
mapErrors liftRlpcErr $ runRLPCT >>> (`runReaderT` r) $ m
|
||||||
|
|
||||||
|
addRlpcWound :: (IsRlpcError e, Monad m) => e -> RLPCT RlpcError m ()
|
||||||
|
addRlpcWound = addWound . liftRlpcErr
|
||||||
|
|
||||||
|
addRlpcFatal :: (IsRlpcError e, Monad m) => e -> RLPCT RlpcError m ()
|
||||||
|
addRlpcFatal = addWound . liftRlpcErr
|
||||||
|
|
||||||
|
rlpc :: (Monad m) => ErrorfulT e m a -> RLPCT e m a
|
||||||
|
rlpc = RLPCT . ReaderT . const
|
||||||
|
|
||||||
----------------------------------------------------------------------------------
|
----------------------------------------------------------------------------------
|
||||||
|
|
||||||
instance Default RLPCOptions where
|
instance Default RLPCOptions where
|
||||||
|
|||||||
@@ -1,70 +1,15 @@
|
|||||||
{-# LANGUAGE TemplateHaskell #-}
|
|
||||||
{-# LANGUAGE PatternSynonyms, ViewPatterns #-}
|
|
||||||
module Compiler.RlpcError
|
module Compiler.RlpcError
|
||||||
( IsRlpcError(..)
|
( RlpcError(..)
|
||||||
, MsgEnvelope(..)
|
, IsRlpcError(..)
|
||||||
, Severity(..)
|
|
||||||
, RlpcError(..)
|
|
||||||
, SrcSpan(..)
|
|
||||||
, msgSpan
|
|
||||||
, msgDiagnostic
|
|
||||||
, msgSeverity
|
|
||||||
, liftRlpcErrors
|
|
||||||
, errorMsg
|
|
||||||
)
|
)
|
||||||
where
|
where
|
||||||
----------------------------------------------------------------------------------
|
----------------------------------------------------------------------------------
|
||||||
import Control.Monad.Errorful
|
import Control.Monad.Errorful
|
||||||
import Data.Text (Text)
|
|
||||||
import Data.Text qualified as T
|
|
||||||
import GHC.Exts (IsString(..))
|
|
||||||
import Lens.Micro.Platform
|
|
||||||
import Lens.Micro.Platform.Internal
|
|
||||||
----------------------------------------------------------------------------------
|
----------------------------------------------------------------------------------
|
||||||
|
|
||||||
data MsgEnvelope e = MsgEnvelope
|
data RlpcError = RlpcErr String -- temp
|
||||||
{ _msgSpan :: SrcSpan
|
deriving (Show, Eq)
|
||||||
, _msgDiagnostic :: e
|
|
||||||
, _msgSeverity :: Severity
|
|
||||||
}
|
|
||||||
deriving (Functor, Show)
|
|
||||||
|
|
||||||
newtype RlpcError = Text [Text]
|
class IsRlpcError a where
|
||||||
deriving Show
|
liftRlpcErr :: a -> RlpcError
|
||||||
|
|
||||||
instance IsString RlpcError where
|
|
||||||
fromString = Text . pure . T.pack
|
|
||||||
|
|
||||||
class IsRlpcError e where
|
|
||||||
liftRlpcError :: e -> RlpcError
|
|
||||||
|
|
||||||
instance IsRlpcError RlpcError where
|
|
||||||
liftRlpcError = id
|
|
||||||
|
|
||||||
data Severity = SevWarning
|
|
||||||
| SevError
|
|
||||||
deriving Show
|
|
||||||
|
|
||||||
data SrcSpan = SrcSpan
|
|
||||||
!Int -- ^ Line
|
|
||||||
!Int -- ^ Column
|
|
||||||
!Int -- ^ Length
|
|
||||||
deriving Show
|
|
||||||
|
|
||||||
makeLenses ''MsgEnvelope
|
|
||||||
|
|
||||||
liftRlpcErrors :: (Functor m, IsRlpcError e)
|
|
||||||
=> ErrorfulT e m a
|
|
||||||
-> ErrorfulT RlpcError m a
|
|
||||||
liftRlpcErrors = mapErrorful liftRlpcError
|
|
||||||
|
|
||||||
instance (IsRlpcError e) => IsRlpcError (MsgEnvelope e) where
|
|
||||||
liftRlpcError msg = msg ^. msgDiagnostic & liftRlpcError
|
|
||||||
|
|
||||||
errorMsg :: SrcSpan -> e -> MsgEnvelope e
|
|
||||||
errorMsg s e = MsgEnvelope
|
|
||||||
{ _msgSpan = s
|
|
||||||
, _msgDiagnostic = e
|
|
||||||
, _msgSeverity = SevError
|
|
||||||
}
|
|
||||||
|
|
||||||
|
|||||||
@@ -1,79 +1,73 @@
|
|||||||
{-# LANGUAGE StandaloneDeriving #-}
|
{-# LANGUAGE StandaloneDeriving #-}
|
||||||
{-# LANGUAGE FunctionalDependencies #-}
|
{-# LANGUAGE FunctionalDependencies #-}
|
||||||
{-# LANGUAGE TupleSections, PatternSynonyms #-}
|
{-# LANGUAGE TupleSections, PatternSynonyms #-}
|
||||||
{-# LANGUAGE UndecidableInstances #-}
|
|
||||||
module Control.Monad.Errorful
|
module Control.Monad.Errorful
|
||||||
( ErrorfulT
|
( ErrorfulT
|
||||||
, runErrorfulT
|
, runErrorfulT
|
||||||
, Errorful
|
, Errorful
|
||||||
, runErrorful
|
, runErrorful
|
||||||
, mapErrorful
|
, mapErrors
|
||||||
, MonadErrorful(..)
|
, MonadErrorful(..)
|
||||||
)
|
)
|
||||||
where
|
where
|
||||||
----------------------------------------------------------------------------------
|
----------------------------------------------------------------------------------
|
||||||
import Control.Monad.State.Strict
|
|
||||||
import Control.Monad.Trans
|
import Control.Monad.Trans
|
||||||
import Data.Functor.Identity
|
import Data.Functor.Identity
|
||||||
import Data.Coerce
|
import Data.Coerce
|
||||||
import Data.HashSet (HashSet)
|
|
||||||
import Data.HashSet qualified as H
|
|
||||||
import Lens.Micro
|
import Lens.Micro
|
||||||
----------------------------------------------------------------------------------
|
----------------------------------------------------------------------------------
|
||||||
|
|
||||||
newtype ErrorfulT e m a = ErrorfulT { runErrorfulT :: m (Maybe a, [e]) }
|
newtype ErrorfulT e m a = ErrorfulT { runErrorfulT :: m (Either e (a, [e])) }
|
||||||
|
|
||||||
type Errorful e = ErrorfulT e Identity
|
type Errorful e = ErrorfulT e Identity
|
||||||
|
|
||||||
pattern Errorful :: (Maybe a, [e]) -> Errorful e a
|
pattern Errorful :: (Either e (a, [e])) -> Errorful e a
|
||||||
pattern Errorful a = ErrorfulT (Identity a)
|
pattern Errorful a = ErrorfulT (Identity a)
|
||||||
|
|
||||||
runErrorful :: Errorful e a -> (Maybe a, [e])
|
runErrorful :: Errorful e a -> Either e (a, [e])
|
||||||
runErrorful m = coerce (runErrorfulT m)
|
runErrorful m = coerce (runErrorfulT m)
|
||||||
|
|
||||||
class (Applicative m) => MonadErrorful e m | m -> e where
|
class (Applicative m) => MonadErrorful e m | m -> e where
|
||||||
addWound :: e -> m ()
|
addWound :: e -> m ()
|
||||||
addFatal :: e -> m a
|
addFatal :: e -> m a
|
||||||
|
|
||||||
|
-- not sure if i want to add this yet...
|
||||||
|
-- catchWound :: m a -> (e -> m a) -> m a
|
||||||
|
|
||||||
instance (Applicative m) => MonadErrorful e (ErrorfulT e m) where
|
instance (Applicative m) => MonadErrorful e (ErrorfulT e m) where
|
||||||
addWound e = ErrorfulT $ pure (Just (), [e])
|
addWound e = ErrorfulT $ pure . Right $ ((), [e])
|
||||||
addFatal e = ErrorfulT $ pure (Nothing, [e])
|
addFatal e = ErrorfulT $ pure . Left $ e
|
||||||
|
|
||||||
instance MonadTrans (ErrorfulT e) where
|
instance MonadTrans (ErrorfulT e) where
|
||||||
lift m = ErrorfulT ((\x -> (Just x,[])) <$> m)
|
lift m = ErrorfulT (Right . (,[]) <$> m)
|
||||||
|
|
||||||
instance (MonadIO m) => MonadIO (ErrorfulT e m) where
|
instance (MonadIO m) => MonadIO (ErrorfulT e m) where
|
||||||
liftIO = lift . liftIO
|
liftIO = lift . liftIO
|
||||||
|
|
||||||
instance (Functor m) => Functor (ErrorfulT e m) where
|
instance (Functor m) => Functor (ErrorfulT e m) where
|
||||||
fmap f (ErrorfulT m) = ErrorfulT (m & mapped . _1 . _Just %~ f)
|
fmap f (ErrorfulT m) = ErrorfulT $ fmap (_1 %~ f) <$> m
|
||||||
|
|
||||||
instance (Applicative m) => Applicative (ErrorfulT e m) where
|
instance (Applicative m) => Applicative (ErrorfulT e m) where
|
||||||
pure a = ErrorfulT . pure $ (Just a, [])
|
pure a = ErrorfulT (pure . Right $ (a, []))
|
||||||
|
|
||||||
ErrorfulT m <*> ErrorfulT n = ErrorfulT $ m `apply` n where
|
m <*> a = ErrorfulT (m' `apply` a')
|
||||||
apply :: m (Maybe (a -> b), [e]) -> m (Maybe a, [e]) -> m (Maybe b, [e])
|
where
|
||||||
apply = liftA2 $ \ (mf,e1) (ma,e2) -> (mf <*> ma, e1 <> e2)
|
m' = runErrorfulT m
|
||||||
|
a' = runErrorfulT a
|
||||||
|
-- TODO: strict concatenation
|
||||||
|
apply = liftA2 $ liftA2 (\ (f,e1) (x,e2) -> (f x, e1 ++ e2))
|
||||||
|
|
||||||
instance (Monad m) => Monad (ErrorfulT e m) where
|
instance (Monad m) => Monad (ErrorfulT e m) where
|
||||||
ErrorfulT m >>= k = ErrorfulT $ do
|
ErrorfulT m >>= k = ErrorfulT $ do
|
||||||
(a,es) <- m
|
m' <- m
|
||||||
case a of
|
case m' of
|
||||||
Just x -> runErrorfulT (k x)
|
Right (a,es) -> runErrorfulT (k a)
|
||||||
Nothing -> pure (Nothing, es)
|
Left e -> pure (Left e)
|
||||||
|
|
||||||
mapErrorful :: (Functor m) => (e -> e') -> ErrorfulT e m a -> ErrorfulT e' m a
|
mapErrors :: (Monad m) => (e -> e') -> ErrorfulT e m a -> ErrorfulT e' m a
|
||||||
mapErrorful f (ErrorfulT m) = ErrorfulT $
|
mapErrors f m = ErrorfulT $ do
|
||||||
m & mapped . _2 . mapped %~ f
|
x <- runErrorfulT m
|
||||||
|
case x of
|
||||||
-- when microlens-pro drops we can write this as
|
Left e -> pure . Left $ f e
|
||||||
-- mapErrorful f = coerced . mapped . _2 . mappd %~ f
|
Right (a,es) -> pure . Right $ (a, f <$> es)
|
||||||
-- lol
|
|
||||||
|
|
||||||
--------------------------------------------------------------------------------
|
|
||||||
-- daily dose of n^2 instances
|
|
||||||
|
|
||||||
instance (Monad m, MonadErrorful e m) => MonadErrorful e (StateT s m) where
|
|
||||||
addWound = undefined
|
|
||||||
addFatal = undefined
|
|
||||||
|
|
||||||
|
|||||||
@@ -4,19 +4,17 @@ Description : Core examples (may eventually be unit tests)
|
|||||||
-}
|
-}
|
||||||
{-# LANGUAGE QuasiQuotes #-}
|
{-# LANGUAGE QuasiQuotes #-}
|
||||||
{-# LANGUAGE OverloadedStrings #-}
|
{-# LANGUAGE OverloadedStrings #-}
|
||||||
module Core.Examples where
|
module Core.Examples
|
||||||
|
( fac3
|
||||||
|
, sumList
|
||||||
|
, constDivZero
|
||||||
|
, idCase
|
||||||
|
) where
|
||||||
----------------------------------------------------------------------------------
|
----------------------------------------------------------------------------------
|
||||||
import Core.Syntax
|
import Core.Syntax
|
||||||
import Core.TH
|
import Core.TH
|
||||||
----------------------------------------------------------------------------------
|
----------------------------------------------------------------------------------
|
||||||
|
|
||||||
-- fac3 = undefined
|
|
||||||
-- sumList = undefined
|
|
||||||
-- constDivZero = undefined
|
|
||||||
-- idCase = undefined
|
|
||||||
|
|
||||||
---
|
|
||||||
|
|
||||||
letrecExample :: Program'
|
letrecExample :: Program'
|
||||||
letrecExample = [coreProg|
|
letrecExample = [coreProg|
|
||||||
pair x y f = f x y;
|
pair x y f = f x y;
|
||||||
@@ -142,8 +140,8 @@ simple1 = [coreProg|
|
|||||||
caseBool1 :: Program'
|
caseBool1 :: Program'
|
||||||
caseBool1 = [coreProg|
|
caseBool1 = [coreProg|
|
||||||
_if c x y = case c of
|
_if c x y = case c of
|
||||||
{ <1> -> x
|
{ 1 -> x
|
||||||
; <0> -> y
|
; 0 -> y
|
||||||
};
|
};
|
||||||
|
|
||||||
false = Pack{0 0};
|
false = Pack{0 0};
|
||||||
@@ -155,8 +153,8 @@ caseBool1 = [coreProg|
|
|||||||
fac3 :: Program'
|
fac3 :: Program'
|
||||||
fac3 = [coreProg|
|
fac3 = [coreProg|
|
||||||
fac n = case (==#) n 0 of
|
fac n = case (==#) n 0 of
|
||||||
{ <1> -> 1
|
{ 1 -> 1
|
||||||
; <0> -> (*#) n (fac ((-#) n 1))
|
; 0 -> (*#) n (fac ((-#) n 1))
|
||||||
};
|
};
|
||||||
|
|
||||||
main = fac 3;
|
main = fac 3;
|
||||||
@@ -170,8 +168,8 @@ sumList = [coreProg|
|
|||||||
cons x y = Pack{1 2} x y;
|
cons x y = Pack{1 2} x y;
|
||||||
list = cons 1 (cons 2 (cons 3 nil));
|
list = cons 1 (cons 2 (cons 3 nil));
|
||||||
sum l = case l of
|
sum l = case l of
|
||||||
{ <0> -> 0
|
{ 0 -> 0
|
||||||
; <1> x xs -> (+#) x (sum xs)
|
; 1 x xs -> (+#) x (sum xs)
|
||||||
};
|
};
|
||||||
main = sum list;
|
main = sum list;
|
||||||
|]
|
|]
|
||||||
@@ -187,36 +185,10 @@ idCase = [coreProg|
|
|||||||
id x = x;
|
id x = x;
|
||||||
|
|
||||||
main = id (case Pack{1 0} of
|
main = id (case Pack{1 0} of
|
||||||
{ <1> -> (+#) 2 3
|
{ 1 -> (+#) 2 3
|
||||||
})
|
})
|
||||||
|]
|
|]
|
||||||
|
|
||||||
-- NOTE: the GM primitive (==#) returns an untyped constructor with tag 1 for
|
|
||||||
-- true, and 0 for false. See: GM.boxBool
|
|
||||||
namedBoolCase :: Program'
|
|
||||||
namedBoolCase = [coreProg|
|
|
||||||
{-# PackData True 1 0 #-}
|
|
||||||
{-# PackData False 0 0 #-}
|
|
||||||
main = case (==#) 1 1 of
|
|
||||||
{ True -> 123
|
|
||||||
; False -> 456
|
|
||||||
}
|
|
||||||
|]
|
|
||||||
|
|
||||||
namedConsCase :: Program'
|
|
||||||
namedConsCase = [coreProg|
|
|
||||||
{-# PackData Nil 0 0 #-}
|
|
||||||
{-# PackData Cons 1 2 #-}
|
|
||||||
Nil = Pack{0 0};
|
|
||||||
Cons = Pack{1 2};
|
|
||||||
foldr f z l = case l of
|
|
||||||
{ Nil -> z
|
|
||||||
; Cons x xs -> f x (foldr f z xs)
|
|
||||||
};
|
|
||||||
list = Cons 1 (Cons 2 (Cons 3 Nil));
|
|
||||||
main = foldr (+#) 0 list
|
|
||||||
|]
|
|
||||||
|
|
||||||
-- corePrelude :: Module Name
|
-- corePrelude :: Module Name
|
||||||
-- corePrelude = Module (Just ("Prelude", [])) $
|
-- corePrelude = Module (Just ("Prelude", [])) $
|
||||||
-- -- non-primitive defs
|
-- -- non-primitive defs
|
||||||
@@ -244,4 +216,3 @@ namedConsCase = [coreProg|
|
|||||||
-- , ScDef "Cons" [] $ Con 2 2
|
-- , ScDef "Cons" [] $ Con 2 2
|
||||||
-- ]
|
-- ]
|
||||||
|
|
||||||
--}
|
|
||||||
|
|||||||
@@ -3,7 +3,6 @@ Module : Core.HindleyMilner
|
|||||||
Description : Hindley-Milner type system
|
Description : Hindley-Milner type system
|
||||||
-}
|
-}
|
||||||
{-# LANGUAGE LambdaCase #-}
|
{-# LANGUAGE LambdaCase #-}
|
||||||
{-# LANGUAGE OverloadedStrings #-}
|
|
||||||
module Core.HindleyMilner
|
module Core.HindleyMilner
|
||||||
( Context'
|
( Context'
|
||||||
, infer
|
, infer
|
||||||
@@ -17,17 +16,15 @@ module Core.HindleyMilner
|
|||||||
----------------------------------------------------------------------------------
|
----------------------------------------------------------------------------------
|
||||||
import Lens.Micro
|
import Lens.Micro
|
||||||
import Lens.Micro.Mtl
|
import Lens.Micro.Mtl
|
||||||
import Lens.Micro.Platform
|
|
||||||
import Data.Maybe (fromMaybe)
|
import Data.Maybe (fromMaybe)
|
||||||
import Data.Text qualified as T
|
import Data.Text qualified as T
|
||||||
import Data.HashMap.Strict qualified as H
|
import Data.HashMap.Strict qualified as H
|
||||||
import Data.Foldable (traverse_)
|
import Data.Foldable (traverse_)
|
||||||
import Compiler.RLPC
|
import Compiler.RLPC
|
||||||
import Control.Monad (foldM, void, forM)
|
import Control.Monad (foldM, void)
|
||||||
import Control.Monad.Errorful (Errorful, addFatal)
|
import Control.Monad.Errorful (Errorful, addFatal)
|
||||||
import Control.Monad.State
|
import Control.Monad.State
|
||||||
import Control.Monad.Utils (mapAccumLM)
|
import Control.Monad.Utils (mapAccumLM)
|
||||||
import Text.Printf
|
|
||||||
import Core.Syntax
|
import Core.Syntax
|
||||||
----------------------------------------------------------------------------------
|
----------------------------------------------------------------------------------
|
||||||
|
|
||||||
@@ -51,23 +48,9 @@ data TypeError
|
|||||||
| TyErrMissingTypeSig Name
|
| TyErrMissingTypeSig Name
|
||||||
deriving (Show, Eq)
|
deriving (Show, Eq)
|
||||||
|
|
||||||
|
-- TODO:
|
||||||
instance IsRlpcError TypeError where
|
instance IsRlpcError TypeError where
|
||||||
liftRlpcError = \case
|
liftRlpcErr = RlpcErr . show
|
||||||
-- todo: use anti-parser instead of show
|
|
||||||
TyErrCouldNotUnify t u -> Text
|
|
||||||
[ T.pack $ printf "Could not match type `%s` with `%s`."
|
|
||||||
(show t) (show u)
|
|
||||||
, "Expected: " <> tshow t
|
|
||||||
, "Got: " <> tshow u
|
|
||||||
]
|
|
||||||
TyErrUntypedVariable n -> Text
|
|
||||||
[ "Untyped (likely undefined) variable `" <> n <> "`"
|
|
||||||
]
|
|
||||||
TyErrRecursiveType t x -> Text
|
|
||||||
[ T.pack $ printf "recursive type error lol"
|
|
||||||
]
|
|
||||||
|
|
||||||
where tshow = T.pack . show
|
|
||||||
|
|
||||||
-- | Synonym for @Errorful [TypeError]@. This means an @HMError@ action may
|
-- | Synonym for @Errorful [TypeError]@. This means an @HMError@ action may
|
||||||
-- throw any number of fatal or nonfatal errors. Run with @runErrorful@.
|
-- throw any number of fatal or nonfatal errors. Run with @runErrorful@.
|
||||||
@@ -105,10 +88,10 @@ checkCoreProg p = scDefs
|
|||||||
where scname = sc ^. _lhs._1
|
where scname = sc ^. _lhs._1
|
||||||
|
|
||||||
-- | @checkCoreProgR p@ returns @p@ if @p@ successfully typechecks.
|
-- | @checkCoreProgR p@ returns @p@ if @p@ successfully typechecks.
|
||||||
checkCoreProgR :: Program' -> RLPC Program'
|
checkCoreProgR :: Program' -> RLPC RlpcError Program'
|
||||||
checkCoreProgR p = undefined
|
checkCoreProgR p = do
|
||||||
|
liftRlpcErrs . rlpc . checkCoreProg $ p
|
||||||
{-# WARNING checkCoreProgR "unimpl" #-}
|
pure p
|
||||||
|
|
||||||
-- | Infer the type of an expression under some context.
|
-- | Infer the type of an expression under some context.
|
||||||
--
|
--
|
||||||
@@ -157,32 +140,7 @@ gather = \g e -> runStateT (go g e) ([],0) <&> \ (t,(cs,_)) -> (t,cs) where
|
|||||||
Let NonRec bs e -> do
|
Let NonRec bs e -> do
|
||||||
g' <- buildLetContext g bs
|
g' <- buildLetContext g bs
|
||||||
go g' e
|
go g' e
|
||||||
Let Rec bs e -> do
|
-- TODO letrec, lambda, case
|
||||||
g' <- buildLetrecContext g bs
|
|
||||||
go g' e
|
|
||||||
Lam bs e -> case bs of
|
|
||||||
[x] -> do
|
|
||||||
tx <- uniqueVar
|
|
||||||
let g' = (x,tx) : g
|
|
||||||
te <- go g' e
|
|
||||||
pure (tx :-> te)
|
|
||||||
-- TODO lambda, case
|
|
||||||
|
|
||||||
buildLetrecContext :: Context' -> [Binding']
|
|
||||||
-> StateT ([Constraint], Int) HMError Context'
|
|
||||||
buildLetrecContext g bs = do
|
|
||||||
let f ag (k := _) = do
|
|
||||||
n <- uniqueVar
|
|
||||||
pure ((k,n) : ag)
|
|
||||||
rg <- foldM f g bs
|
|
||||||
let k ag (k := v) = do
|
|
||||||
t <- go rg v
|
|
||||||
pure ((k,t) : ag)
|
|
||||||
foldM k g bs
|
|
||||||
|
|
||||||
-- | augment a context with the inferred types of each binder. the returned
|
|
||||||
-- context is linearly accumulated, meaning that the context used to infer each binder
|
|
||||||
-- will include the inferred types of all previous binder
|
|
||||||
|
|
||||||
buildLetContext :: Context' -> [Binding']
|
buildLetContext :: Context' -> [Binding']
|
||||||
-> StateT ([Constraint], Int) HMError Context'
|
-> StateT ([Constraint], Int) HMError Context'
|
||||||
@@ -260,20 +218,3 @@ subst x t (TyVar y) | x == y = t
|
|||||||
subst x t (a :-> b) = subst x t a :-> subst x t b
|
subst x t (a :-> b) = subst x t a :-> subst x t b
|
||||||
subst _ _ e = e
|
subst _ _ e = e
|
||||||
|
|
||||||
--------------------------------------------------------------------------------
|
|
||||||
|
|
||||||
demoContext :: Context'
|
|
||||||
demoContext =
|
|
||||||
[ ("fix", (TyVar "a" :-> TyVar "a") :-> TyVar "a")
|
|
||||||
, ("add", TyInt :-> TyInt :-> TyInt)
|
|
||||||
, ("==", TyInt :-> TyInt :-> TyCon "Bool")
|
|
||||||
, ("True", TyCon "Bool")
|
|
||||||
, ("False", TyCon "Bool")
|
|
||||||
]
|
|
||||||
|
|
||||||
pprintType :: Type -> String
|
|
||||||
pprintType (s :-> t) = "(" <> pprintType s <> " -> " <> pprintType t <> ")"
|
|
||||||
pprintType TyFun = "(->)"
|
|
||||||
pprintType (TyVar x) = x ^. unpacked
|
|
||||||
pprintType (TyCon t) = t ^. unpacked
|
|
||||||
|
|
||||||
|
|||||||
@@ -65,8 +65,6 @@ $white_no_nl = $white # $nl
|
|||||||
|
|
||||||
@decimal = $digit+
|
@decimal = $digit+
|
||||||
|
|
||||||
@alttag = "<" $digit+ ">"
|
|
||||||
|
|
||||||
rlp :-
|
rlp :-
|
||||||
|
|
||||||
<0>
|
<0>
|
||||||
@@ -94,8 +92,6 @@ rlp :-
|
|||||||
"=" { constTok TokenEquals }
|
"=" { constTok TokenEquals }
|
||||||
"->" { constTok TokenArrow }
|
"->" { constTok TokenArrow }
|
||||||
|
|
||||||
@alttag { lexWith ( TokenAltTag . read @Int . T.unpack
|
|
||||||
. T.drop 1 . T.init ) }
|
|
||||||
@varname { lexWith TokenVarName }
|
@varname { lexWith TokenVarName }
|
||||||
@conname { lexWith TokenConName }
|
@conname { lexWith TokenConName }
|
||||||
@varsym { lexWith TokenVarSym }
|
@varsym { lexWith TokenVarSym }
|
||||||
@@ -107,6 +103,8 @@ rlp :-
|
|||||||
\n { skip }
|
\n { skip }
|
||||||
}
|
}
|
||||||
|
|
||||||
|
-- TODO: negative literals
|
||||||
|
|
||||||
<pragma>
|
<pragma>
|
||||||
{
|
{
|
||||||
"#-}" { constTok TokenRPragma `andBegin` 0 }
|
"#-}" { constTok TokenRPragma `andBegin` 0 }
|
||||||
@@ -139,7 +137,6 @@ data CoreToken = TokenLet
|
|||||||
| TokenConName Name
|
| TokenConName Name
|
||||||
| TokenVarSym Name
|
| TokenVarSym Name
|
||||||
| TokenConSym Name
|
| TokenConSym Name
|
||||||
| TokenAltTag Tag
|
|
||||||
| TokenEquals
|
| TokenEquals
|
||||||
| TokenLParen
|
| TokenLParen
|
||||||
| TokenRParen
|
| TokenRParen
|
||||||
@@ -172,19 +169,24 @@ lexWith :: (Text -> CoreToken) -> Lexer
|
|||||||
lexWith f (AlexPn _ y x,_,_,s) l = pure $ Located y x l (f $ T.take l s)
|
lexWith f (AlexPn _ y x,_,_,s) l = pure $ Located y x l (f $ T.take l s)
|
||||||
|
|
||||||
-- | The main lexer driver.
|
-- | The main lexer driver.
|
||||||
lexCore :: Text -> RLPC [Located CoreToken]
|
lexCore :: Text -> RLPC SrcError [Located CoreToken]
|
||||||
lexCore s = case m of
|
lexCore s = case m of
|
||||||
Left e -> error "core lex error"
|
Left e -> addFatal err
|
||||||
|
where err = SrcError
|
||||||
|
{ _errSpan = (0,0,0) -- TODO: location
|
||||||
|
, _errSeverity = Error
|
||||||
|
, _errDiagnostic = SrcErrLexical e
|
||||||
|
}
|
||||||
Right ts -> pure ts
|
Right ts -> pure ts
|
||||||
where
|
where
|
||||||
m = runAlex s lexStream
|
m = runAlex s lexStream
|
||||||
|
|
||||||
lexCoreR :: Text -> RLPC [Located CoreToken]
|
lexCoreR :: Text -> RLPC RlpcError [Located CoreToken]
|
||||||
lexCoreR = lexCore
|
lexCoreR = liftRlpcErrs . lexCore
|
||||||
|
|
||||||
-- | @lexCore@, but the tokens are stripped of location info. Useful for
|
-- | @lexCore@, but the tokens are stripped of location info. Useful for
|
||||||
-- debugging
|
-- debugging
|
||||||
lexCore' :: Text -> RLPC [CoreToken]
|
lexCore' :: Text -> RLPC SrcError [CoreToken]
|
||||||
lexCore' s = fmap f <$> lexCore s
|
lexCore' s = fmap f <$> lexCore s
|
||||||
where f (Located _ _ _ t) = t
|
where f (Located _ _ _ t) = t
|
||||||
|
|
||||||
@@ -201,11 +203,11 @@ data ParseError = ParErrLexical String
|
|||||||
|
|
||||||
-- TODO:
|
-- TODO:
|
||||||
instance IsRlpcError SrcError where
|
instance IsRlpcError SrcError where
|
||||||
liftRlpcError = Text . pure . T.pack . show
|
liftRlpcErr = RlpcErr . show
|
||||||
|
|
||||||
-- TODO:
|
-- TODO:
|
||||||
instance IsRlpcError ParseError where
|
instance IsRlpcError ParseError where
|
||||||
liftRlpcError = Text . pure . T.pack . show
|
liftRlpcErr = RlpcErr . show
|
||||||
|
|
||||||
alexEOF :: Alex (Located CoreToken)
|
alexEOF :: Alex (Located CoreToken)
|
||||||
alexEOF = Alex $ \ st@(AlexState { alex_pos = AlexPn _ y x }) ->
|
alexEOF = Alex $ \ st@(AlexState { alex_pos = AlexPn _ y x }) ->
|
||||||
|
|||||||
@@ -3,13 +3,14 @@
|
|||||||
Module : Core.Parse
|
Module : Core.Parse
|
||||||
Description : Parser for the Core language
|
Description : Parser for the Core language
|
||||||
-}
|
-}
|
||||||
{-# LANGUAGE OverloadedStrings, ViewPatterns #-}
|
{-# LANGUAGE OverloadedStrings #-}
|
||||||
module Core.Parse
|
module Core.Parse
|
||||||
( parseCore
|
( parseCore
|
||||||
, parseCoreExpr
|
, parseCoreExpr
|
||||||
, parseCoreProg
|
, parseCoreProg
|
||||||
, parseCoreProgR
|
, parseCoreProgR
|
||||||
, module Core.Lex -- temp convenience
|
, module Core.Lex -- temp convenience
|
||||||
|
, parseTmp
|
||||||
, SrcError
|
, SrcError
|
||||||
, Module
|
, Module
|
||||||
)
|
)
|
||||||
@@ -23,9 +24,7 @@ import Compiler.RLPC
|
|||||||
import Lens.Micro
|
import Lens.Micro
|
||||||
import Data.Default.Class (def)
|
import Data.Default.Class (def)
|
||||||
import Data.Hashable (Hashable)
|
import Data.Hashable (Hashable)
|
||||||
import Data.List.Extra
|
|
||||||
import Data.Text.IO qualified as TIO
|
import Data.Text.IO qualified as TIO
|
||||||
import Data.Text (Text)
|
|
||||||
import Data.Text qualified as T
|
import Data.Text qualified as T
|
||||||
import Data.HashMap.Strict qualified as H
|
import Data.HashMap.Strict qualified as H
|
||||||
}
|
}
|
||||||
@@ -35,7 +34,7 @@ import Data.HashMap.Strict qualified as H
|
|||||||
%name parseCoreProg StandaloneProgram
|
%name parseCoreProg StandaloneProgram
|
||||||
%tokentype { Located CoreToken }
|
%tokentype { Located CoreToken }
|
||||||
%error { parseError }
|
%error { parseError }
|
||||||
%monad { RLPC } { happyBind } { happyPure }
|
%monad { RLPC SrcError }
|
||||||
|
|
||||||
%token
|
%token
|
||||||
let { Located _ _ _ TokenLet }
|
let { Located _ _ _ TokenLet }
|
||||||
@@ -51,7 +50,6 @@ import Data.HashMap.Strict qualified as H
|
|||||||
varsym { Located _ _ _ (TokenVarSym $$) }
|
varsym { Located _ _ _ (TokenVarSym $$) }
|
||||||
conname { Located _ _ _ (TokenConName $$) }
|
conname { Located _ _ _ (TokenConName $$) }
|
||||||
consym { Located _ _ _ (TokenConSym $$) }
|
consym { Located _ _ _ (TokenConSym $$) }
|
||||||
alttag { Located _ _ _ (TokenAltTag $$) }
|
|
||||||
word { Located _ _ _ (TokenWord $$) }
|
word { Located _ _ _ (TokenWord $$) }
|
||||||
'λ' { Located _ _ _ TokenLambda }
|
'λ' { Located _ _ _ TokenLambda }
|
||||||
'->' { Located _ _ _ TokenArrow }
|
'->' { Located _ _ _ TokenArrow }
|
||||||
@@ -79,21 +77,13 @@ Eof : eof { () }
|
|||||||
|
|
||||||
StandaloneProgram :: { Program Name }
|
StandaloneProgram :: { Program Name }
|
||||||
StandaloneProgram : Program eof { $1 }
|
StandaloneProgram : Program eof { $1 }
|
||||||
|
| eof { mempty }
|
||||||
|
|
||||||
Program :: { Program Name }
|
Program :: { Program Name }
|
||||||
Program : ScTypeSig ';' Program { insTypeSig $1 $3 }
|
Program : ScTypeSig ';' Program { insTypeSig $1 $3 }
|
||||||
| ScTypeSig OptSemi { singletonTypeSig $1 }
|
| ScTypeSig OptSemi { singletonTypeSig $1 }
|
||||||
| ScDef ';' Program { insScDef $1 $3 }
|
| ScDef ';' Program { insScDef $1 $3 }
|
||||||
| ScDef OptSemi { singletonScDef $1 }
|
| ScDef OptSemi { singletonScDef $1 }
|
||||||
| TLPragma Program {% doTLPragma $1 $2 }
|
|
||||||
| TLPragma {% doTLPragma $1 mempty }
|
|
||||||
|
|
||||||
TLPragma :: { Pragma }
|
|
||||||
: '{-#' Words '#-}' { Pragma $2 }
|
|
||||||
|
|
||||||
Words :: { [Text] }
|
|
||||||
: Words word { $1 `snoc` $2 }
|
|
||||||
| word { [$1] }
|
|
||||||
|
|
||||||
OptSemi :: { () }
|
OptSemi :: { () }
|
||||||
OptSemi : ';' { () }
|
OptSemi : ';' { () }
|
||||||
@@ -106,11 +96,10 @@ ScDefs :: { [ScDef Name] }
|
|||||||
ScDefs : ScDef ';' ScDefs { $1 : $3 }
|
ScDefs : ScDef ';' ScDefs { $1 : $3 }
|
||||||
| ScDef ';' { [$1] }
|
| ScDef ';' { [$1] }
|
||||||
| ScDef { [$1] }
|
| ScDef { [$1] }
|
||||||
|
| {- epsilon -} { [] }
|
||||||
|
|
||||||
ScDef :: { ScDef Name }
|
ScDef :: { ScDef Name }
|
||||||
ScDef : Var ParList '=' Expr { ScDef $1 $2 $4 }
|
ScDef : Var ParList '=' Expr { ScDef $1 $2 $4 }
|
||||||
-- hack to allow constructors to be compiled into scs
|
|
||||||
| Con ParList '=' Expr { ScDef $1 $2 $4 }
|
|
||||||
|
|
||||||
Type :: { Type }
|
Type :: { Type }
|
||||||
Type : Type1 { $1 }
|
Type : Type1 { $1 }
|
||||||
@@ -159,16 +148,24 @@ Alters : Alter ';' Alters { $1 : $3 }
|
|||||||
| Alter ';' { [$1] }
|
| Alter ';' { [$1] }
|
||||||
| Alter { [$1] }
|
| Alter { [$1] }
|
||||||
|
|
||||||
|
-- TODO: tags should be wrapped in <n> to allow matching against literals
|
||||||
Alter :: { Alter Name }
|
Alter :: { Alter Name }
|
||||||
Alter : alttag ParList '->' Expr { Alter (AltTag $1) $2 $4 }
|
Alter : litint ParList '->' Expr { Alter (AltData $1) $2 $4 }
|
||||||
| Con ParList '->' Expr { Alter (AltData $1) $2 $4 }
|
|
||||||
|
|
||||||
Expr1 :: { Expr Name }
|
Expr1 :: { Expr Name }
|
||||||
Expr1 : litint { Lit $ IntL $1 }
|
Expr1 : litint { Lit $ IntL $1 }
|
||||||
| Id { Var $1 }
|
| Id { Var $1 }
|
||||||
| PackCon { $1 }
|
| PackCon { $1 }
|
||||||
|
| ExprPragma { $1 }
|
||||||
| '(' Expr ')' { $2 }
|
| '(' Expr ')' { $2 }
|
||||||
|
|
||||||
|
ExprPragma :: { Expr Name }
|
||||||
|
ExprPragma : '{-#' Words '#-}' {% exprPragma $2 }
|
||||||
|
|
||||||
|
Words :: { [String] }
|
||||||
|
Words : word Words { T.unpack $1 : $2 }
|
||||||
|
| word { [T.unpack $1] }
|
||||||
|
|
||||||
PackCon :: { Expr Name }
|
PackCon :: { Expr Name }
|
||||||
PackCon : pack '{' litint litint '}' { Con $3 $4 }
|
PackCon : pack '{' litint litint '}' { Con $3 $4 }
|
||||||
|
|
||||||
@@ -194,23 +191,34 @@ Con : '(' consym ')' { $2 }
|
|||||||
|
|
||||||
{
|
{
|
||||||
|
|
||||||
parseError :: [Located CoreToken] -> RLPC a
|
parseError :: [Located CoreToken] -> RLPC SrcError a
|
||||||
parseError (Located y x l t : _) =
|
parseError (Located y x l _ : _) = addFatal err
|
||||||
error $ show y <> ":" <> show x
|
where err = SrcError
|
||||||
<> ": parse error at token `" <> show t <> "'"
|
{ _errSpan = (y,x,l)
|
||||||
|
, _errSeverity = Error
|
||||||
|
, _errDiagnostic = SrcErrParse
|
||||||
|
}
|
||||||
|
|
||||||
{-# WARNING parseError "unimpl" #-}
|
parseTmp :: IO (Module Name)
|
||||||
|
parseTmp = do
|
||||||
|
s <- TIO.readFile "/tmp/t.hs"
|
||||||
|
case parse s of
|
||||||
|
Left e -> error (show e)
|
||||||
|
Right (ts,_) -> pure ts
|
||||||
|
where
|
||||||
|
parse = evalRLPC def . (lexCore >=> parseCore)
|
||||||
|
|
||||||
exprPragma :: [String] -> RLPC (Expr Name)
|
exprPragma :: [String] -> RLPC SrcError (Expr Name)
|
||||||
exprPragma ("AST" : e) = undefined
|
exprPragma ("AST" : e) = astPragma e
|
||||||
exprPragma _ = undefined
|
exprPragma _ = addFatal err
|
||||||
|
where err = SrcError
|
||||||
|
{ _errSpan = (0,0,0) -- TODO: span
|
||||||
|
, _errSeverity = Warning
|
||||||
|
, _errDiagnostic = SrcErrUnknownPragma "" -- TODO: missing pragma
|
||||||
|
}
|
||||||
|
|
||||||
{-# WARNING exprPragma "unimpl" #-}
|
astPragma :: [String] -> RLPC SrcError (Expr Name)
|
||||||
|
astPragma = pure . read . unwords
|
||||||
astPragma :: [String] -> RLPC (Expr Name)
|
|
||||||
astPragma _ = undefined
|
|
||||||
|
|
||||||
{-# WARNING astPragma "unimpl" #-}
|
|
||||||
|
|
||||||
insTypeSig :: (Hashable b) => (b, Type) -> Program b -> Program b
|
insTypeSig :: (Hashable b) => (b, Type) -> Program b -> Program b
|
||||||
insTypeSig ts = programTypeSigs %~ uncurry H.insert ts
|
insTypeSig ts = programTypeSigs %~ uncurry H.insert ts
|
||||||
@@ -224,26 +232,8 @@ insScDef sc = programScDefs %~ (sc:)
|
|||||||
singletonScDef :: (Hashable b) => ScDef b -> Program b
|
singletonScDef :: (Hashable b) => ScDef b -> Program b
|
||||||
singletonScDef sc = insScDef sc mempty
|
singletonScDef sc = insScDef sc mempty
|
||||||
|
|
||||||
parseCoreProgR :: [Located CoreToken] -> RLPC Program'
|
parseCoreProgR :: [Located CoreToken] -> RLPC RlpcError Program'
|
||||||
parseCoreProgR = parseCoreProg
|
parseCoreProgR = liftRlpcErrs . parseCoreProg
|
||||||
|
|
||||||
happyBind :: RLPC a -> (a -> RLPC b) -> RLPC b
|
|
||||||
happyBind m k = m >>= k
|
|
||||||
|
|
||||||
happyPure :: a -> RLPC a
|
|
||||||
happyPure a = pure a
|
|
||||||
|
|
||||||
doTLPragma :: Pragma -> Program' -> RLPC Program'
|
|
||||||
-- TODO: warn unrecognised pragma
|
|
||||||
doTLPragma (Pragma []) p = pure p
|
|
||||||
|
|
||||||
doTLPragma (Pragma pr) p = case pr of
|
|
||||||
-- TODO: warn on overwrite
|
|
||||||
["PackData", n, readt -> t, readt -> a] ->
|
|
||||||
pure $ p & programDataTags . at n ?~ (t,a)
|
|
||||||
|
|
||||||
readt :: (Read a) => Text -> a
|
|
||||||
readt = read . T.unpack
|
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|||||||
@@ -5,14 +5,8 @@ Description : Core ASTs and the like
|
|||||||
{-# LANGUAGE PatternSynonyms, OverloadedStrings #-}
|
{-# LANGUAGE PatternSynonyms, OverloadedStrings #-}
|
||||||
{-# LANGUAGE FunctionalDependencies #-}
|
{-# LANGUAGE FunctionalDependencies #-}
|
||||||
{-# LANGUAGE TemplateHaskell #-}
|
{-# LANGUAGE TemplateHaskell #-}
|
||||||
{-# LANGUAGE DerivingStrategies, DerivingVia #-}
|
|
||||||
-- for recursion-schemes
|
|
||||||
{-# LANGUAGE DeriveFunctor, DeriveFoldable, DeriveTraversable
|
|
||||||
, TemplateHaskell, TypeFamilies #-}
|
|
||||||
module Core.Syntax
|
module Core.Syntax
|
||||||
( Expr(..)
|
( Expr(..)
|
||||||
, ExprF(..)
|
|
||||||
, ExprF'(..)
|
|
||||||
, Type(..)
|
, Type(..)
|
||||||
, pattern TyInt
|
, pattern TyInt
|
||||||
, Lit(..)
|
, Lit(..)
|
||||||
@@ -30,11 +24,9 @@ module Core.Syntax
|
|||||||
, Module(..)
|
, Module(..)
|
||||||
, Program(..)
|
, Program(..)
|
||||||
, Program'
|
, Program'
|
||||||
, Pragma(..)
|
|
||||||
, unliftScDef
|
, unliftScDef
|
||||||
, programScDefs
|
, programScDefs
|
||||||
, programTypeSigs
|
, programTypeSigs
|
||||||
, programDataTags
|
|
||||||
, Expr'
|
, Expr'
|
||||||
, ScDef'
|
, ScDef'
|
||||||
, Alter'
|
, Alter'
|
||||||
@@ -48,15 +40,11 @@ import Data.Coerce
|
|||||||
import Data.Pretty
|
import Data.Pretty
|
||||||
import Data.List (intersperse)
|
import Data.List (intersperse)
|
||||||
import Data.Function ((&))
|
import Data.Function ((&))
|
||||||
import Data.Functor.Foldable
|
|
||||||
import Data.Functor.Foldable.TH (makeBaseFunctor)
|
|
||||||
import Data.String
|
import Data.String
|
||||||
import Data.HashMap.Strict (HashMap)
|
|
||||||
import Data.HashMap.Strict qualified as H
|
import Data.HashMap.Strict qualified as H
|
||||||
import Data.Hashable
|
import Data.Hashable
|
||||||
import Data.Text qualified as T
|
import Data.Text qualified as T
|
||||||
import Data.Char
|
import Data.Char
|
||||||
import GHC.Generics
|
|
||||||
-- Lift instances for the Core quasiquoters
|
-- Lift instances for the Core quasiquoters
|
||||||
import Language.Haskell.TH.Syntax (Lift)
|
import Language.Haskell.TH.Syntax (Lift)
|
||||||
import Lens.Micro.TH (makeLenses)
|
import Lens.Micro.TH (makeLenses)
|
||||||
@@ -70,9 +58,9 @@ data Expr b = Var Name
|
|||||||
| Let Rec [Binding b] (Expr b)
|
| Let Rec [Binding b] (Expr b)
|
||||||
| App (Expr b) (Expr b)
|
| App (Expr b) (Expr b)
|
||||||
| Lit Lit
|
| Lit Lit
|
||||||
deriving (Show, Read, Lift)
|
deriving (Show, Eq, Read, Lift)
|
||||||
|
|
||||||
deriving instance (Eq b) => Eq (Expr b)
|
-- deriving instance (Eq b) => Eq (Expr b)
|
||||||
|
|
||||||
data Type = TyFun
|
data Type = TyFun
|
||||||
| TyVar Name
|
| TyVar Name
|
||||||
@@ -98,27 +86,20 @@ pattern a :-> b = TyApp (TyApp TyFun a) b
|
|||||||
{-# COMPLETE Binding :: Binding #-}
|
{-# COMPLETE Binding :: Binding #-}
|
||||||
{-# COMPLETE (:=) :: Binding #-}
|
{-# COMPLETE (:=) :: Binding #-}
|
||||||
data Binding b = Binding b (Expr b)
|
data Binding b = Binding b (Expr b)
|
||||||
deriving (Show, Read, Lift)
|
deriving (Show, Read, Eq, Lift)
|
||||||
|
|
||||||
deriving instance (Eq b) => Eq (Binding b)
|
|
||||||
|
|
||||||
infixl 1 :=
|
infixl 1 :=
|
||||||
pattern (:=) :: b -> (Expr b) -> (Binding b)
|
pattern (:=) :: b -> (Expr b) -> (Binding b)
|
||||||
pattern k := v = Binding k v
|
pattern k := v = Binding k v
|
||||||
|
|
||||||
data Alter b = Alter AltCon [b] (Expr b)
|
data Alter b = Alter AltCon [b] (Expr b)
|
||||||
deriving (Show, Read, Lift)
|
deriving (Show, Read, Eq, Lift)
|
||||||
|
|
||||||
deriving instance (Eq b) => Eq (Alter b)
|
|
||||||
|
|
||||||
newtype Pragma = Pragma [T.Text]
|
|
||||||
|
|
||||||
data Rec = Rec
|
data Rec = Rec
|
||||||
| NonRec
|
| NonRec
|
||||||
deriving (Show, Read, Eq, Lift)
|
deriving (Show, Read, Eq, Lift)
|
||||||
|
|
||||||
data AltCon = AltData Name
|
data AltCon = AltData Tag
|
||||||
| AltTag Tag
|
|
||||||
| AltLit Lit
|
| AltLit Lit
|
||||||
| Default
|
| Default
|
||||||
deriving (Show, Read, Eq, Lift)
|
deriving (Show, Read, Eq, Lift)
|
||||||
@@ -130,7 +111,7 @@ type Name = T.Text
|
|||||||
type Tag = Int
|
type Tag = Int
|
||||||
|
|
||||||
data ScDef b = ScDef b [b] (Expr b)
|
data ScDef b = ScDef b [b] (Expr b)
|
||||||
deriving (Show, Lift)
|
deriving (Show, Eq, Lift)
|
||||||
|
|
||||||
unliftScDef :: ScDef b -> Expr b
|
unliftScDef :: ScDef b -> Expr b
|
||||||
unliftScDef (ScDef _ as e) = Lam as e
|
unliftScDef (ScDef _ as e) = Lam as e
|
||||||
@@ -140,20 +121,13 @@ data Module b = Module (Maybe (Name, [Name])) (Program b)
|
|||||||
|
|
||||||
data Program b = Program
|
data Program b = Program
|
||||||
{ _programScDefs :: [ScDef b]
|
{ _programScDefs :: [ScDef b]
|
||||||
, _programTypeSigs :: HashMap b Type
|
, _programTypeSigs :: H.HashMap b Type
|
||||||
-- map constructors to their tag and arity
|
|
||||||
, _programDataTags :: HashMap b (Tag, Int)
|
|
||||||
}
|
}
|
||||||
deriving (Show, Lift, Generic)
|
deriving (Show, Eq, Lift)
|
||||||
deriving (Semigroup, Monoid)
|
|
||||||
via Generically (Program b)
|
|
||||||
|
|
||||||
makeLenses ''Program
|
makeLenses ''Program
|
||||||
makeBaseFunctor ''Expr
|
|
||||||
pure []
|
pure []
|
||||||
|
|
||||||
type ExprF' = ExprF Name
|
|
||||||
|
|
||||||
type Program' = Program Name
|
type Program' = Program Name
|
||||||
type Expr' = Expr Name
|
type Expr' = Expr Name
|
||||||
type ScDef' = ScDef Name
|
type ScDef' = ScDef Name
|
||||||
@@ -170,6 +144,12 @@ instance IsString Type where
|
|||||||
| otherwise = TyVar . fromString $ s
|
| otherwise = TyVar . fromString $ s
|
||||||
where (c:_) = s
|
where (c:_) = s
|
||||||
|
|
||||||
|
instance (Hashable b) => Semigroup (Program b) where
|
||||||
|
(<>) = undefined
|
||||||
|
|
||||||
|
instance (Hashable b) => Monoid (Program b) where
|
||||||
|
mempty = Program mempty mempty
|
||||||
|
|
||||||
----------------------------------------------------------------------------------
|
----------------------------------------------------------------------------------
|
||||||
|
|
||||||
class HasRHS s t a b | s -> a, t -> b, s b -> t, t a -> s where
|
class HasRHS s t a b | s -> a, t -> b, s b -> t, t a -> s where
|
||||||
@@ -203,8 +183,3 @@ instance HasLHS (ScDef b) (ScDef b) (b, [b]) (b, [b]) where
|
|||||||
(\ (ScDef n as _) -> (n,as))
|
(\ (ScDef n as _) -> (n,as))
|
||||||
(\ (ScDef _ _ e) (n',as') -> (ScDef n' as' e))
|
(\ (ScDef _ _ e) (n',as') -> (ScDef n' as' e))
|
||||||
|
|
||||||
instance HasLHS (Binding b) (Binding b) b b where
|
|
||||||
_lhs = lens
|
|
||||||
(\ (k := _) -> k)
|
|
||||||
(\ (_ := e) k' -> k' := e)
|
|
||||||
|
|
||||||
|
|||||||
@@ -6,6 +6,7 @@ module Core.TH
|
|||||||
( coreExpr
|
( coreExpr
|
||||||
, coreProg
|
, coreProg
|
||||||
, coreProgT
|
, coreProgT
|
||||||
|
, core
|
||||||
)
|
)
|
||||||
where
|
where
|
||||||
----------------------------------------------------------------------------------
|
----------------------------------------------------------------------------------
|
||||||
@@ -13,38 +14,74 @@ import Language.Haskell.TH
|
|||||||
import Language.Haskell.TH.Syntax hiding (Module)
|
import Language.Haskell.TH.Syntax hiding (Module)
|
||||||
import Language.Haskell.TH.Quote
|
import Language.Haskell.TH.Quote
|
||||||
import Control.Monad ((>=>))
|
import Control.Monad ((>=>))
|
||||||
import Control.Monad.IO.Class
|
|
||||||
import Control.Arrow ((>>>))
|
|
||||||
import Compiler.RLPC
|
import Compiler.RLPC
|
||||||
import Data.Default.Class (def)
|
import Data.Default.Class (def)
|
||||||
import Data.Text (Text)
|
|
||||||
import Data.Text qualified as T
|
import Data.Text qualified as T
|
||||||
import Core.Parse
|
import Core.Parse
|
||||||
import Core.Lex
|
import Core.Lex
|
||||||
import Core.Syntax
|
|
||||||
import Core.HindleyMilner (checkCoreProgR)
|
import Core.HindleyMilner (checkCoreProgR)
|
||||||
----------------------------------------------------------------------------------
|
----------------------------------------------------------------------------------
|
||||||
|
|
||||||
coreProg :: QuasiQuoter
|
-- TODO: write in terms of a String -> QuasiQuoter
|
||||||
coreProg = mkqq $ lexCoreR >=> parseCoreProgR
|
|
||||||
|
|
||||||
coreExpr :: QuasiQuoter
|
core :: QuasiQuoter
|
||||||
coreExpr = mkqq $ lexCoreR >=> parseCoreExpr
|
core = QuasiQuoter
|
||||||
|
{ quoteExp = qCore
|
||||||
-- | Type-checked @coreProg@
|
|
||||||
coreProgT :: QuasiQuoter
|
|
||||||
coreProgT = mkqq $ lexCoreR >=> parseCoreProgR >=> checkCoreProgR
|
|
||||||
|
|
||||||
mkqq :: (Lift a) => (Text -> RLPC a) -> QuasiQuoter
|
|
||||||
mkqq p = QuasiQuoter
|
|
||||||
{ quoteExp = mkq p
|
|
||||||
, quotePat = error "core quasiquotes may only be used in expressions"
|
, quotePat = error "core quasiquotes may only be used in expressions"
|
||||||
, quoteType = error "core quasiquotes may only be used in expressions"
|
, quoteType = error "core quasiquotes may only be used in expressions"
|
||||||
, quoteDec = error "core quasiquotes may only be used in expressions"
|
, quoteDec = error "core quasiquotes may only be used in expressions"
|
||||||
}
|
}
|
||||||
|
|
||||||
mkq :: (Lift a) => (Text -> RLPC a) -> String -> Q Exp
|
coreProg :: QuasiQuoter
|
||||||
mkq parse s = case evalRLPC def (parse $ T.pack s) of
|
coreProg = QuasiQuoter
|
||||||
(Just a, _) -> lift a
|
{ quoteExp = qCoreProg
|
||||||
(Nothing, _) -> error "todo: aaahhbbhjhbdjhabsjh"
|
, quotePat = error "core quasiquotes may only be used in expressions"
|
||||||
|
, quoteType = error "core quasiquotes may only be used in expressions"
|
||||||
|
, quoteDec = error "core quasiquotes may only be used in expressions"
|
||||||
|
}
|
||||||
|
|
||||||
|
coreExpr :: QuasiQuoter
|
||||||
|
coreExpr = QuasiQuoter
|
||||||
|
{ quoteExp = qCoreExpr
|
||||||
|
, quotePat = error "core quasiquotes may only be used in expressions"
|
||||||
|
, quoteType = error "core quasiquotes may only be used in expressions"
|
||||||
|
, quoteDec = error "core quasiquotes may only be used in expressions"
|
||||||
|
}
|
||||||
|
|
||||||
|
-- | Type-checked @coreProg@
|
||||||
|
coreProgT :: QuasiQuoter
|
||||||
|
coreProgT = QuasiQuoter
|
||||||
|
{ quoteExp = qCoreProgT
|
||||||
|
, quotePat = error "core quasiquotes may only be used in expressions"
|
||||||
|
, quoteType = error "core quasiquotes may only be used in expressions"
|
||||||
|
, quoteDec = error "core quasiquotes may only be used in expressions"
|
||||||
|
}
|
||||||
|
|
||||||
|
qCore :: String -> Q Exp
|
||||||
|
qCore s = case parse (T.pack s) of
|
||||||
|
Left e -> error (show e)
|
||||||
|
Right (m,ts) -> lift m
|
||||||
|
where
|
||||||
|
parse = evalRLPC def . (lexCore >=> parseCore)
|
||||||
|
|
||||||
|
qCoreExpr :: String -> Q Exp
|
||||||
|
qCoreExpr s = case parseExpr (T.pack s) of
|
||||||
|
Left e -> error (show e)
|
||||||
|
Right (m,ts) -> lift m
|
||||||
|
where
|
||||||
|
parseExpr = evalRLPC def . (lexCore >=> parseCoreExpr)
|
||||||
|
|
||||||
|
qCoreProg :: String -> Q Exp
|
||||||
|
qCoreProg s = case parse (T.pack s) of
|
||||||
|
Left e -> error (show e)
|
||||||
|
Right (m,ts) -> lift m
|
||||||
|
where
|
||||||
|
parse = evalRLPC def . (lexCoreR >=> parseCoreProgR)
|
||||||
|
|
||||||
|
qCoreProgT :: String -> Q Exp
|
||||||
|
qCoreProgT s = case parse (T.pack s) of
|
||||||
|
Left e -> error (show e)
|
||||||
|
Right (m,_) -> lift m
|
||||||
|
where
|
||||||
|
parse = evalRLPC def . (lexCoreR >=> parseCoreProgR >=> checkCoreProgR)
|
||||||
|
|
||||||
|
|||||||
@@ -1,10 +1,16 @@
|
|||||||
|
-- for recursion schemes
|
||||||
|
{-# LANGUAGE DeriveFunctor, DeriveFoldable, DeriveTraversable #-}
|
||||||
|
-- for recursion schemes
|
||||||
|
{-# LANGUAGE TemplateHaskell, TypeFamilies #-}
|
||||||
|
|
||||||
module Core.Utils
|
module Core.Utils
|
||||||
( programRhss
|
( bindersOf
|
||||||
, programGlobals
|
, rhssOf
|
||||||
, isAtomic
|
, isAtomic
|
||||||
-- , insertModule
|
-- , insertModule
|
||||||
, extractProgram
|
, extractProgram
|
||||||
, freeVariables
|
, freeVariables
|
||||||
|
, ExprF(..)
|
||||||
)
|
)
|
||||||
where
|
where
|
||||||
----------------------------------------------------------------------------------
|
----------------------------------------------------------------------------------
|
||||||
@@ -17,11 +23,13 @@ import Lens.Micro
|
|||||||
import GHC.Exts (IsList(..))
|
import GHC.Exts (IsList(..))
|
||||||
----------------------------------------------------------------------------------
|
----------------------------------------------------------------------------------
|
||||||
|
|
||||||
programGlobals :: Traversal' (Program b) b
|
bindersOf :: (IsList l, Item l ~ b) => [Binding b] -> l
|
||||||
programGlobals = programScDefs . each . _lhs . _1
|
bindersOf bs = fromList $ fmap f bs
|
||||||
|
where f (k := _) = k
|
||||||
|
|
||||||
programRhss :: Traversal' (Program b) (Expr b)
|
rhssOf :: (IsList l, Item l ~ Expr b) => [Binding b] -> l
|
||||||
programRhss = programScDefs . each . _rhs
|
rhssOf = fromList . fmap f
|
||||||
|
where f (_ := v) = v
|
||||||
|
|
||||||
isAtomic :: Expr b -> Bool
|
isAtomic :: Expr b -> Bool
|
||||||
isAtomic (Var _) = True
|
isAtomic (Var _) = True
|
||||||
@@ -39,6 +47,8 @@ extractProgram (Module _ p) = p
|
|||||||
|
|
||||||
----------------------------------------------------------------------------------
|
----------------------------------------------------------------------------------
|
||||||
|
|
||||||
|
makeBaseFunctor ''Expr
|
||||||
|
|
||||||
freeVariables :: Expr' -> Set Name
|
freeVariables :: Expr' -> Set Name
|
||||||
freeVariables = cata go
|
freeVariables = cata go
|
||||||
where
|
where
|
||||||
@@ -47,8 +57,8 @@ freeVariables = cata go
|
|||||||
-- TODO: collect free vars in rhss of bs
|
-- TODO: collect free vars in rhss of bs
|
||||||
go (LetF _ bs e) = (e `S.union` esFree) `S.difference` ns
|
go (LetF _ bs e) = (e `S.union` esFree) `S.difference` ns
|
||||||
where
|
where
|
||||||
es = bs ^.. each . _rhs :: [Expr']
|
es = rhssOf bs :: [Expr']
|
||||||
ns = S.fromList $ bs ^.. each . _lhs
|
ns = bindersOf bs
|
||||||
-- TODO: this feels a little wrong. maybe a different scheme is
|
-- TODO: this feels a little wrong. maybe a different scheme is
|
||||||
-- appropriate
|
-- appropriate
|
||||||
esFree = foldMap id $ freeVariables <$> es
|
esFree = foldMap id $ freeVariables <$> es
|
||||||
|
|||||||
@@ -1,4 +1,3 @@
|
|||||||
{-# LANGUAGE ImplicitParams #-}
|
|
||||||
{-# LANGUAGE LambdaCase #-}
|
{-# LANGUAGE LambdaCase #-}
|
||||||
module Core2Core
|
module Core2Core
|
||||||
( core2core
|
( core2core
|
||||||
@@ -16,12 +15,11 @@ import Data.Set (Set)
|
|||||||
import Data.Set qualified as S
|
import Data.Set qualified as S
|
||||||
import Data.List
|
import Data.List
|
||||||
import Control.Monad.Writer
|
import Control.Monad.Writer
|
||||||
import Control.Monad.State.Lazy
|
import Control.Monad.State
|
||||||
import Control.Arrow ((>>>))
|
import Control.Arrow ((>>>))
|
||||||
import Data.Text qualified as T
|
import Data.Text qualified as T
|
||||||
import Data.HashMap.Strict (HashMap)
|
|
||||||
import Numeric (showHex)
|
import Numeric (showHex)
|
||||||
import Lens.Micro.Platform
|
import Lens.Micro
|
||||||
import Core.Syntax
|
import Core.Syntax
|
||||||
import Core.Utils
|
import Core.Utils
|
||||||
----------------------------------------------------------------------------------
|
----------------------------------------------------------------------------------
|
||||||
@@ -30,35 +28,22 @@ core2core :: Program' -> Program'
|
|||||||
core2core p = undefined
|
core2core p = undefined
|
||||||
|
|
||||||
gmPrep :: Program' -> Program'
|
gmPrep :: Program' -> Program'
|
||||||
gmPrep p = p & appFloater (floatNonStrictCases globals)
|
gmPrep p = p' & programScDefs %~ (<>caseScs)
|
||||||
& tagData
|
|
||||||
where
|
where
|
||||||
|
rhss :: Applicative f => (Expr z -> f (Expr z)) -> Program z -> f (Program z)
|
||||||
|
rhss = programScDefs . each . _rhs
|
||||||
globals = p ^.. programScDefs . each . _lhs . _1
|
globals = p ^.. programScDefs . each . _lhs . _1
|
||||||
& S.fromList
|
& S.fromList
|
||||||
|
|
||||||
tagData :: Program' -> Program'
|
-- i kinda don't like that we're calling floatNonStrictCases twice tbh
|
||||||
tagData p = let ?dt = p ^. programDataTags
|
p' = p & rhss %~ fst . runFloater . floatNonStrictCases globals
|
||||||
in p & programRhss %~ cata go where
|
caseScs = (p ^.. rhss)
|
||||||
go :: (?dt :: HashMap Name (Tag, Int)) => ExprF' Expr' -> Expr'
|
<&> snd . runFloater . floatNonStrictCases globals
|
||||||
go (CaseF e as) = Case e (tagAlts <$> as)
|
& mconcat
|
||||||
go x = embed x
|
|
||||||
|
|
||||||
tagAlts :: (?dt :: HashMap Name (Tag, Int)) => Alter' -> Alter'
|
|
||||||
tagAlts (Alter (AltData c) bs e) = Alter (AltTag tag) bs e
|
|
||||||
where tag = case ?dt ^. at c of
|
|
||||||
Just (t,_) -> t
|
|
||||||
-- TODO: errorful
|
|
||||||
Nothing -> error $ "unknown constructor " <> show c
|
|
||||||
tagAlts x = x
|
|
||||||
|
|
||||||
-- | Auxilary type used in @floatNonSrictCases@
|
-- | Auxilary type used in @floatNonSrictCases@
|
||||||
type Floater = StateT [Name] (Writer [ScDef'])
|
type Floater = StateT [Name] (Writer [ScDef'])
|
||||||
|
|
||||||
appFloater :: (Expr' -> Floater Expr') -> Program' -> Program'
|
|
||||||
appFloater fl p = p & traverseOf programRhss fl
|
|
||||||
& runFloater
|
|
||||||
& \ (me,floats) -> me & programScDefs %~ (<>floats)
|
|
||||||
|
|
||||||
runFloater :: Floater a -> (a, [ScDef'])
|
runFloater :: Floater a -> (a, [ScDef'])
|
||||||
runFloater = flip evalStateT ns >>> runWriter
|
runFloater = flip evalStateT ns >>> runWriter
|
||||||
where
|
where
|
||||||
|
|||||||
@@ -661,8 +661,7 @@ buildInitialHeap (view programScDefs -> ss) = mapAccumL allocateSc mempty compil
|
|||||||
compileC _ (Con t n) = [PushConstr t n]
|
compileC _ (Con t n) = [PushConstr t n]
|
||||||
|
|
||||||
compileC _ (Case _ _) =
|
compileC _ (Case _ _) =
|
||||||
error "GM compiler found a non-strict case expression, which should\
|
error "case expressions may not appear in non-strict contexts :/"
|
||||||
\ have been floated by Core2Core.gmPrep. This is a bug!"
|
|
||||||
|
|
||||||
compileC _ _ = error "yet to be implemented!"
|
compileC _ _ = error "yet to be implemented!"
|
||||||
|
|
||||||
@@ -725,16 +724,12 @@ buildInitialHeap (view programScDefs -> ss) = mapAccumL allocateSc mempty compil
|
|||||||
compileD g as = fmap (compileA g) as
|
compileD g as = fmap (compileA g) as
|
||||||
|
|
||||||
compileA :: Env -> Alter' -> (Tag, Code)
|
compileA :: Env -> Alter' -> (Tag, Code)
|
||||||
compileA g (Alter (AltTag t) as e) = (t, [Split n] <> c <> [Slide n])
|
compileA g (Alter (AltData t) as e) = (t, [Split n] <> c <> [Slide n])
|
||||||
where
|
where
|
||||||
n = length as
|
n = length as
|
||||||
binds = (NameKey <$> as) `zip` [0..]
|
binds = (NameKey <$> as) `zip` [0..]
|
||||||
g' = binds ++ argOffset n g
|
g' = binds ++ argOffset n g
|
||||||
c = compileE g' e
|
c = compileE g' e
|
||||||
compileA _ (Alter _ as e) = error "GM.compileA found an untagged\
|
|
||||||
\ constructor, which should have\
|
|
||||||
\ been handled by Core2Core.gmPrep.\
|
|
||||||
\ This is a bug!"
|
|
||||||
|
|
||||||
inlineOp1 :: Env -> Instr -> Expr' -> Code
|
inlineOp1 :: Env -> Instr -> Expr' -> Code
|
||||||
inlineOp1 g i a = compileE g a <> [i]
|
inlineOp1 g i a = compileE g a <> [i]
|
||||||
|
|||||||
59
src/RLP/Syntax.hs
Normal file
59
src/RLP/Syntax.hs
Normal file
@@ -0,0 +1,59 @@
|
|||||||
|
{-# LANGUAGE OverloadedStrings #-}
|
||||||
|
module RLP.Syntax
|
||||||
|
( RlpExpr
|
||||||
|
)
|
||||||
|
where
|
||||||
|
----------------------------------------------------------------------------------
|
||||||
|
import Data.Text (Text)
|
||||||
|
import Lens.Micro
|
||||||
|
import Core (HasRHS(..), HasLHS(..))
|
||||||
|
----------------------------------------------------------------------------------
|
||||||
|
|
||||||
|
newtype RlpProgram b = RlpProgram [Decl b]
|
||||||
|
|
||||||
|
data Decl b = InfixD InfixAssoc Int VarId
|
||||||
|
| FunD VarId [Pat b] (RlpExpr b)
|
||||||
|
| DataD ConId [ConId] [ConAlt]
|
||||||
|
|
||||||
|
data ConAlt = ConAlt ConId [ConId]
|
||||||
|
|
||||||
|
data InfixAssoc = Assoc | AssocL | AssocR
|
||||||
|
|
||||||
|
data RlpExpr b = LetE [Bind b] (RlpExpr b)
|
||||||
|
| VarE VarId
|
||||||
|
| ConE ConId
|
||||||
|
| LamE [Pat b] (RlpExpr b)
|
||||||
|
| CaseE (RlpExpr b) [Alt b]
|
||||||
|
| IfE (RlpExpr b) (RlpExpr b) (RlpExpr b)
|
||||||
|
| AppE (RlpExpr b) (RlpExpr b)
|
||||||
|
| LitE (Lit b)
|
||||||
|
|
||||||
|
-- do we want guards?
|
||||||
|
data Alt b = AltA (Pat b) (RlpExpr b)
|
||||||
|
|
||||||
|
data Bind b = PatB (Pat b) (RlpExpr b)
|
||||||
|
| FunB VarId [Pat b] (RlpExpr b)
|
||||||
|
|
||||||
|
data VarId = NameVar Text
|
||||||
|
| SymVar Text
|
||||||
|
|
||||||
|
data ConId = NameCon Text
|
||||||
|
| SymCon Text
|
||||||
|
|
||||||
|
data Pat b = VarP VarId
|
||||||
|
| LitP (Lit b)
|
||||||
|
| ConP ConId [Pat b]
|
||||||
|
|
||||||
|
data Lit b = IntL Int
|
||||||
|
| CharL Char
|
||||||
|
| ListL [RlpExpr b]
|
||||||
|
|
||||||
|
-- instance HasLHS Alt Alt Pat Pat where
|
||||||
|
-- _lhs = lens
|
||||||
|
-- (\ (AltA p _) -> p)
|
||||||
|
-- (\ (AltA _ e) p' -> AltA p' e)
|
||||||
|
|
||||||
|
-- instance HasRHS Alt Alt RlpExpr RlpExpr where
|
||||||
|
-- _rhs = lens
|
||||||
|
-- (\ (AltA _ e) -> e)
|
||||||
|
-- (\ (AltA p _) e' -> AltA p e')
|
||||||
349
src/Rlp/Lex.x
349
src/Rlp/Lex.x
@@ -1,349 +0,0 @@
|
|||||||
{
|
|
||||||
{-# LANGUAGE ViewPatterns, LambdaCase #-}
|
|
||||||
{-# LANGUAGE GeneralisedNewtypeDeriving #-}
|
|
||||||
{-# LANGUAGE OverloadedStrings #-}
|
|
||||||
module Rlp.Lex
|
|
||||||
( P(..)
|
|
||||||
, RlpToken(..)
|
|
||||||
, Located(..)
|
|
||||||
, lexToken
|
|
||||||
, lexStream
|
|
||||||
, lexDebug
|
|
||||||
, lexCont
|
|
||||||
)
|
|
||||||
where
|
|
||||||
import Codec.Binary.UTF8.String (encodeChar)
|
|
||||||
import Control.Monad
|
|
||||||
import Control.Monad.Errorful
|
|
||||||
import Core.Syntax (Name)
|
|
||||||
import Data.Functor.Identity
|
|
||||||
import Data.Char (digitToInt)
|
|
||||||
import Data.Monoid (First)
|
|
||||||
import Data.Maybe
|
|
||||||
import Data.Text (Text)
|
|
||||||
import Data.Text qualified as T
|
|
||||||
import Data.Word
|
|
||||||
import Data.Default
|
|
||||||
import Lens.Micro.Mtl
|
|
||||||
import Lens.Micro
|
|
||||||
|
|
||||||
import Debug.Trace
|
|
||||||
import Rlp.Parse.Types
|
|
||||||
}
|
|
||||||
|
|
||||||
$whitechar = [ \t\n\r\f\v]
|
|
||||||
|
|
||||||
$nl = [\n\r]
|
|
||||||
$white_no_nl = $white # $nl
|
|
||||||
|
|
||||||
$lower = [a-z \_]
|
|
||||||
$upper = [A-Z]
|
|
||||||
$alpha = [$lower $upper]
|
|
||||||
$digit = 0-9
|
|
||||||
|
|
||||||
$special = [\(\)\,\;\[\]\{\}]
|
|
||||||
$namechar = [$alpha $digit \' \#]
|
|
||||||
$asciisym = [\!\#\$\%\&\*\+\.\/\<\=\>\?\@\\\^\|\-\~\:]
|
|
||||||
|
|
||||||
@decimal = $digit+
|
|
||||||
|
|
||||||
@varname = $lower $namechar*
|
|
||||||
@conname = $upper $namechar*
|
|
||||||
@consym = \: $asciisym*
|
|
||||||
@varsym = $asciisym+
|
|
||||||
|
|
||||||
@reservedname =
|
|
||||||
case|data|do|import|in|let|letrec|module|of|where
|
|
||||||
|infixr|infixl|infix
|
|
||||||
|
|
||||||
@reservedop =
|
|
||||||
"=" | \\ | "->" | "|"
|
|
||||||
|
|
||||||
rlp :-
|
|
||||||
|
|
||||||
-- everywhere: skip whitespace
|
|
||||||
$white_no_nl+ ;
|
|
||||||
|
|
||||||
-- everywhere: skip comments
|
|
||||||
-- TODO: don't treat operators like (-->) as comments
|
|
||||||
"--".* ;
|
|
||||||
|
|
||||||
-- we are indentation-sensitive! do not skip NLs!. upon encountering a newline,
|
|
||||||
-- we check indentation and potentially insert extra tokens. search this file
|
|
||||||
-- for the definition of `doBol`
|
|
||||||
<0> \n { beginPush bol }
|
|
||||||
|
|
||||||
-- scan various identifiers and reserved words. order is important here!
|
|
||||||
<0>
|
|
||||||
{
|
|
||||||
@reservedname { tokenWith lexReservedName }
|
|
||||||
@conname { tokenWith TokenConName }
|
|
||||||
@varname { tokenWith TokenVarName }
|
|
||||||
@reservedop { tokenWith lexReservedOp }
|
|
||||||
@consym { tokenWith TokenConSym }
|
|
||||||
@varsym { tokenWith TokenVarSym }
|
|
||||||
}
|
|
||||||
|
|
||||||
-- literals -- currently this is just unsigned integer literals
|
|
||||||
<0>
|
|
||||||
{
|
|
||||||
@decimal { tokenWith (TokenLitInt . readInt) }
|
|
||||||
}
|
|
||||||
|
|
||||||
-- control characters
|
|
||||||
<0>
|
|
||||||
{
|
|
||||||
"(" { constToken TokenLParen }
|
|
||||||
")" { constToken TokenRParen }
|
|
||||||
"{" { explicitLBrace }
|
|
||||||
"}" { explicitRBrace }
|
|
||||||
";" { constToken TokenSemicolon }
|
|
||||||
}
|
|
||||||
|
|
||||||
-- consume all whitespace leaving us at the beginning of the next non-empty
|
|
||||||
-- line. we then compare the indentation of that line to the enclosing layout
|
|
||||||
-- context and proceed accordingly
|
|
||||||
<bol>
|
|
||||||
{
|
|
||||||
$whitechar ;
|
|
||||||
\n ;
|
|
||||||
() { doBol }
|
|
||||||
}
|
|
||||||
|
|
||||||
<layout_top>
|
|
||||||
{
|
|
||||||
\n ;
|
|
||||||
"{" { explicitLBrace `thenDo` popLexState }
|
|
||||||
() { doLayout }
|
|
||||||
}
|
|
||||||
|
|
||||||
{
|
|
||||||
|
|
||||||
lexReservedName :: Text -> RlpToken
|
|
||||||
lexReservedName = \case
|
|
||||||
"data" -> TokenData
|
|
||||||
"case" -> TokenCase
|
|
||||||
"of" -> TokenOf
|
|
||||||
"let" -> TokenLet
|
|
||||||
"in" -> TokenIn
|
|
||||||
"infix" -> TokenInfix
|
|
||||||
"infixl" -> TokenInfixL
|
|
||||||
"infixr" -> TokenInfixR
|
|
||||||
|
|
||||||
lexReservedOp :: Text -> RlpToken
|
|
||||||
lexReservedOp = \case
|
|
||||||
"=" -> TokenEquals
|
|
||||||
"::" -> TokenHasType
|
|
||||||
"|" -> TokenPipe
|
|
||||||
|
|
||||||
-- | @andBegin@, with the subtle difference that the start code is set
|
|
||||||
-- /after/ the action
|
|
||||||
thenBegin :: LexerAction a -> Int -> LexerAction a
|
|
||||||
thenBegin act c inp l = do
|
|
||||||
a <- act inp l
|
|
||||||
psLexState . _head .= c
|
|
||||||
pure a
|
|
||||||
|
|
||||||
andBegin :: LexerAction a -> Int -> LexerAction a
|
|
||||||
andBegin act c inp l = do
|
|
||||||
psLexState . _head .= c
|
|
||||||
act inp l
|
|
||||||
|
|
||||||
beginPush :: Int -> LexerAction (Located RlpToken)
|
|
||||||
beginPush n _ _ = pushLexState n >> lexToken
|
|
||||||
|
|
||||||
alexGetByte :: AlexInput -> Maybe (Word8, AlexInput)
|
|
||||||
alexGetByte inp = case inp ^. aiBytes of
|
|
||||||
[] -> do
|
|
||||||
(c,t) <- T.uncons (inp ^. aiSource)
|
|
||||||
let (b:bs) = encodeChar c
|
|
||||||
-- tail the source
|
|
||||||
inp' = inp & aiSource .~ t
|
|
||||||
-- record the excess bytes for successive calls
|
|
||||||
& aiBytes .~ bs
|
|
||||||
-- report the previous char
|
|
||||||
& aiPrevChar .~ c
|
|
||||||
-- update the position
|
|
||||||
& aiPos %~ \ (ln,col) ->
|
|
||||||
if c == '\n'
|
|
||||||
then (ln+1,1)
|
|
||||||
else (ln,col+1)
|
|
||||||
pure (b, inp')
|
|
||||||
|
|
||||||
_ -> Just (head bs, inp')
|
|
||||||
where
|
|
||||||
(bs, inp') = inp & aiBytes <<%~ drop 1
|
|
||||||
|
|
||||||
getInput :: P AlexInput
|
|
||||||
getInput = use psInput
|
|
||||||
|
|
||||||
getLexState :: P Int
|
|
||||||
getLexState = use (psLexState . singular _head)
|
|
||||||
|
|
||||||
alexInputPrevChar :: AlexInput -> Char
|
|
||||||
alexInputPrevChar = view aiPrevChar
|
|
||||||
|
|
||||||
pushLexState :: Int -> P ()
|
|
||||||
pushLexState n = psLexState %= (n:)
|
|
||||||
|
|
||||||
readInt :: Text -> Int
|
|
||||||
readInt = T.foldr f 0 where
|
|
||||||
f c n = digitToInt c + 10*n
|
|
||||||
|
|
||||||
constToken :: RlpToken -> LexerAction (Located RlpToken)
|
|
||||||
constToken t inp l = do
|
|
||||||
pos <- use (psInput . aiPos)
|
|
||||||
pure (Located (pos,l) t)
|
|
||||||
|
|
||||||
tokenWith :: (Text -> RlpToken) -> LexerAction (Located RlpToken)
|
|
||||||
tokenWith tf inp l = do
|
|
||||||
pos <- getPos
|
|
||||||
let t = tf (T.take l $ inp ^. aiSource)
|
|
||||||
pure (Located (pos,l) t)
|
|
||||||
|
|
||||||
getPos :: P Position
|
|
||||||
getPos = use (psInput . aiPos)
|
|
||||||
|
|
||||||
alexEOF :: P (Located RlpToken)
|
|
||||||
alexEOF = do
|
|
||||||
inp <- getInput
|
|
||||||
pure (Located undefined TokenEOF)
|
|
||||||
|
|
||||||
initParseState :: Text -> ParseState
|
|
||||||
initParseState s = ParseState
|
|
||||||
{ _psLayoutStack = []
|
|
||||||
-- IMPORTANT: the initial state is `bol` to begin the top-level layout,
|
|
||||||
-- which then returns to state 0 which continues the normal lexing process.
|
|
||||||
, _psLexState = [layout_top,0]
|
|
||||||
, _psInput = initAlexInput s
|
|
||||||
, _psOpTable = mempty
|
|
||||||
}
|
|
||||||
|
|
||||||
initAlexInput :: Text -> AlexInput
|
|
||||||
initAlexInput s = AlexInput
|
|
||||||
{ _aiPrevChar = '\0'
|
|
||||||
, _aiSource = s
|
|
||||||
, _aiBytes = []
|
|
||||||
, _aiPos = (1,1)
|
|
||||||
}
|
|
||||||
|
|
||||||
runP' :: P a -> Text -> (ParseState, [MsgEnvelope RlpParseError], Maybe a)
|
|
||||||
runP' p s = runP p st where
|
|
||||||
st = initParseState s
|
|
||||||
|
|
||||||
lexToken :: P (Located RlpToken)
|
|
||||||
lexToken = do
|
|
||||||
inp <- getInput
|
|
||||||
c <- getLexState
|
|
||||||
st <- use id
|
|
||||||
-- traceM $ "st: " <> show st
|
|
||||||
case alexScan inp c of
|
|
||||||
AlexEOF -> pure $ Located (inp ^. aiPos, 0) TokenEOF
|
|
||||||
AlexSkip inp' l -> do
|
|
||||||
psInput .= inp'
|
|
||||||
lexToken
|
|
||||||
AlexToken inp' l act -> do
|
|
||||||
psInput .= inp'
|
|
||||||
act inp l
|
|
||||||
AlexError inp' -> addFatalHere 1 RlpParErrLexical
|
|
||||||
|
|
||||||
lexCont :: (Located RlpToken -> P a) -> P a
|
|
||||||
lexCont = (lexToken >>=)
|
|
||||||
|
|
||||||
lexStream :: P [RlpToken]
|
|
||||||
lexStream = do
|
|
||||||
t <- lexToken
|
|
||||||
case t of
|
|
||||||
Located _ TokenEOF -> pure [TokenEOF]
|
|
||||||
Located _ t -> (t:) <$> lexStream
|
|
||||||
|
|
||||||
lexDebug :: (Located RlpToken -> P a) -> P a
|
|
||||||
lexDebug k = do
|
|
||||||
t <- lexToken
|
|
||||||
traceM $ "token: " <> show t
|
|
||||||
k t
|
|
||||||
|
|
||||||
lexTest :: Text -> Maybe [RlpToken]
|
|
||||||
lexTest s = runP' lexStream s ^. _3
|
|
||||||
|
|
||||||
indentLevel :: P Int
|
|
||||||
indentLevel = do
|
|
||||||
pos <- use (psInput . aiPos)
|
|
||||||
pure (pos ^. _2)
|
|
||||||
|
|
||||||
insertToken :: RlpToken -> P (Located RlpToken)
|
|
||||||
insertToken t = do
|
|
||||||
pos <- use (psInput . aiPos)
|
|
||||||
pure (Located (pos, 0) t)
|
|
||||||
|
|
||||||
popLayout :: P Layout
|
|
||||||
popLayout = do
|
|
||||||
-- traceM "pop layout"
|
|
||||||
ctx <- preuse (psLayoutStack . _head)
|
|
||||||
psLayoutStack %= (drop 1)
|
|
||||||
case ctx of
|
|
||||||
Just l -> pure l
|
|
||||||
Nothing -> error "uhh"
|
|
||||||
|
|
||||||
pushLayout :: Layout -> P ()
|
|
||||||
pushLayout l = do
|
|
||||||
-- traceM "push layout"
|
|
||||||
psLayoutStack %= (l:)
|
|
||||||
|
|
||||||
popLexState :: P ()
|
|
||||||
popLexState = do
|
|
||||||
psLexState %= tail
|
|
||||||
|
|
||||||
insertSemicolon, insertLBrace, insertRBrace :: P (Located RlpToken)
|
|
||||||
insertSemicolon = {- traceM "inserting semi" >> -} insertToken TokenSemicolonV
|
|
||||||
insertLBrace = {- traceM "inserting lbrace" >> -} insertToken TokenLBraceV
|
|
||||||
insertRBrace = {- traceM "inserting rbrace" >> -} insertToken TokenRBraceV
|
|
||||||
|
|
||||||
cmpLayout :: P Ordering
|
|
||||||
cmpLayout = do
|
|
||||||
i <- indentLevel
|
|
||||||
ctx <- preuse (psLayoutStack . _head)
|
|
||||||
case ctx of
|
|
||||||
Just (Implicit n) -> pure (i `compare` n)
|
|
||||||
_ -> pure GT
|
|
||||||
|
|
||||||
doBol :: LexerAction (Located RlpToken)
|
|
||||||
doBol inp l = do
|
|
||||||
off <- cmpLayout
|
|
||||||
i <- indentLevel
|
|
||||||
traceM $ "i: " <> show i
|
|
||||||
-- important that we pop the lex state lest we find our lexer diverging
|
|
||||||
popLexState
|
|
||||||
case off of
|
|
||||||
-- the line is aligned with the previous. it therefore belongs to the
|
|
||||||
-- same list
|
|
||||||
EQ -> insertSemicolon
|
|
||||||
-- the line is indented further than the previous, so we assume it is a
|
|
||||||
-- line continuation. ignore it and move on!
|
|
||||||
GT -> lexToken
|
|
||||||
-- the line is indented less than the previous, pop the layout stack and
|
|
||||||
-- insert a closing brace.
|
|
||||||
LT -> popLayout >> insertRBrace
|
|
||||||
|
|
||||||
thenDo :: LexerAction a -> P b -> LexerAction a
|
|
||||||
thenDo act p inp l = act inp l <* p
|
|
||||||
|
|
||||||
explicitLBrace :: LexerAction (Located RlpToken)
|
|
||||||
explicitLBrace inp l = do
|
|
||||||
pushLayout Explicit
|
|
||||||
constToken TokenLBrace inp l
|
|
||||||
|
|
||||||
explicitRBrace :: LexerAction (Located RlpToken)
|
|
||||||
explicitRBrace inp l = do
|
|
||||||
popLayout
|
|
||||||
constToken TokenRBrace inp l
|
|
||||||
|
|
||||||
doLayout :: LexerAction (Located RlpToken)
|
|
||||||
doLayout _ _ = do
|
|
||||||
i <- indentLevel
|
|
||||||
pushLayout (Implicit i)
|
|
||||||
popLexState
|
|
||||||
insertLBrace
|
|
||||||
|
|
||||||
}
|
|
||||||
|
|
||||||
181
src/Rlp/Parse.y
181
src/Rlp/Parse.y
@@ -1,181 +0,0 @@
|
|||||||
{
|
|
||||||
{-# LANGUAGE LambdaCase #-}
|
|
||||||
module Rlp.Parse
|
|
||||||
( parseRlpProg
|
|
||||||
)
|
|
||||||
where
|
|
||||||
import Compiler.RlpcError
|
|
||||||
import Rlp.Lex
|
|
||||||
import Rlp.Syntax
|
|
||||||
import Rlp.Parse.Types
|
|
||||||
import Rlp.Parse.Associate
|
|
||||||
import Lens.Micro
|
|
||||||
import Lens.Micro.Mtl
|
|
||||||
import Lens.Micro.Platform ()
|
|
||||||
import Data.List.Extra
|
|
||||||
import Data.Fix
|
|
||||||
import Data.Functor.Const
|
|
||||||
import Data.Text qualified as T
|
|
||||||
}
|
|
||||||
|
|
||||||
%name parseRlpProg StandaloneProgram
|
|
||||||
|
|
||||||
%monad { P }
|
|
||||||
%lexer { lexCont } { Located _ TokenEOF }
|
|
||||||
%error { parseError }
|
|
||||||
%tokentype { Located RlpToken }
|
|
||||||
|
|
||||||
%token
|
|
||||||
varname { Located _ (TokenVarName $$) }
|
|
||||||
conname { Located _ (TokenConName $$) }
|
|
||||||
consym { Located _ (TokenConSym $$) }
|
|
||||||
varsym { Located _ (TokenVarSym $$) }
|
|
||||||
data { Located _ TokenData }
|
|
||||||
litint { Located _ (TokenLitInt $$) }
|
|
||||||
'=' { Located _ TokenEquals }
|
|
||||||
'|' { Located _ TokenPipe }
|
|
||||||
';' { Located _ TokenSemicolon }
|
|
||||||
'(' { Located _ TokenLParen }
|
|
||||||
')' { Located _ TokenRParen }
|
|
||||||
'->' { Located _ TokenArrow }
|
|
||||||
vsemi { Located _ TokenSemicolonV }
|
|
||||||
'{' { Located _ TokenLBrace }
|
|
||||||
'}' { Located _ TokenRBrace }
|
|
||||||
vlbrace { Located _ TokenLBraceV }
|
|
||||||
vrbrace { Located _ TokenRBraceV }
|
|
||||||
infixl { Located _ TokenInfixL }
|
|
||||||
infixr { Located _ TokenInfixR }
|
|
||||||
infix { Located _ TokenInfix }
|
|
||||||
|
|
||||||
%right '->'
|
|
||||||
|
|
||||||
%%
|
|
||||||
|
|
||||||
StandaloneProgram :: { RlpProgram' }
|
|
||||||
StandaloneProgram : '{' Decls '}' {% mkProgram $2 }
|
|
||||||
| VL DeclsV VR {% mkProgram $2 }
|
|
||||||
|
|
||||||
VL :: { () }
|
|
||||||
VL : vlbrace { () }
|
|
||||||
|
|
||||||
VR :: { () }
|
|
||||||
VR : vrbrace { () }
|
|
||||||
| error { () }
|
|
||||||
|
|
||||||
Decls :: { [PartialDecl'] }
|
|
||||||
Decls : Decl ';' Decls { $1 : $3 }
|
|
||||||
| Decl ';' { [$1] }
|
|
||||||
| Decl { [$1] }
|
|
||||||
|
|
||||||
DeclsV :: { [PartialDecl'] }
|
|
||||||
DeclsV : Decl VS Decls { $1 : $3 }
|
|
||||||
| Decl VS { [$1] }
|
|
||||||
| Decl { [$1] }
|
|
||||||
|
|
||||||
VS :: { Located RlpToken }
|
|
||||||
VS : ';' { $1 }
|
|
||||||
| vsemi { $1 }
|
|
||||||
|
|
||||||
Decl :: { PartialDecl' }
|
|
||||||
: FunDecl { $1 }
|
|
||||||
| DataDecl { $1 }
|
|
||||||
| InfixDecl { $1 }
|
|
||||||
|
|
||||||
InfixDecl :: { PartialDecl' }
|
|
||||||
: InfixWord litint InfixOp {% mkInfixD $1 $2 $3 }
|
|
||||||
|
|
||||||
InfixWord :: { Assoc }
|
|
||||||
: infixl { InfixL }
|
|
||||||
| infixr { InfixR }
|
|
||||||
| infix { Infix }
|
|
||||||
|
|
||||||
DataDecl :: { PartialDecl' }
|
|
||||||
: data Con TyParams '=' DataCons { DataD $2 $3 $5 }
|
|
||||||
|
|
||||||
TyParams :: { [Name] }
|
|
||||||
: {- epsilon -} { [] }
|
|
||||||
| TyParams varname { $1 `snoc` $2 }
|
|
||||||
|
|
||||||
DataCons :: { [ConAlt] }
|
|
||||||
: DataCons '|' DataCon { $1 `snoc` $3 }
|
|
||||||
| DataCon { [$1] }
|
|
||||||
|
|
||||||
DataCon :: { ConAlt }
|
|
||||||
: Con Type1s { ConAlt $1 $2 }
|
|
||||||
|
|
||||||
Type1s :: { [Type] }
|
|
||||||
: {- epsilon -} { [] }
|
|
||||||
| Type1s Type1 { $1 `snoc` $2 }
|
|
||||||
|
|
||||||
Type1 :: { Type }
|
|
||||||
: '(' Type ')' { $2 }
|
|
||||||
| conname { TyCon $1 }
|
|
||||||
| varname { TyVar $1 }
|
|
||||||
|
|
||||||
Type :: { Type }
|
|
||||||
: Type '->' Type { $1 :-> $3 }
|
|
||||||
| Type1 { $1 }
|
|
||||||
|
|
||||||
FunDecl :: { PartialDecl' }
|
|
||||||
FunDecl : Var Params '=' Expr { FunD $1 $2 (Const $4) Nothing }
|
|
||||||
|
|
||||||
Params :: { [Pat'] }
|
|
||||||
Params : {- epsilon -} { [] }
|
|
||||||
| Params Pat1 { $1 `snoc` $2 }
|
|
||||||
|
|
||||||
Pat1 :: { Pat' }
|
|
||||||
: Var { VarP $1 }
|
|
||||||
| Lit { LitP $1 }
|
|
||||||
|
|
||||||
Expr :: { PartialExpr' }
|
|
||||||
: Expr1 varsym Expr { Fix $ B $2 (unFix $1) (unFix $3) }
|
|
||||||
| Expr1 { $1 }
|
|
||||||
|
|
||||||
Expr1 :: { PartialExpr' }
|
|
||||||
: '(' Expr ')' { wrapFix . Par . unwrapFix $ $2 }
|
|
||||||
| Lit { Fix . E $ LitEF $1 }
|
|
||||||
| Var { Fix . E $ VarEF $1 }
|
|
||||||
|
|
||||||
-- TODO: happy prefers left-associativity. doing such would require adjusting
|
|
||||||
-- the code in Rlp.Parse.Associate to expect left-associative input rather than
|
|
||||||
-- right.
|
|
||||||
InfixExpr :: { PartialExpr' }
|
|
||||||
: Expr1 varsym Expr { Fix $ B $2 (unFix $1) (unFix $3) }
|
|
||||||
|
|
||||||
InfixOp :: { Name }
|
|
||||||
: consym { $1 }
|
|
||||||
| varsym { $1 }
|
|
||||||
|
|
||||||
Lit :: { Lit' }
|
|
||||||
Lit : litint { IntL $1 }
|
|
||||||
|
|
||||||
Var :: { VarId }
|
|
||||||
Var : varname { NameVar $1 }
|
|
||||||
|
|
||||||
Con :: { ConId }
|
|
||||||
: conname { NameCon $1 }
|
|
||||||
|
|
||||||
{
|
|
||||||
|
|
||||||
mkProgram :: [PartialDecl'] -> P RlpProgram'
|
|
||||||
mkProgram ds = do
|
|
||||||
pt <- use psOpTable
|
|
||||||
pure $ RlpProgram (associate pt <$> ds)
|
|
||||||
|
|
||||||
parseError :: Located RlpToken -> P a
|
|
||||||
parseError (Located ((l,c),s) t) = addFatal $
|
|
||||||
errorMsg (SrcSpan l c s) RlpParErrUnexpectedToken
|
|
||||||
|
|
||||||
mkInfixD :: Assoc -> Int -> Name -> P PartialDecl'
|
|
||||||
mkInfixD a p n = do
|
|
||||||
let opl :: Lens' ParseState (Maybe OpInfo)
|
|
||||||
opl = psOpTable . at n
|
|
||||||
opl <~ (use opl >>= \case
|
|
||||||
Just o -> addWoundHere l e >> pure (Just o) where
|
|
||||||
e = RlpParErrDuplicateInfixD n
|
|
||||||
l = T.length n
|
|
||||||
Nothing -> pure (Just (a,p))
|
|
||||||
)
|
|
||||||
pure $ InfixD a p n
|
|
||||||
|
|
||||||
}
|
|
||||||
@@ -1,100 +0,0 @@
|
|||||||
{-# LANGUAGE OverloadedStrings #-}
|
|
||||||
{-# LANGUAGE PatternSynonyms, ViewPatterns, ImplicitParams #-}
|
|
||||||
module Rlp.Parse.Associate
|
|
||||||
( associate
|
|
||||||
)
|
|
||||||
where
|
|
||||||
--------------------------------------------------------------------------------
|
|
||||||
import Data.HashMap.Strict qualified as H
|
|
||||||
import Data.Functor.Foldable
|
|
||||||
import Data.Functor.Const
|
|
||||||
import Lens.Micro
|
|
||||||
import Rlp.Parse.Types
|
|
||||||
import Rlp.Syntax
|
|
||||||
--------------------------------------------------------------------------------
|
|
||||||
|
|
||||||
associate :: OpTable -> PartialDecl' -> Decl' RlpExpr
|
|
||||||
associate pt (FunD n as b w) = FunD n as b' w
|
|
||||||
where b' = let ?pt = pt in completeExpr (getConst b)
|
|
||||||
associate pt (TySigD ns t) = TySigD ns t
|
|
||||||
associate pt (DataD n as cs) = DataD n as cs
|
|
||||||
associate pt (InfixD a p n) = InfixD a p n
|
|
||||||
|
|
||||||
completeExpr :: (?pt :: OpTable) => PartialExpr' -> RlpExpr'
|
|
||||||
completeExpr = cata completePartial
|
|
||||||
|
|
||||||
completePartial :: (?pt :: OpTable) => PartialE -> RlpExpr'
|
|
||||||
completePartial (E e) = completeRlpExpr e
|
|
||||||
completePartial p@(B o l r) = completeB (build p)
|
|
||||||
completePartial (Par e) = completePartial e
|
|
||||||
|
|
||||||
completeRlpExpr :: (?pt :: OpTable) => RlpExprF' RlpExpr' -> RlpExpr'
|
|
||||||
completeRlpExpr = embed
|
|
||||||
|
|
||||||
completeB :: (?pt :: OpTable) => PartialE -> RlpExpr'
|
|
||||||
completeB p = case build p of
|
|
||||||
B o l r -> (o' `AppE` l') `AppE` r'
|
|
||||||
where
|
|
||||||
-- TODO: how do we know it's symbolic?
|
|
||||||
o' = VarE (SymVar o)
|
|
||||||
l' = completeB l
|
|
||||||
r' = completeB r
|
|
||||||
Par e -> completeB e
|
|
||||||
E e -> completeRlpExpr e
|
|
||||||
|
|
||||||
build :: (?pt :: OpTable) => PartialE -> PartialE
|
|
||||||
build e = go id e (rightmost e) where
|
|
||||||
rightmost :: PartialE -> PartialE
|
|
||||||
rightmost (B _ _ r) = rightmost r
|
|
||||||
rightmost p@(E _) = p
|
|
||||||
rightmost p@(Par _) = p
|
|
||||||
|
|
||||||
go :: (?pt :: OpTable)
|
|
||||||
=> (PartialE -> PartialE)
|
|
||||||
-> PartialE -> PartialE -> PartialE
|
|
||||||
go f p@(WithInfo o _ r) = case r of
|
|
||||||
E _ -> mkHole o (f . f')
|
|
||||||
Par _ -> mkHole o (f . f')
|
|
||||||
B _ _ _ -> go (mkHole o (f . f')) r
|
|
||||||
where f' r' = p & pR .~ r'
|
|
||||||
go f _ = id
|
|
||||||
|
|
||||||
mkHole :: (?pt :: OpTable)
|
|
||||||
=> OpInfo
|
|
||||||
-> (PartialE -> PartialE)
|
|
||||||
-> PartialE
|
|
||||||
-> PartialE
|
|
||||||
mkHole _ hole p@(Par _) = hole p
|
|
||||||
mkHole _ hole p@(E _) = hole p
|
|
||||||
mkHole (a,d) hole p@(WithInfo (a',d') _ _)
|
|
||||||
| d' < d = above
|
|
||||||
| d' > d = below
|
|
||||||
| d == d' = case (a,a') of
|
|
||||||
-- left-associative operators of equal precedence are
|
|
||||||
-- associated left
|
|
||||||
(InfixL,InfixL) -> above
|
|
||||||
-- right-associative operators are handled similarly
|
|
||||||
(InfixR,InfixR) -> below
|
|
||||||
-- non-associative operators of equal precedence, or equal
|
|
||||||
-- precedence operators of different associativities are
|
|
||||||
-- invalid
|
|
||||||
(_, _) -> error "invalid expression"
|
|
||||||
where
|
|
||||||
above = p & pL %~ hole
|
|
||||||
below = hole p
|
|
||||||
|
|
||||||
examplePrecTable :: OpTable
|
|
||||||
examplePrecTable = H.fromList
|
|
||||||
[ ("+", (InfixL,6))
|
|
||||||
, ("*", (InfixL,7))
|
|
||||||
, ("^", (InfixR,8))
|
|
||||||
, (".", (InfixR,7))
|
|
||||||
, ("~", (Infix, 9))
|
|
||||||
, ("=", (Infix, 4))
|
|
||||||
, ("&&", (Infix, 3))
|
|
||||||
, ("||", (Infix, 2))
|
|
||||||
, ("$", (InfixR,0))
|
|
||||||
, ("&", (InfixL,0))
|
|
||||||
]
|
|
||||||
|
|
||||||
|
|
||||||
@@ -1,242 +0,0 @@
|
|||||||
{-# LANGUAGE TemplateHaskell #-}
|
|
||||||
{-# LANGUAGE ImplicitParams, ViewPatterns, PatternSynonyms #-}
|
|
||||||
{-# LANGUAGE LambdaCase #-}
|
|
||||||
module Rlp.Parse.Types
|
|
||||||
( LexerAction
|
|
||||||
, MsgEnvelope(..)
|
|
||||||
, RlpcError(..)
|
|
||||||
, AlexInput(..)
|
|
||||||
, Position(..)
|
|
||||||
, RlpToken(..)
|
|
||||||
, P(..)
|
|
||||||
, ParseState(..)
|
|
||||||
, psLayoutStack
|
|
||||||
, psLexState
|
|
||||||
, psInput
|
|
||||||
, psOpTable
|
|
||||||
, Layout(..)
|
|
||||||
, Located(..)
|
|
||||||
, OpTable
|
|
||||||
, OpInfo
|
|
||||||
, RlpParseError(..)
|
|
||||||
, PartialDecl'
|
|
||||||
, Partial(..)
|
|
||||||
, pL, pR
|
|
||||||
, PartialE
|
|
||||||
, pattern WithInfo
|
|
||||||
, opInfoOrDef
|
|
||||||
, PartialExpr'
|
|
||||||
, aiPrevChar
|
|
||||||
, aiSource
|
|
||||||
, aiBytes
|
|
||||||
, aiPos
|
|
||||||
, addFatal
|
|
||||||
, addWound
|
|
||||||
, addFatalHere
|
|
||||||
, addWoundHere
|
|
||||||
)
|
|
||||||
where
|
|
||||||
--------------------------------------------------------------------------------
|
|
||||||
import Core.Syntax (Name)
|
|
||||||
import Control.Monad
|
|
||||||
import Control.Monad.State.Strict
|
|
||||||
import Control.Monad.Errorful
|
|
||||||
import Compiler.RlpcError
|
|
||||||
import Data.Text (Text)
|
|
||||||
import Data.Maybe
|
|
||||||
import Data.Fix
|
|
||||||
import Data.Functor.Foldable
|
|
||||||
import Data.Functor.Const
|
|
||||||
import Data.Functor.Classes
|
|
||||||
import Data.HashMap.Strict qualified as H
|
|
||||||
import Data.Word (Word8)
|
|
||||||
import Lens.Micro.TH
|
|
||||||
import Lens.Micro
|
|
||||||
import Rlp.Syntax
|
|
||||||
--------------------------------------------------------------------------------
|
|
||||||
|
|
||||||
type LexerAction a = AlexInput -> Int -> P a
|
|
||||||
|
|
||||||
data AlexInput = AlexInput
|
|
||||||
{ _aiPrevChar :: Char
|
|
||||||
, _aiSource :: Text
|
|
||||||
, _aiBytes :: [Word8]
|
|
||||||
, _aiPos :: Position
|
|
||||||
}
|
|
||||||
deriving Show
|
|
||||||
|
|
||||||
type Position =
|
|
||||||
( Int -- line
|
|
||||||
, Int -- column
|
|
||||||
)
|
|
||||||
|
|
||||||
posLine :: Lens' Position Int
|
|
||||||
posLine = _1
|
|
||||||
|
|
||||||
posColumn :: Lens' Position Int
|
|
||||||
posColumn = _2
|
|
||||||
|
|
||||||
data RlpToken
|
|
||||||
-- literals
|
|
||||||
= TokenLitInt Int
|
|
||||||
-- identifiers
|
|
||||||
| TokenVarName Name
|
|
||||||
| TokenConName Name
|
|
||||||
| TokenVarSym Name
|
|
||||||
| TokenConSym Name
|
|
||||||
-- reserved words
|
|
||||||
| TokenData
|
|
||||||
| TokenCase
|
|
||||||
| TokenOf
|
|
||||||
| TokenLet
|
|
||||||
| TokenIn
|
|
||||||
| TokenInfixL
|
|
||||||
| TokenInfixR
|
|
||||||
| TokenInfix
|
|
||||||
-- reserved ops
|
|
||||||
| TokenArrow
|
|
||||||
| TokenPipe
|
|
||||||
| TokenHasType
|
|
||||||
| TokenLambda
|
|
||||||
| TokenEquals
|
|
||||||
-- control symbols
|
|
||||||
| TokenSemicolon
|
|
||||||
| TokenLBrace
|
|
||||||
| TokenRBrace
|
|
||||||
| TokenLParen
|
|
||||||
| TokenRParen
|
|
||||||
-- 'virtual' control symbols, inserted by the lexer without any correlation
|
|
||||||
-- to a specific symbol
|
|
||||||
| TokenSemicolonV
|
|
||||||
| TokenLBraceV
|
|
||||||
| TokenRBraceV
|
|
||||||
| TokenEOF
|
|
||||||
deriving (Show)
|
|
||||||
|
|
||||||
newtype P a = P {
|
|
||||||
runP :: ParseState
|
|
||||||
-> (ParseState, [MsgEnvelope RlpParseError], Maybe a)
|
|
||||||
}
|
|
||||||
deriving (Functor)
|
|
||||||
|
|
||||||
instance Applicative P where
|
|
||||||
pure a = P $ \st -> (st, [], pure a)
|
|
||||||
liftA2 = liftM2
|
|
||||||
|
|
||||||
instance Monad P where
|
|
||||||
p >>= k = P $ \st ->
|
|
||||||
let (st',es,ma) = runP p st
|
|
||||||
in case ma of
|
|
||||||
Just a -> runP (k a) st'
|
|
||||||
& _2 %~ (es<>)
|
|
||||||
Nothing -> (st',es,Nothing)
|
|
||||||
|
|
||||||
{-# INLINE (>>=) #-}
|
|
||||||
|
|
||||||
instance MonadState ParseState P where
|
|
||||||
state f = P $ \st ->
|
|
||||||
let (a,st') = f st
|
|
||||||
in (st', [], Just a)
|
|
||||||
|
|
||||||
instance MonadErrorful (MsgEnvelope RlpParseError) P where
|
|
||||||
addWound e = P $ \st -> (st, [e], Just ())
|
|
||||||
addFatal e = P $ \st -> (st, [e], Nothing)
|
|
||||||
|
|
||||||
data ParseState = ParseState
|
|
||||||
{ _psLayoutStack :: [Layout]
|
|
||||||
, _psLexState :: [Int]
|
|
||||||
, _psInput :: AlexInput
|
|
||||||
, _psOpTable :: OpTable
|
|
||||||
}
|
|
||||||
deriving Show
|
|
||||||
|
|
||||||
data Layout = Explicit
|
|
||||||
| Implicit Int
|
|
||||||
deriving (Show, Eq)
|
|
||||||
|
|
||||||
data Located a = Located (Position, Int) a
|
|
||||||
deriving (Show)
|
|
||||||
|
|
||||||
type OpTable = H.HashMap Name OpInfo
|
|
||||||
type OpInfo = (Assoc, Int)
|
|
||||||
|
|
||||||
-- data WithLocation a = WithLocation [String] a
|
|
||||||
|
|
||||||
data RlpParseError = RlpParErrOutOfBoundsPrecedence Int
|
|
||||||
| RlpParErrDuplicateInfixD Name
|
|
||||||
| RlpParErrLexical
|
|
||||||
| RlpParErrUnexpectedToken
|
|
||||||
deriving (Eq, Ord, Show)
|
|
||||||
|
|
||||||
instance IsRlpcError RlpParseError where
|
|
||||||
|
|
||||||
----------------------------------------------------------------------------------
|
|
||||||
-- absolute psycho shit (partial ASTs)
|
|
||||||
|
|
||||||
type PartialDecl' = Decl (Const PartialExpr') Name
|
|
||||||
|
|
||||||
data Partial a = E (RlpExprF Name a)
|
|
||||||
| B Name (Partial a) (Partial a)
|
|
||||||
| Par (Partial a)
|
|
||||||
deriving (Show, Functor)
|
|
||||||
|
|
||||||
pL :: Traversal' (Partial a) (Partial a)
|
|
||||||
pL k (B o l r) = (\l' -> B o l' r) <$> k l
|
|
||||||
pL _ x = pure x
|
|
||||||
|
|
||||||
pR :: Traversal' (Partial a) (Partial a)
|
|
||||||
pR k (B o l r) = (\r' -> B o l r') <$> k r
|
|
||||||
pR _ x = pure x
|
|
||||||
|
|
||||||
type PartialE = Partial RlpExpr'
|
|
||||||
|
|
||||||
-- i love you haskell
|
|
||||||
pattern WithInfo :: (?pt :: OpTable) => OpInfo -> PartialE -> PartialE -> PartialE
|
|
||||||
pattern WithInfo p l r <- B (opInfoOrDef -> p) l r
|
|
||||||
|
|
||||||
opInfoOrDef :: (?pt :: OpTable) => Name -> OpInfo
|
|
||||||
opInfoOrDef c = fromMaybe (InfixL,9) $ H.lookup c ?pt
|
|
||||||
|
|
||||||
-- required to satisfy constraint on Fix's show instance
|
|
||||||
instance Show1 Partial where
|
|
||||||
liftShowsPrec :: forall a. (Int -> a -> ShowS)
|
|
||||||
-> ([a] -> ShowS)
|
|
||||||
-> Int -> Partial a -> ShowS
|
|
||||||
|
|
||||||
liftShowsPrec sp sl p m = case m of
|
|
||||||
(E e) -> showsUnaryWith lshow "E" p e
|
|
||||||
(B f a b) -> showsTernaryWith showsPrec lshow lshow "B" p f a b
|
|
||||||
(Par e) -> showsUnaryWith lshow "Par" p e
|
|
||||||
where
|
|
||||||
lshow :: forall f. (Show1 f) => Int -> f a -> ShowS
|
|
||||||
lshow = liftShowsPrec sp sl
|
|
||||||
|
|
||||||
type PartialExpr' = Fix Partial
|
|
||||||
|
|
||||||
makeLenses ''AlexInput
|
|
||||||
makeLenses ''ParseState
|
|
||||||
|
|
||||||
addWoundHere :: Int -> RlpParseError -> P ()
|
|
||||||
addWoundHere l e = P $ \st ->
|
|
||||||
let e' = MsgEnvelope
|
|
||||||
{ _msgSpan = let pos = psInput . aiPos
|
|
||||||
in SrcSpan (st ^. pos . posLine)
|
|
||||||
(st ^. pos . posColumn)
|
|
||||||
l
|
|
||||||
, _msgDiagnostic = e
|
|
||||||
, _msgSeverity = SevError
|
|
||||||
}
|
|
||||||
in (st, [e'], Just ())
|
|
||||||
|
|
||||||
addFatalHere :: Int -> RlpParseError -> P a
|
|
||||||
addFatalHere l e = P $ \st ->
|
|
||||||
let e' = MsgEnvelope
|
|
||||||
{ _msgSpan = let pos = psInput . aiPos
|
|
||||||
in SrcSpan (st ^. pos . posLine)
|
|
||||||
(st ^. pos . posColumn)
|
|
||||||
l
|
|
||||||
, _msgDiagnostic = e
|
|
||||||
, _msgSeverity = SevError
|
|
||||||
}
|
|
||||||
in (st, [e'], Nothing)
|
|
||||||
|
|
||||||
@@ -1,177 +0,0 @@
|
|||||||
-- recursion-schemes
|
|
||||||
{-# LANGUAGE DeriveFunctor, DeriveFoldable, DeriveTraversable #-}
|
|
||||||
-- recursion-schemes
|
|
||||||
{-# LANGUAGE TemplateHaskell, TypeFamilies #-}
|
|
||||||
{-# LANGUAGE OverloadedStrings, PatternSynonyms #-}
|
|
||||||
module Rlp.Syntax
|
|
||||||
( RlpModule(..)
|
|
||||||
, RlpProgram(..)
|
|
||||||
, RlpProgram'
|
|
||||||
, rlpmodName
|
|
||||||
, rlpmodProgram
|
|
||||||
, RlpExpr(..)
|
|
||||||
, RlpExpr'
|
|
||||||
, RlpExprF(..)
|
|
||||||
, RlpExprF'
|
|
||||||
, Decl(..)
|
|
||||||
, Decl'
|
|
||||||
, Bind(..)
|
|
||||||
, Where
|
|
||||||
, Where'
|
|
||||||
, ConAlt(..)
|
|
||||||
, Type(..)
|
|
||||||
, pattern (:->)
|
|
||||||
, Assoc(..)
|
|
||||||
, VarId(..)
|
|
||||||
, ConId(..)
|
|
||||||
, Pat(..)
|
|
||||||
, Pat'
|
|
||||||
, Lit(..)
|
|
||||||
, Lit'
|
|
||||||
, Name
|
|
||||||
|
|
||||||
-- TODO: ugh move this somewhere else later
|
|
||||||
, showsTernaryWith
|
|
||||||
|
|
||||||
-- * Convenience re-exports
|
|
||||||
, Text
|
|
||||||
)
|
|
||||||
where
|
|
||||||
----------------------------------------------------------------------------------
|
|
||||||
import Data.Text (Text)
|
|
||||||
import Data.Text qualified as T
|
|
||||||
import Data.String (IsString(..))
|
|
||||||
import Data.Functor.Foldable.TH (makeBaseFunctor)
|
|
||||||
import Data.Functor.Classes
|
|
||||||
import Lens.Micro
|
|
||||||
import Lens.Micro.TH
|
|
||||||
import Core.Syntax hiding (Lit)
|
|
||||||
import Core (HasRHS(..), HasLHS(..))
|
|
||||||
----------------------------------------------------------------------------------
|
|
||||||
|
|
||||||
data RlpModule b = RlpModule
|
|
||||||
{ _rlpmodName :: Text
|
|
||||||
, _rlpmodProgram :: RlpProgram b
|
|
||||||
}
|
|
||||||
|
|
||||||
newtype RlpProgram b = RlpProgram [Decl RlpExpr b]
|
|
||||||
deriving Show
|
|
||||||
|
|
||||||
type RlpProgram' = RlpProgram Name
|
|
||||||
|
|
||||||
-- | The @e@ parameter is used for partial results. When parsing an input, we
|
|
||||||
-- first parse all top-level declarations in order to extract infix[lr]
|
|
||||||
-- declarations. This process yields a @[Decl (Const Text) Name]@, where @Const
|
|
||||||
-- Text@ stores the remaining unparsed function bodies. Once infixities are
|
|
||||||
-- accounted for, we may complete the parsing task and get a proper @[Decl
|
|
||||||
-- RlpExpr Name]@.
|
|
||||||
|
|
||||||
data Decl e b = FunD VarId [Pat b] (e b) (Maybe (Where b))
|
|
||||||
| TySigD [VarId] Type
|
|
||||||
| DataD ConId [Name] [ConAlt]
|
|
||||||
| InfixD Assoc Int Name
|
|
||||||
deriving Show
|
|
||||||
|
|
||||||
type Decl' e = Decl e Name
|
|
||||||
|
|
||||||
data Assoc = InfixL
|
|
||||||
| InfixR
|
|
||||||
| Infix
|
|
||||||
deriving Show
|
|
||||||
|
|
||||||
data ConAlt = ConAlt ConId [Type]
|
|
||||||
deriving Show
|
|
||||||
|
|
||||||
data RlpExpr b = LetE [Bind b] (RlpExpr b)
|
|
||||||
| VarE VarId
|
|
||||||
| ConE ConId
|
|
||||||
| LamE [Pat b] (RlpExpr b)
|
|
||||||
| CaseE (RlpExpr b) [(Alt b, Where b)]
|
|
||||||
| IfE (RlpExpr b) (RlpExpr b) (RlpExpr b)
|
|
||||||
| AppE (RlpExpr b) (RlpExpr b)
|
|
||||||
| LitE (Lit b)
|
|
||||||
deriving Show
|
|
||||||
|
|
||||||
type RlpExpr' = RlpExpr Name
|
|
||||||
|
|
||||||
type Where b = [Bind b]
|
|
||||||
type Where' = [Bind Name]
|
|
||||||
|
|
||||||
-- do we want guards?
|
|
||||||
data Alt b = AltA (Pat b) (RlpExpr b)
|
|
||||||
deriving Show
|
|
||||||
|
|
||||||
data Bind b = PatB (Pat b) (RlpExpr b)
|
|
||||||
| FunB VarId [Pat b] (RlpExpr b)
|
|
||||||
deriving Show
|
|
||||||
|
|
||||||
data VarId = NameVar Text
|
|
||||||
| SymVar Text
|
|
||||||
deriving Show
|
|
||||||
|
|
||||||
instance IsString VarId where
|
|
||||||
-- TODO: use symvar if it's an operator
|
|
||||||
fromString = NameVar . T.pack
|
|
||||||
|
|
||||||
data ConId = NameCon Text
|
|
||||||
| SymCon Text
|
|
||||||
deriving Show
|
|
||||||
|
|
||||||
data Pat b = VarP VarId
|
|
||||||
| LitP (Lit b)
|
|
||||||
| ConP ConId [Pat b]
|
|
||||||
deriving Show
|
|
||||||
|
|
||||||
type Pat' = Pat Name
|
|
||||||
|
|
||||||
data Lit b = IntL Int
|
|
||||||
| CharL Char
|
|
||||||
| ListL [RlpExpr b]
|
|
||||||
deriving Show
|
|
||||||
|
|
||||||
type Lit' = Lit Name
|
|
||||||
|
|
||||||
-- instance HasLHS Alt Alt Pat Pat where
|
|
||||||
-- _lhs = lens
|
|
||||||
-- (\ (AltA p _) -> p)
|
|
||||||
-- (\ (AltA _ e) p' -> AltA p' e)
|
|
||||||
|
|
||||||
-- instance HasRHS Alt Alt RlpExpr RlpExpr where
|
|
||||||
-- _rhs = lens
|
|
||||||
-- (\ (AltA _ e) -> e)
|
|
||||||
-- (\ (AltA p _) e' -> AltA p e')
|
|
||||||
|
|
||||||
makeBaseFunctor ''RlpExpr
|
|
||||||
|
|
||||||
deriving instance (Show b, Show a) => Show (RlpExprF b a)
|
|
||||||
|
|
||||||
type RlpExprF' = RlpExprF Name
|
|
||||||
|
|
||||||
-- society if derivable Show1
|
|
||||||
instance (Show b) => Show1 (RlpExprF b) where
|
|
||||||
liftShowsPrec sp _ p m = case m of
|
|
||||||
(LetEF bs e) -> showsBinaryWith showsPrec sp "LetEF" p bs e
|
|
||||||
(VarEF n) -> showsUnaryWith showsPrec "VarEF" p n
|
|
||||||
(ConEF n) -> showsUnaryWith showsPrec "ConEF" p n
|
|
||||||
(LamEF bs e) -> showsBinaryWith showsPrec sp "LamEF" p bs e
|
|
||||||
(CaseEF e as) -> showsBinaryWith sp showsPrec "CaseEF" p e as
|
|
||||||
(IfEF a b c) -> showsTernaryWith sp sp sp "IfEF" p a b c
|
|
||||||
(AppEF f x) -> showsBinaryWith sp sp "AppEF" p f x
|
|
||||||
(LitEF l) -> showsUnaryWith showsPrec "LitEF" p l
|
|
||||||
|
|
||||||
showsTernaryWith :: (Int -> x -> ShowS)
|
|
||||||
-> (Int -> y -> ShowS)
|
|
||||||
-> (Int -> z -> ShowS)
|
|
||||||
-> String -> Int
|
|
||||||
-> x -> y -> z
|
|
||||||
-> ShowS
|
|
||||||
showsTernaryWith sa sb sc name p a b c = showParen (p > 10)
|
|
||||||
$ showString name
|
|
||||||
. showChar ' ' . sa 11 a
|
|
||||||
. showChar ' ' . sb 11 b
|
|
||||||
. showChar ' ' . sc 11 c
|
|
||||||
|
|
||||||
--------------------------------------------------------------------------------
|
|
||||||
|
|
||||||
makeLenses ''RlpModule
|
|
||||||
|
|
||||||
@@ -38,25 +38,9 @@ spec = do
|
|||||||
let e = [coreExpr|3|]
|
let e = [coreExpr|3|]
|
||||||
in check' [] (TyCon "Bool") e `shouldSatisfy` isLeft
|
in check' [] (TyCon "Bool") e `shouldSatisfy` isLeft
|
||||||
|
|
||||||
it "should infer `fix ((+#) 1)` :: Int" $
|
infer' :: Context' -> Expr' -> Either TypeError Type
|
||||||
let g = [ ("fix", ("a" :-> "a") :-> "a")
|
infer' g e = fmap fst . runErrorful $ infer g e
|
||||||
, ("+#", TyInt :-> TyInt :-> TyInt) ]
|
|
||||||
e = [coreExpr|fix ((+#) 1)|]
|
|
||||||
in infer' g e `shouldBe` Right TyInt
|
|
||||||
|
|
||||||
it "should infer mutually recursively defined lists" $
|
check' :: Context' -> Type -> Expr' -> Either TypeError ()
|
||||||
let g = [ ("cons", TyInt :-> TyCon "IntList" :-> TyCon "IntList") ]
|
check' g t e = fmap fst . runErrorful $ check g t e
|
||||||
e :: Expr'
|
|
||||||
e = [coreExpr|letrec { as = cons 1 bs; bs = cons 2 as } in as|]
|
|
||||||
in infer' g e `shouldBe` Right (TyCon "IntList")
|
|
||||||
|
|
||||||
infer' :: Context' -> Expr' -> Either [TypeError] Type
|
|
||||||
infer' g e = case runErrorful $ infer g e of
|
|
||||||
(Just t, _) -> Right t
|
|
||||||
(Nothing, es) -> Left es
|
|
||||||
|
|
||||||
check' :: Context' -> Type -> Expr' -> Either [TypeError] ()
|
|
||||||
check' g t e = case runErrorful $ check g t e of
|
|
||||||
(Just t, _) -> Right ()
|
|
||||||
(Nothing, es) -> Left es
|
|
||||||
|
|
||||||
|
|||||||
40
tst/Core/ParseSpec.hs
Normal file
40
tst/Core/ParseSpec.hs
Normal file
@@ -0,0 +1,40 @@
|
|||||||
|
module Core.ParseSpec
|
||||||
|
( spec
|
||||||
|
)
|
||||||
|
where
|
||||||
|
----------------------------------------------------------------------------------
|
||||||
|
import CoreSyntax
|
||||||
|
import Core.Syntax
|
||||||
|
import Compiler.JustRun
|
||||||
|
import Compiler.RlpcError
|
||||||
|
import Control.Monad ((<=<))
|
||||||
|
import Data.Coerce
|
||||||
|
import Data.Text qualified as T
|
||||||
|
import Data.Functor.Classes (Eq1(..))
|
||||||
|
import Test.Hspec
|
||||||
|
import Test.QuickCheck
|
||||||
|
----------------------------------------------------------------------------------
|
||||||
|
|
||||||
|
spec :: Spec
|
||||||
|
spec = do
|
||||||
|
it "should be a right-inverse to the unparser \
|
||||||
|
\up to source code congruency" $
|
||||||
|
withMaxSuccess 20 $ property $
|
||||||
|
\p -> (unparse <=< parse) p ~== Right p
|
||||||
|
|
||||||
|
-- TODO: abitrary ASTs
|
||||||
|
-- it "should be a right-inverse to the unparser\
|
||||||
|
-- \up to source code congruency" $
|
||||||
|
-- property $ \p -> (parse <=< unparse) p == Right p
|
||||||
|
|
||||||
|
(~==) :: (Eq1 f) => f ProgramSrc -> f ProgramSrc -> Bool
|
||||||
|
(~==) = liftEq congruentSrc
|
||||||
|
|
||||||
|
infix 4 ~==
|
||||||
|
|
||||||
|
parse :: ProgramSrc -> Either RlpcError Program'
|
||||||
|
parse (ProgramSrc s) = justParseSrc (T.unpack s)
|
||||||
|
|
||||||
|
unparse :: Program' -> Either RlpcError ProgramSrc
|
||||||
|
unparse = Right . unparseCoreProg
|
||||||
|
|
||||||
303
tst/CoreSyntax.hs
Normal file
303
tst/CoreSyntax.hs
Normal file
@@ -0,0 +1,303 @@
|
|||||||
|
{-# LANGUAGE OverloadedStrings, LambdaCase, GeneralisedNewtypeDeriving #-}
|
||||||
|
module CoreSyntax
|
||||||
|
( ProgramSrc(..)
|
||||||
|
, congruentSrc
|
||||||
|
, unparseCoreProg
|
||||||
|
)
|
||||||
|
where
|
||||||
|
----------------------------------------------------------------------------------
|
||||||
|
import Core.Syntax
|
||||||
|
import Compiler.JustRun (justParseSrc)
|
||||||
|
import Control.Arrow ((>>>), (&&&))
|
||||||
|
import Control.Monad
|
||||||
|
import Data.List (intersperse)
|
||||||
|
import Data.Coerce (coerce)
|
||||||
|
import Data.Text (Text)
|
||||||
|
import Data.Text qualified as T
|
||||||
|
import Data.HashMap.Strict qualified as H
|
||||||
|
import Test.QuickCheck
|
||||||
|
import Text.PrettyPrint hiding ((<>))
|
||||||
|
import Data.Functor ((<&>))
|
||||||
|
import Data.Function ((&), on)
|
||||||
|
import Data.String (IsString(..))
|
||||||
|
import Lens.Micro.Platform
|
||||||
|
import Lens.Micro.Platform.Internal (IsText(..))
|
||||||
|
----------------------------------------------------------------------------------
|
||||||
|
|
||||||
|
newtype ProgramSrc = ProgramSrc Text
|
||||||
|
deriving (Show, Read, Eq, Semigroup, Monoid, IsString)
|
||||||
|
|
||||||
|
instance Arbitrary ProgramSrc where
|
||||||
|
arbitrary = sized genProg where
|
||||||
|
|
||||||
|
genProg :: Int -> Gen ProgramSrc
|
||||||
|
genProg n = do
|
||||||
|
-- in generating a program, we create a random list of sc names and
|
||||||
|
-- assign them type signatures and definitions in random order.
|
||||||
|
ns <- replicateM n genName
|
||||||
|
-- generate a typesig and def for each name
|
||||||
|
ns & each %~ (genTySig &&& genScDef)
|
||||||
|
-- [(typesig, scdef)] -> [typesigs and scdefs]
|
||||||
|
& uncurry (++) . unzip
|
||||||
|
-- [Gen Text] -> Gen [Text]
|
||||||
|
& sequenceA
|
||||||
|
-- shuffle order of tysigs and scdefs
|
||||||
|
>>= shuffle
|
||||||
|
-- terminate each tysig and scdef with a semicolon with a blank
|
||||||
|
-- line for legibility
|
||||||
|
<&> intersperse ";\n\n"
|
||||||
|
-- mconcat into a single body of text
|
||||||
|
<&> mconcat
|
||||||
|
-- she's done! put a bow on her! :D
|
||||||
|
<&> ProgramSrc
|
||||||
|
|
||||||
|
genTySig :: Name -> Gen Text
|
||||||
|
genTySig n = conseq [pure n, ws, pure "::", ws, genTy]
|
||||||
|
|
||||||
|
genScDef :: Name -> Gen Text
|
||||||
|
genScDef n = conseq [pure n, ws, pure "=", ws, genExpr]
|
||||||
|
|
||||||
|
genExpr :: Gen Text
|
||||||
|
genExpr = gen 4 0 where
|
||||||
|
gen 0 _ = oneof
|
||||||
|
[ genVar
|
||||||
|
, genLit
|
||||||
|
]
|
||||||
|
gen n p = oneof
|
||||||
|
[ gen 0 p
|
||||||
|
, wrapParens <$> gen n' 0
|
||||||
|
, genApp n p
|
||||||
|
, genLet n p
|
||||||
|
-- , genLam n p
|
||||||
|
-- , genCase n p
|
||||||
|
]
|
||||||
|
where n' = next n
|
||||||
|
|
||||||
|
genVar = oneof
|
||||||
|
[ genName
|
||||||
|
, genCon
|
||||||
|
, wrapParens <$> genSymName
|
||||||
|
, wrapParens <$> genSymCon
|
||||||
|
]
|
||||||
|
|
||||||
|
genCase n p = conseq [ pure "case", ws1, gen n' 0, ws1, pure "of"
|
||||||
|
, pure "{", alts, pure "}"
|
||||||
|
]
|
||||||
|
<&> pprec 0 p
|
||||||
|
where
|
||||||
|
n' = next n
|
||||||
|
alts = chooseSize (1,6) (listOf1 alt)
|
||||||
|
<&> intersperse ";"
|
||||||
|
<&> mconcat
|
||||||
|
alt = conseq [ tag, ws, pure "->", ws1, gen n' 0 ]
|
||||||
|
tag = T.pack . show <$> chooseInt (0,maxBound)
|
||||||
|
|
||||||
|
genLit = T.pack . show <$> chooseInt (0,maxBound)
|
||||||
|
|
||||||
|
genApp n p = chooseSize (2,10) (listOf1 (gen n' 1))
|
||||||
|
<&> pprec 0 p . mconcat . intersperse " "
|
||||||
|
where
|
||||||
|
n' = next n
|
||||||
|
|
||||||
|
genLet n p = conseq [ letw, ws, pure "{", ws, binds
|
||||||
|
, ws, pure "}", ws, pure "in"
|
||||||
|
, ws1, gen n' 0
|
||||||
|
]
|
||||||
|
where
|
||||||
|
letw = arbitrary <&> \case
|
||||||
|
Rec -> "letrec"
|
||||||
|
NonRec -> "let"
|
||||||
|
binds = chooseSize (1,6) (listOf1 bind)
|
||||||
|
<&> intersperse ";"
|
||||||
|
<&> mconcat
|
||||||
|
bind = conseq [var, ws, pure "=", ws, gen n' 0]
|
||||||
|
var = oneof [genName, wrapParens <$> genSymName]
|
||||||
|
n' = next n
|
||||||
|
|
||||||
|
genLam n p = conseq [l, ws, bs, ws, pure "->", ws, gen n' 0]
|
||||||
|
<&> pprec 0 p
|
||||||
|
where
|
||||||
|
-- whitespace because reserved op shenanigans :3
|
||||||
|
l = elements [" \\ ", "λ"]
|
||||||
|
n' = next n
|
||||||
|
bs = chooseSize (0,6) (listOf1 genName)
|
||||||
|
<&> mconcat
|
||||||
|
|
||||||
|
next = (`div` 2)
|
||||||
|
|
||||||
|
genTy :: Gen Text
|
||||||
|
genTy = gen 4 where
|
||||||
|
gen 0 = genCon
|
||||||
|
gen n = oneof
|
||||||
|
[ gen 0
|
||||||
|
-- function types
|
||||||
|
, conseq [gen n', ws, pure "->", ws, gen n']
|
||||||
|
-- TODO: type applications (remember precedence lol)
|
||||||
|
]
|
||||||
|
where n' = n `div` 2
|
||||||
|
|
||||||
|
instance Arbitrary Rec where
|
||||||
|
arbitrary = elements [Rec,NonRec]
|
||||||
|
|
||||||
|
chooseSize :: (Int, Int) -> Gen a -> Gen a
|
||||||
|
chooseSize (a,b) g = do
|
||||||
|
n <- chooseInt (a,b)
|
||||||
|
resize n g
|
||||||
|
|
||||||
|
-- | @pprec q p s@ wraps @s@ with parens when @p <= q@
|
||||||
|
pprec :: (IsString a, Monoid a) => Int -> Int -> a -> a
|
||||||
|
pprec maxp p
|
||||||
|
| p <= maxp = id
|
||||||
|
| otherwise = wrapParens
|
||||||
|
|
||||||
|
wrapParens :: (IsString a, Monoid a) => a -> a
|
||||||
|
wrapParens t = "(" <> t <> ")"
|
||||||
|
|
||||||
|
conseq :: (Applicative f, Monoid m, Traversable t)
|
||||||
|
=> t (f m)
|
||||||
|
-> f m
|
||||||
|
conseq tfm = sequenceA tfm <&> the_cool_kid's_concat
|
||||||
|
-- me when `concat` is generalised in the container but specialised in the
|
||||||
|
-- value, and `mconcat` is specialised in the container but generalised in
|
||||||
|
-- the value. shoutout `foldMap id`
|
||||||
|
where the_cool_kid's_concat = foldMap id
|
||||||
|
|
||||||
|
genName :: Gen Name
|
||||||
|
genName = T.pack <$> liftA2 (:) small namechars where
|
||||||
|
small = elements ['a'..'z']
|
||||||
|
|
||||||
|
genCon :: Gen Name
|
||||||
|
genCon = T.pack <$> liftA2 (:) large namechars where
|
||||||
|
large = elements ['A'..'Z']
|
||||||
|
|
||||||
|
genSymName :: Gen Name
|
||||||
|
genSymName = T.pack <$> liftA2 (:) symbol symchars where
|
||||||
|
symbol = elements nameSymbols
|
||||||
|
|
||||||
|
genSymCon :: Gen Name
|
||||||
|
genSymCon = T.pack . (':' :) <$> symchars
|
||||||
|
|
||||||
|
namechars :: Gen String
|
||||||
|
namechars = liftArbitrary namechar where
|
||||||
|
namechar :: Gen Char
|
||||||
|
namechar = elements $ ['a'..'z'] <> ['A'..'Z'] <> ['0'..'9'] <> "'"
|
||||||
|
|
||||||
|
nameSymbols :: [Char]
|
||||||
|
nameSymbols = "!#$%&*+./<=>?@^|-~"
|
||||||
|
|
||||||
|
symchars :: Gen String
|
||||||
|
symchars = liftArbitrary symchar where
|
||||||
|
symchar = elements $ ':' : nameSymbols
|
||||||
|
|
||||||
|
txt :: (IsText t) => t -> Doc
|
||||||
|
txt t = t ^. unpacked & text
|
||||||
|
|
||||||
|
ws :: (IsString a) => Gen a
|
||||||
|
ws = elements [""," ", " "]
|
||||||
|
|
||||||
|
ws1 :: (IsString a) => Gen a
|
||||||
|
ws1 = elements [" ", " "]
|
||||||
|
|
||||||
|
----------------------------------------------------------------------------------
|
||||||
|
|
||||||
|
-- | Two bodies of source code are considered congruent iff the parser produces
|
||||||
|
-- identical ASTs for both.
|
||||||
|
congruentSrc :: ProgramSrc -> ProgramSrc -> Bool
|
||||||
|
congruentSrc = (==) `on` (justParseSrc . T.unpack . coerce)
|
||||||
|
|
||||||
|
----------------------------------------------------------------------------------
|
||||||
|
|
||||||
|
-- TODO: unparseCoreProg :: Program -> [CoreToken]
|
||||||
|
-- womp womp.
|
||||||
|
|
||||||
|
-- TODO: implement shrink
|
||||||
|
|
||||||
|
-- | @unparseCoreProg@ should be inverse to @parseCoreProg@ up to source code
|
||||||
|
-- congruency, newtype coercion and errors handling.
|
||||||
|
unparseCoreProg :: Program' -> ProgramSrc
|
||||||
|
unparseCoreProg p = unparseTypeSigs (p ^. programTypeSigs)
|
||||||
|
<> unparseScDefs (p ^. programScDefs)
|
||||||
|
|
||||||
|
unparseTypeSigs :: H.HashMap Name Type -> ProgramSrc
|
||||||
|
unparseTypeSigs = H.foldrWithKey f mempty
|
||||||
|
where f k v a = unparseTypeSig k v <> ";\n\n" <> a
|
||||||
|
|
||||||
|
unparseTypeSig :: Name -> Type -> ProgramSrc
|
||||||
|
unparseTypeSig n t = unparseName n <> " :: " <> unparseType t
|
||||||
|
|
||||||
|
unparseName :: Name -> ProgramSrc
|
||||||
|
unparseName n
|
||||||
|
| T.head n `elem` (':' : nameSymbols) = coerce $ wrapParens n
|
||||||
|
| otherwise = coerce n
|
||||||
|
|
||||||
|
unparseType :: Type -> ProgramSrc
|
||||||
|
unparseType = go 0 where
|
||||||
|
go :: Int -> Type -> ProgramSrc
|
||||||
|
-- (:->) is a special case of TyApp, but we want the infix syntax
|
||||||
|
go p (a :-> b) = a : assocFun b
|
||||||
|
<&> go 1
|
||||||
|
& coerce (T.intercalate " -> ")
|
||||||
|
& pprec 0 p
|
||||||
|
go p a@(TyApp f x) = assocApp a
|
||||||
|
<&> go 1
|
||||||
|
& coerce (T.intercalate " ")
|
||||||
|
& pprec 1 p
|
||||||
|
go _ TyFun = "(->)"
|
||||||
|
go _ (TyCon a) = unparseName a
|
||||||
|
go _ (TyVar a) = unparseName a
|
||||||
|
|
||||||
|
assocFun :: Type -> [Type]
|
||||||
|
assocFun (a :-> b) = a : assocFun b
|
||||||
|
assocFun x = [x]
|
||||||
|
|
||||||
|
assocApp :: Type -> [Type]
|
||||||
|
assocApp (TyApp f x) = assocApp f ++ [x]
|
||||||
|
assocApp x = [x]
|
||||||
|
|
||||||
|
unparseScDefs :: [ScDef'] -> ProgramSrc
|
||||||
|
unparseScDefs = foldr f mempty where
|
||||||
|
f sc a = unparseScDef sc <> ";\n\n" <> a
|
||||||
|
|
||||||
|
unparseScDef :: ScDef' -> ProgramSrc
|
||||||
|
unparseScDef (ScDef n as e) = (unparseName <$> (n:as)) <> ["=", unparseExpr e]
|
||||||
|
& coerce (T.intercalate " ")
|
||||||
|
|
||||||
|
unparseExpr :: Expr' -> ProgramSrc
|
||||||
|
unparseExpr = go 0 where
|
||||||
|
go :: Int -> Expr' -> ProgramSrc
|
||||||
|
go _ (Var n) = unparseName n
|
||||||
|
go _ (Con t a) = mconcat ["Pack{",srcShow t," ",srcShow a,"}"]
|
||||||
|
go _ (Lit l) = unparseLit l
|
||||||
|
go p a@(App _ _) = srci " " (go 1 <$> assocApp a)
|
||||||
|
& pprec 0 p
|
||||||
|
go p (Lam bs e) = "λ" <> srci " " (unparseName <$> bs)
|
||||||
|
<> " -> " <> go 0 e
|
||||||
|
& pprec 0 p
|
||||||
|
go p (Let r bs e) = mconcat [lw," { ",bs'," } in ",go 0 e]
|
||||||
|
& pprec 0 p
|
||||||
|
where
|
||||||
|
lw = case r of { NonRec -> "let"; Rec -> "letrec" }
|
||||||
|
bs' = srci "; " $ unparseBinding <$> bs
|
||||||
|
go p (Case e as) = mconcat ["case ",go 0 e," of {",as',"}"]
|
||||||
|
& pprec 0 p
|
||||||
|
where as' = srci "; " (unparseAlter <$> as)
|
||||||
|
|
||||||
|
assocApp (App f x) = assocApp f ++ [x]
|
||||||
|
assocApp f = [f]
|
||||||
|
|
||||||
|
srci :: ProgramSrc -> [ProgramSrc] -> ProgramSrc
|
||||||
|
srci = coerce T.intercalate
|
||||||
|
|
||||||
|
unparseBinding :: Binding' -> ProgramSrc
|
||||||
|
unparseBinding (k := v) = mconcat [unparseName k, " = ", unparseExpr v]
|
||||||
|
|
||||||
|
unparseLit :: Lit -> ProgramSrc
|
||||||
|
unparseLit (IntL n) = srcShow n
|
||||||
|
|
||||||
|
srcShow :: (Show a) => a -> ProgramSrc
|
||||||
|
srcShow = coerce . T.pack . show
|
||||||
|
|
||||||
|
unparseAlter :: Alter' -> ProgramSrc
|
||||||
|
unparseAlter (Alter (AltData t) as e) = srcShow t <> " " <> coerce (T.unwords as)
|
||||||
|
<> " -> " <> unparseExpr e
|
||||||
|
|
||||||
@@ -21,28 +21,21 @@ spec = do
|
|||||||
resultOf [coreProg|id x = x; main = (id (-#)) 3 2;|] `shouldBe` Just (NNum 1)
|
resultOf [coreProg|id x = x; main = (id (-#)) 3 2;|] `shouldBe` Just (NNum 1)
|
||||||
|
|
||||||
it "should correctly evaluate arbitrary arithmetic" $ do
|
it "should correctly evaluate arbitrary arithmetic" $ do
|
||||||
property $ \e ->
|
withMaxSuccess 40 $ property $ \e ->
|
||||||
let arithRes = Just (evalArith e)
|
let arithRes = Just (evalArith e)
|
||||||
coreRes = evalCore e
|
coreRes = evalCore e
|
||||||
in coreRes `shouldBe` arithRes
|
in coreRes `shouldBe` arithRes
|
||||||
|
|
||||||
describe "test programs" $ do
|
describe "test programs" $ do
|
||||||
it "fac 3" $
|
it "fac 3" $ do
|
||||||
resultOf Ex.fac3 `shouldBe` Just (NNum 6)
|
resultOf Ex.fac3 `shouldBe` Just (NNum 6)
|
||||||
|
|
||||||
it "sum [1,2,3]" $
|
it "sum [1,2,3]" $ do
|
||||||
resultOf Ex.sumList `shouldBe` Just (NNum 6)
|
resultOf Ex.sumList `shouldBe` Just (NNum 6)
|
||||||
|
|
||||||
it "k 3 ((/#) 1 0)" $
|
it "k 3 ((/#) 1 0)" $ do
|
||||||
resultOf Ex.constDivZero `shouldBe` Just (NNum 3)
|
resultOf Ex.constDivZero `shouldBe` Just (NNum 3)
|
||||||
|
|
||||||
it "id (case ... of { ... })" $
|
it "id (case ... of { ... })" $ do
|
||||||
resultOf Ex.idCase `shouldBe` Just (NNum 5)
|
resultOf Ex.idCase `shouldBe` Just (NNum 5)
|
||||||
|
|
||||||
it "bool pattern matching with named constructors" $
|
|
||||||
resultOf Ex.namedBoolCase `shouldBe` Just (NNum 123)
|
|
||||||
|
|
||||||
it "list pattern matching with named constructors" $
|
|
||||||
resultOf Ex.namedConsCase `shouldBe` Just (NNum 6)
|
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user