Compare commits
2 commits
f870bbe3c7
...
01a6a5bbba
Author | SHA1 | Date | |
---|---|---|---|
Alex Bethel | 01a6a5bbba | ||
Alex Bethel | cd0353b31a |
|
@ -2,13 +2,13 @@
|
||||||
|
|
||||||
use std::{error::Error, fmt::Display, fs::File, io::Write, process::exit, str::FromStr};
|
use std::{error::Error, fmt::Display, fs::File, io::Write, process::exit, str::FromStr};
|
||||||
|
|
||||||
|
use clap::Parser;
|
||||||
use drimc_rs::{
|
use drimc_rs::{
|
||||||
ast2ir::ast2ir,
|
ast2ir::ast2ir,
|
||||||
backends,
|
backends,
|
||||||
parser::{parser, ParserError, ParserMeta},
|
parser::{parser, ParserError, ParserMeta},
|
||||||
typeck::typeck,
|
typeck::typeck,
|
||||||
};
|
};
|
||||||
use clap::Parser;
|
|
||||||
|
|
||||||
/// Optimization levels.
|
/// Optimization levels.
|
||||||
#[derive(Debug)]
|
#[derive(Debug)]
|
||||||
|
@ -256,7 +256,7 @@ fn main() {
|
||||||
let source = std::fs::read_to_string(&args.source_file)?;
|
let source = std::fs::read_to_string(&args.source_file)?;
|
||||||
let meta = ParserMeta::default();
|
let meta = ParserMeta::default();
|
||||||
let ast = chumsky::Parser::parse(&parser(&meta), source).map_err(ParserError)?;
|
let ast = chumsky::Parser::parse(&parser(&meta), source).map_err(ParserError)?;
|
||||||
typeck(&ast)?;
|
let ast = typeck(ast)?;
|
||||||
|
|
||||||
let ir = ast2ir(ast);
|
let ir = ast2ir(ast);
|
||||||
|
|
||||||
|
|
|
@ -10,7 +10,8 @@ use chumsky::{
|
||||||
};
|
};
|
||||||
|
|
||||||
use crate::syntax::{
|
use crate::syntax::{
|
||||||
ClassMember, Expr, Identifier, Literal, Pattern, Statement, SyntaxTree, Type, TypeConstructor,
|
ClassMember, Expr, ExprKind, Identifier, Literal, Pattern, Statement, SyntaxTree, Type,
|
||||||
|
TypeConstructor,
|
||||||
};
|
};
|
||||||
|
|
||||||
/// Adapter to make `chumsky`'s parser errors usable as standard Rust errors.
|
/// Adapter to make `chumsky`'s parser errors usable as standard Rust errors.
|
||||||
|
@ -330,6 +331,7 @@ fn parse_func_decl<'a>(
|
||||||
name,
|
name,
|
||||||
arguments,
|
arguments,
|
||||||
definition,
|
definition,
|
||||||
|
typ: None,
|
||||||
})
|
})
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -372,15 +374,15 @@ fn parse_expression<'a>(
|
||||||
let application = term.repeated().at_least(1).map(|exprs| {
|
let application = term.repeated().at_least(1).map(|exprs| {
|
||||||
exprs
|
exprs
|
||||||
.into_iter()
|
.into_iter()
|
||||||
.reduce(|l, r| Expr::Application {
|
.reduce(|l, r| {
|
||||||
|
expr(ExprKind::Application {
|
||||||
func: Box::new(l),
|
func: Box::new(l),
|
||||||
argument: Box::new(r),
|
argument: Box::new(r),
|
||||||
})
|
})
|
||||||
|
})
|
||||||
.unwrap()
|
.unwrap()
|
||||||
});
|
});
|
||||||
|
|
||||||
// let unary = parse_unary(m, term);
|
|
||||||
// let unary = term;
|
|
||||||
let unary = parse_unary(m, application);
|
let unary = parse_unary(m, application);
|
||||||
|
|
||||||
let binary = (0..=10).rev().fold(unary.boxed(), |p, precedence| {
|
let binary = (0..=10).rev().fold(unary.boxed(), |p, precedence| {
|
||||||
|
@ -399,12 +401,14 @@ fn parse_unary(
|
||||||
.repeated()
|
.repeated()
|
||||||
.then(base)
|
.then(base)
|
||||||
.map(|(ops, exp)| {
|
.map(|(ops, exp)| {
|
||||||
ops.into_iter().fold(exp, |exp, op| Expr::UnaryOp {
|
ops.into_iter().fold(exp, |exp, op| {
|
||||||
|
expr(ExprKind::UnaryOp {
|
||||||
kind: op.to_string(),
|
kind: op.to_string(),
|
||||||
val: Box::new(exp),
|
val: Box::new(exp),
|
||||||
translation: "negate".to_string(),
|
translation: "negate".to_string(),
|
||||||
})
|
})
|
||||||
})
|
})
|
||||||
|
})
|
||||||
}
|
}
|
||||||
|
|
||||||
fn parse_binary<'a>(
|
fn parse_binary<'a>(
|
||||||
|
@ -442,12 +446,12 @@ fn parse_binary<'a>(
|
||||||
others
|
others
|
||||||
.into_iter()
|
.into_iter()
|
||||||
.fold(first, |left, (op_name, _assoc, translation, right)| {
|
.fold(first, |left, (op_name, _assoc, translation, right)| {
|
||||||
Expr::BinaryOp {
|
expr(ExprKind::BinaryOp {
|
||||||
kind: op_name.to_owned(),
|
kind: op_name.to_owned(),
|
||||||
left: Box::new(left),
|
left: Box::new(left),
|
||||||
right: Box::new(right),
|
right: Box::new(right),
|
||||||
translation: translation.to_string(),
|
translation: translation.to_string(),
|
||||||
}
|
})
|
||||||
})
|
})
|
||||||
}
|
}
|
||||||
Some(Associativity::Right) => {
|
Some(Associativity::Right) => {
|
||||||
|
@ -488,12 +492,14 @@ fn parse_binary<'a>(
|
||||||
others_l
|
others_l
|
||||||
.into_iter()
|
.into_iter()
|
||||||
.rev()
|
.rev()
|
||||||
.fold(last.to_owned(), |r, (l, (op, trans))| Expr::BinaryOp {
|
.fold(last.to_owned(), |r, (l, (op, trans))| {
|
||||||
|
expr(ExprKind::BinaryOp {
|
||||||
kind: op.to_string(),
|
kind: op.to_string(),
|
||||||
left: Box::new(l.to_owned()),
|
left: Box::new(l.to_owned()),
|
||||||
right: Box::new(r),
|
right: Box::new(r),
|
||||||
translation: trans.to_string(),
|
translation: trans.to_string(),
|
||||||
})
|
})
|
||||||
|
})
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
})
|
})
|
||||||
|
@ -501,66 +507,72 @@ fn parse_binary<'a>(
|
||||||
|
|
||||||
fn parse_let_expr(
|
fn parse_let_expr(
|
||||||
m: &ParserMeta,
|
m: &ParserMeta,
|
||||||
base: impl Parser<char, Expr, Error = Simple<char>> + Clone,
|
rec: impl Parser<char, Expr, Error = Simple<char>> + Clone,
|
||||||
) -> impl Parser<char, Expr, Error = Simple<char>> + Clone {
|
) -> impl Parser<char, Expr, Error = Simple<char>> + Clone {
|
||||||
pad(keyword("let"))
|
pad(keyword("let"))
|
||||||
.ignore_then(parse_pattern(m))
|
.ignore_then(parse_pattern(m))
|
||||||
.then_ignore(pad(just('=')))
|
.then_ignore(pad(just('=')))
|
||||||
.then(base.clone())
|
.then(rec.clone())
|
||||||
.then_ignore(pad(keyword("in")))
|
.then_ignore(pad(keyword("in")))
|
||||||
.then(base)
|
.then(rec)
|
||||||
.map(|((left, right), into)| Expr::Let {
|
.map(|((left, right), into)| {
|
||||||
|
expr(ExprKind::Let {
|
||||||
left,
|
left,
|
||||||
right: Box::new(right),
|
right: Box::new(right),
|
||||||
into: Box::new(into),
|
into: Box::new(into),
|
||||||
})
|
})
|
||||||
|
})
|
||||||
}
|
}
|
||||||
|
|
||||||
fn parse_match_expr(
|
fn parse_match_expr(
|
||||||
m: &ParserMeta,
|
m: &ParserMeta,
|
||||||
base: impl Parser<char, Expr, Error = Simple<char>> + Clone,
|
rec: impl Parser<char, Expr, Error = Simple<char>> + Clone,
|
||||||
) -> impl Parser<char, Expr, Error = Simple<char>> + Clone {
|
) -> impl Parser<char, Expr, Error = Simple<char>> + Clone {
|
||||||
pad(keyword("match"))
|
pad(keyword("match"))
|
||||||
.ignore_then(base.clone())
|
.ignore_then(rec.clone())
|
||||||
.then(
|
.then(
|
||||||
parse_pattern(m)
|
parse_pattern(m)
|
||||||
.then_ignore(pad(just("=>")))
|
.then_ignore(pad(just("=>")))
|
||||||
.then(base)
|
.then(rec)
|
||||||
.separated_by(pad(just(",")))
|
.separated_by(pad(just(",")))
|
||||||
.allow_trailing()
|
.allow_trailing()
|
||||||
.delimited_by(pad(just('{')), pad(just('}'))),
|
.delimited_by(pad(just('{')), pad(just('}'))),
|
||||||
)
|
)
|
||||||
.map(|(matcher, cases)| Expr::Match {
|
.map(|(matcher, cases)| {
|
||||||
|
expr(ExprKind::Match {
|
||||||
matcher: Box::new(matcher),
|
matcher: Box::new(matcher),
|
||||||
cases,
|
cases,
|
||||||
})
|
})
|
||||||
|
})
|
||||||
}
|
}
|
||||||
|
|
||||||
fn parse_record_expr(
|
fn parse_record_expr(
|
||||||
_m: &ParserMeta,
|
_m: &ParserMeta,
|
||||||
base: impl Parser<char, Expr, Error = Simple<char>> + Clone,
|
rec: impl Parser<char, Expr, Error = Simple<char>> + Clone,
|
||||||
) -> impl Parser<char, Expr, Error = Simple<char>> + Clone {
|
) -> impl Parser<char, Expr, Error = Simple<char>> + Clone {
|
||||||
pad(ident())
|
pad(ident())
|
||||||
.then_ignore(pad(just(':')))
|
.then_ignore(pad(just(':')))
|
||||||
.then(base)
|
.then(rec)
|
||||||
.separated_by(pad(just(',')))
|
.separated_by(pad(just(',')))
|
||||||
.allow_trailing()
|
.allow_trailing()
|
||||||
.delimited_by(pad(just('{')), pad(just('}')))
|
.delimited_by(pad(just('{')), pad(just('}')))
|
||||||
.map(Expr::Record)
|
.map(|elems| expr(ExprKind::Record(elems)))
|
||||||
}
|
}
|
||||||
|
|
||||||
fn parse_lambda_expr(
|
fn parse_lambda_expr(
|
||||||
m: &ParserMeta,
|
m: &ParserMeta,
|
||||||
base: impl Parser<char, Expr, Error = Simple<char>> + Clone,
|
rec: impl Parser<char, Expr, Error = Simple<char>> + Clone,
|
||||||
) -> impl Parser<char, Expr, Error = Simple<char>> + Clone {
|
) -> impl Parser<char, Expr, Error = Simple<char>> + Clone {
|
||||||
pad(keyword("fn"))
|
pad(keyword("fn"))
|
||||||
.ignore_then(parse_pattern(m).repeated())
|
.ignore_then(parse_pattern(m).repeated())
|
||||||
.then_ignore(pad(just("->")))
|
.then_ignore(pad(just("->")))
|
||||||
.then(base)
|
.then(rec)
|
||||||
.map(|(arguments, result)| Expr::Lambda {
|
.map(|(arguments, result)| {
|
||||||
|
expr(ExprKind::Lambda {
|
||||||
arguments,
|
arguments,
|
||||||
result: Box::new(result),
|
result: Box::new(result),
|
||||||
})
|
})
|
||||||
|
})
|
||||||
}
|
}
|
||||||
|
|
||||||
fn parse_subscript_expr(
|
fn parse_subscript_expr(
|
||||||
|
@ -585,36 +597,38 @@ fn parse_subscript_expr(
|
||||||
.repeated(),
|
.repeated(),
|
||||||
)
|
)
|
||||||
.map(|(l, subscripts): (Expr, Vec<(SubscriptKind, Expr)>)| {
|
.map(|(l, subscripts): (Expr, Vec<(SubscriptKind, Expr)>)| {
|
||||||
subscripts.into_iter().fold(l, |l, (kind, r)| match kind {
|
subscripts.into_iter().fold(l, |l, (kind, r)| {
|
||||||
SubscriptKind::Dot => Expr::DotSubscript {
|
expr(match kind {
|
||||||
|
SubscriptKind::Dot => ExprKind::DotSubscript {
|
||||||
value: Box::new(l),
|
value: Box::new(l),
|
||||||
subscript: Box::new(r),
|
subscript: Box::new(r),
|
||||||
},
|
},
|
||||||
SubscriptKind::Bracket => Expr::BracketSubscript {
|
SubscriptKind::Bracket => ExprKind::BracketSubscript {
|
||||||
value: Box::new(l),
|
value: Box::new(l),
|
||||||
subscript: Box::new(r),
|
subscript: Box::new(r),
|
||||||
},
|
},
|
||||||
})
|
})
|
||||||
})
|
})
|
||||||
|
})
|
||||||
}
|
}
|
||||||
|
|
||||||
fn parse_tuple_expr(
|
fn parse_tuple_expr(
|
||||||
_m: &ParserMeta,
|
_m: &ParserMeta,
|
||||||
base: impl Parser<char, Expr, Error = Simple<char>> + Clone,
|
rec: impl Parser<char, Expr, Error = Simple<char>> + Clone,
|
||||||
) -> impl Parser<char, Expr, Error = Simple<char>> + Clone {
|
) -> impl Parser<char, Expr, Error = Simple<char>> + Clone {
|
||||||
base.separated_by(pad(just(',')))
|
rec.separated_by(pad(just(',')))
|
||||||
.delimited_by(pad(just('(')), pad(just(')')))
|
.delimited_by(pad(just('(')), pad(just(')')))
|
||||||
.map(|exprs| {
|
.map(|exprs| {
|
||||||
if exprs.len() == 1 {
|
if exprs.len() == 1 {
|
||||||
exprs.into_iter().next().unwrap()
|
exprs.into_iter().next().unwrap()
|
||||||
} else {
|
} else {
|
||||||
Expr::Tuple(exprs)
|
expr(ExprKind::Tuple(exprs))
|
||||||
}
|
}
|
||||||
})
|
})
|
||||||
}
|
}
|
||||||
|
|
||||||
fn parse_var_ref_expr(m: &ParserMeta) -> impl Parser<char, Expr, Error = Simple<char>> + Clone {
|
fn parse_var_ref_expr(m: &ParserMeta) -> impl Parser<char, Expr, Error = Simple<char>> + Clone {
|
||||||
parse_identifier(m).map(Expr::VariableReference)
|
parse_identifier(m).map(|r| expr(ExprKind::VariableReference(r)))
|
||||||
}
|
}
|
||||||
|
|
||||||
fn parse_literal(_m: &ParserMeta) -> impl Parser<char, Expr, Error = Simple<char>> + Clone {
|
fn parse_literal(_m: &ParserMeta) -> impl Parser<char, Expr, Error = Simple<char>> + Clone {
|
||||||
|
@ -659,7 +673,7 @@ fn parse_literal(_m: &ParserMeta) -> impl Parser<char, Expr, Error = Simple<char
|
||||||
.map(|(l, r)| (l + "." + &r).parse().unwrap())
|
.map(|(l, r)| (l + "." + &r).parse().unwrap())
|
||||||
.map(Literal::Float);
|
.map(Literal::Float);
|
||||||
|
|
||||||
pad(choice((int, float, string))).map(Expr::Literal)
|
pad(choice((int, float, string))).map(|lit| expr(ExprKind::Literal(lit)))
|
||||||
}
|
}
|
||||||
|
|
||||||
fn parse_identifier(
|
fn parse_identifier(
|
||||||
|
@ -797,8 +811,8 @@ fn parse_record_pattern(
|
||||||
|
|
||||||
fn parse_literal_pattern(m: &ParserMeta) -> impl Parser<char, Pattern, Error = Simple<char>> {
|
fn parse_literal_pattern(m: &ParserMeta) -> impl Parser<char, Pattern, Error = Simple<char>> {
|
||||||
// TODO: factor out literal parsing so we don't have to do this ugly `unreachable` stuff.
|
// TODO: factor out literal parsing so we don't have to do this ugly `unreachable` stuff.
|
||||||
parse_literal(m).map(|e| match e {
|
parse_literal(m).map(|e| match e.kind {
|
||||||
Expr::Literal(lit) => Pattern::Literal(lit),
|
ExprKind::Literal(lit) => Pattern::Literal(lit),
|
||||||
_ => unreachable!(),
|
_ => unreachable!(),
|
||||||
})
|
})
|
||||||
}
|
}
|
||||||
|
@ -829,6 +843,10 @@ fn ident() -> impl Parser<char, String, Error = Simple<char>> + Clone {
|
||||||
})
|
})
|
||||||
}
|
}
|
||||||
|
|
||||||
|
fn expr(e: ExprKind) -> Expr {
|
||||||
|
Expr { kind: e, typ: None }
|
||||||
|
}
|
||||||
|
|
||||||
#[cfg(test)]
|
#[cfg(test)]
|
||||||
mod tests {
|
mod tests {
|
||||||
use super::*;
|
use super::*;
|
||||||
|
|
|
@ -2,6 +2,8 @@
|
||||||
|
|
||||||
use num_bigint::BigUint;
|
use num_bigint::BigUint;
|
||||||
|
|
||||||
|
use crate::typeck;
|
||||||
|
|
||||||
/// A concrete syntax tree. This represents the full content of a Drim program, including all
|
/// A concrete syntax tree. This represents the full content of a Drim program, including all
|
||||||
/// whitespace, comments, and tokens: the source code of the original program can be recovered
|
/// whitespace, comments, and tokens: the source code of the original program can be recovered
|
||||||
/// completely using the syntax tree.
|
/// completely using the syntax tree.
|
||||||
|
@ -65,6 +67,10 @@ pub enum ClassMember {
|
||||||
|
|
||||||
/// The definition of the function.
|
/// The definition of the function.
|
||||||
definition: Option<Expr>,
|
definition: Option<Expr>,
|
||||||
|
|
||||||
|
/// The type of the overall function; this is filled in by the typechecker, and is left
|
||||||
|
/// blank by the parser.
|
||||||
|
typ: Option<typeck::Type>,
|
||||||
},
|
},
|
||||||
|
|
||||||
/// Declaration of a type that is a literal alias for another type.
|
/// Declaration of a type that is a literal alias for another type.
|
||||||
|
@ -87,9 +93,19 @@ pub struct TypeConstructor {
|
||||||
pub args: Vec<Type>,
|
pub args: Vec<Type>,
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Expressions.
|
/// An expression.
|
||||||
#[derive(Clone, Debug)]
|
#[derive(Clone, Debug)]
|
||||||
pub enum Expr {
|
pub struct Expr {
|
||||||
|
/// The contents of the expression.
|
||||||
|
pub kind: ExprKind,
|
||||||
|
|
||||||
|
/// An optional type signature, left as `None` by the parser and added by the type checker.
|
||||||
|
pub typ: Option<typeck::Type>,
|
||||||
|
}
|
||||||
|
|
||||||
|
/// The different kinds of expressions.
|
||||||
|
#[derive(Clone, Debug)]
|
||||||
|
pub enum ExprKind {
|
||||||
/// Unary operators, e.g., `-5`.
|
/// Unary operators, e.g., `-5`.
|
||||||
UnaryOp {
|
UnaryOp {
|
||||||
/// The text of the operator.
|
/// The text of the operator.
|
||||||
|
@ -252,7 +268,7 @@ pub enum Pattern {
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Namespaced identifiers.
|
/// Namespaced identifiers.
|
||||||
#[derive(Clone, Debug)]
|
#[derive(Clone, Debug, Hash, PartialEq)]
|
||||||
pub struct Identifier {
|
pub struct Identifier {
|
||||||
/// The elements of the identifier; there must be at least one of these.
|
/// The elements of the identifier; there must be at least one of these.
|
||||||
pub elems: Vec<String>,
|
pub elems: Vec<String>,
|
||||||
|
|
|
@ -1,8 +1,10 @@
|
||||||
//! Type checker.
|
//! Type checker.
|
||||||
|
|
||||||
use std::{error::Error, fmt::Display};
|
use std::{collections::BTreeMap, error::Error, fmt::Display};
|
||||||
|
|
||||||
use crate::syntax::SyntaxTree;
|
use num_bigint::BigInt;
|
||||||
|
|
||||||
|
use crate::syntax::{Identifier, SyntaxTree};
|
||||||
|
|
||||||
/// A compile-time type error from the user's source code.
|
/// A compile-time type error from the user's source code.
|
||||||
#[derive(Debug)]
|
#[derive(Debug)]
|
||||||
|
@ -16,7 +18,39 @@ impl Display for TypeError {
|
||||||
|
|
||||||
impl Error for TypeError {}
|
impl Error for TypeError {}
|
||||||
|
|
||||||
|
/// A type known at compile time. While this resembles the AST `Type` structure, this enum is
|
||||||
|
/// optimized for unifying types against one another and representing compiler-generated types
|
||||||
|
/// rather than strictly representing named types.
|
||||||
|
#[derive(Debug, Clone, PartialEq)]
|
||||||
|
pub enum Type {
|
||||||
|
/// `Foo`
|
||||||
|
Named(Identifier),
|
||||||
|
|
||||||
|
/// `List Int`
|
||||||
|
Application {
|
||||||
|
/// The function being applied. This must be a generic type.
|
||||||
|
function: Box<Type>,
|
||||||
|
|
||||||
|
/// The type given as an argument to the type.
|
||||||
|
expression: Box<Type>,
|
||||||
|
},
|
||||||
|
|
||||||
|
/// `(a, b)`
|
||||||
|
Tuple(Vec<Type>),
|
||||||
|
|
||||||
|
/// `{ a: x, b: y }`
|
||||||
|
Record(BTreeMap<String, Type>),
|
||||||
|
|
||||||
|
/// Compiler-internal type representing an arbitrary-precision integer whose value is known at
|
||||||
|
/// compile time. This is the default type of integer literals. A `CompInt` can be converted to
|
||||||
|
/// an actual integer type via implicit application of the `fromCompInt` generic function.
|
||||||
|
CompInt(BigInt),
|
||||||
|
|
||||||
|
/// Compiler-internal type representing a string literal. See `CompInt`.
|
||||||
|
CompString(String),
|
||||||
|
}
|
||||||
|
|
||||||
/// Type-checks the syntax tree.
|
/// Type-checks the syntax tree.
|
||||||
pub fn typeck(_: &SyntaxTree) -> Result<(), TypeError> {
|
pub fn typeck(_: SyntaxTree) -> Result<SyntaxTree, TypeError> {
|
||||||
todo!()
|
todo!()
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in a new issue