schala/schala-lang/src/parsing.rs

1359 lines
44 KiB
Rust
Raw Normal View History

2017-08-29 05:08:09 -07:00
use std::rc::Rc;
use std::iter::Peekable;
2017-09-09 01:25:11 -07:00
use std::vec::IntoIter;
2017-08-29 04:27:07 -07:00
2018-03-23 18:43:43 -07:00
use tokenizing::*;
use tokenizing::Kw::*;
use tokenizing::TokenType::*;
2017-09-06 09:42:29 -07:00
2018-03-23 18:43:43 -07:00
use builtin::{BinOp, PrefixOp};
2017-09-11 02:07:17 -07:00
/* Schala EBNF Grammar */
2017-09-17 00:04:27 -07:00
/* Terminal productions are in 'single quotes' or UPPERCASE if they are a class
2017-09-13 22:40:05 -07:00
* or not representable in ASCII
2017-09-11 02:07:17 -07:00
program := (statement delimiter)* EOF
2017-09-17 00:04:27 -07:00
delimiter := NEWLINE | ';'
2017-09-11 02:07:17 -07:00
statement := expression | declaration
2017-10-04 22:02:31 -07:00
declaration := type_declaration | func_declaration | binding_declaration | impl_declaration
2017-09-11 02:07:17 -07:00
2017-10-04 22:02:31 -07:00
type_declaration := 'type' type_declaration_body
2018-02-12 00:51:53 -08:00
type_declaration_body := 'alias' type_alias | type_singleton_name '=' type_body
2017-10-08 18:47:57 -07:00
type_alias := IDENTIFIER '=' type_name
2017-09-17 00:04:27 -07:00
type_body := variant_specifier ('|' variant_specifier)*
2017-10-08 18:47:57 -07:00
2017-10-08 19:02:52 -07:00
variant_specifier := IDENTIFIER | IDENTIFIER '{' typed_identifier_list '}' | IDENTIFIER '(' type_name* ')'
typed_identifier_list := typed_identifier*
typed_identifier := IDENTIFIER type_anno
2017-09-11 20:37:19 -07:00
func_declaration := func_signature func_body
func_body := ε | '{' (statement delimiter)* '}'
func_signature := 'fn' IDENTIFIER formal_param_list func_body
2017-10-08 20:55:05 -07:00
formal_param_list := '(' (formal_param ',')* ')'
formal_param := IDENTIFIER type_anno+
2017-09-11 02:07:17 -07:00
2017-09-17 06:04:24 -07:00
binding_declaration: 'var' IDENTIFIER '=' expression
| 'const' IDENTIFIER '=' expression
2018-04-24 16:30:17 -07:00
interface_declaration := 'interface' interface_name signature_block
impl_declaration := 'impl' IDENTIFIER decl_block | 'impl' interface_name 'for' IDENTIFIER decl_block
2017-10-08 14:24:02 -07:00
decl_block := '{' (func_declaration)* '}'
2018-02-21 22:06:56 -08:00
signature_block := '{' (func_signature)* '}'
2017-10-08 14:24:02 -07:00
2018-04-24 16:30:17 -07:00
interface_name := IDENTIFIER
2017-10-03 03:49:07 -07:00
2017-09-28 23:55:10 -07:00
type_anno := (':' type_name)+
2018-02-12 00:51:53 -08:00
type_name := type_singleton_name | '(' type_names ')'
2017-09-28 23:55:10 -07:00
type_names := ε | type_name (, type_name)*
2018-02-12 00:51:53 -08:00
type_singleton_name = IDENTIFIER (type_params)*
2017-09-28 23:55:10 -07:00
type_params := '<' type_name (, type_name)* '>'
2017-09-11 23:16:37 -07:00
expression := precedence_expr type_anno+
2017-09-17 17:44:06 -07:00
precedence_expr := prefix_expr
prefix_expr := prefix_op call_expr
2017-09-17 17:44:06 -07:00
prefix_op := '+' | '-' | '!' | '~'
2018-03-06 02:51:45 -08:00
call_expr := index_expr ( '(' expr_list ')' )*
index_expr := primary ( '[' (expression (',' (expression)* | ε) ']' )*
primary := literal | paren_expr | if_expr | match_expr | for_expr | while_expr | identifier_expr | curly_brace_expr | list_expr
2018-03-04 02:11:22 -08:00
curly_brace_expr := lambda_expr | anonymous_struct //TODO
2018-03-08 12:01:24 -08:00
list_expr := '[' (expression, ',')* ']'
2018-05-13 01:40:14 -07:00
lambda_expr := '{' '|' (formal_param ',')* '|' (type_anno)* (statement delimiter)* '}'
2017-10-06 20:28:07 -07:00
paren_expr := LParen paren_inner RParen
paren_inner := (expression ',')*
2018-03-06 02:51:45 -08:00
identifier_expr := named_struct | IDENTIFIER
2018-03-08 12:01:24 -08:00
2017-09-17 00:04:27 -07:00
literal := 'true' | 'false' | number_literal | STR_LITERAL
2017-09-11 02:07:17 -07:00
named_struct := IDENTIFIER record_block
2017-10-14 13:54:17 -07:00
record_block := '{' (record_entry, ',')* | '}' //TODO support anonymus structs, update syntax
record_entry := IDENTIFIER ':' expression
2018-03-04 02:11:22 -08:00
anonymous_struct := TODO
2017-09-18 23:22:28 -07:00
if_expr := 'if' expression block else_clause
else_clause := ε | 'else' block
2017-09-30 14:11:38 -07:00
match_expr := 'match' expression match_body
match_body := '{' (match_arm)* '}'
match_arm := pattern '=>' expression
2017-09-21 16:00:14 -07:00
pattern := identifier //TODO NOT DONE
2017-09-20 20:30:30 -07:00
2018-05-13 01:40:14 -07:00
block := '{' (statement delimiter)* '}'
2017-09-18 23:22:28 -07:00
2017-09-17 00:04:27 -07:00
expr_list := expression (',' expression)* | ε
2017-09-11 15:42:49 -07:00
2018-05-13 01:40:14 -07:00
while_expr := 'while' while_cond '{' (statement delimiter)* '}'
while_cond := ε | expression | expression 'is' pattern //TODO maybe is-expresions should be primary
2018-05-13 01:40:14 -07:00
//TODO this implies there must be at least one enumerator, which the parser doesn't support right
//this second, and maybe should fail later anyway
for_expr := 'for' (enumerator | '{' enumerators '}') for_expr_body
2018-05-13 01:40:14 -07:00
for_expr_body := 'return' expression | '{' (statement delimiter)* '}
enumerators := enumerator (',' enumerators)*
2018-05-13 01:40:14 -07:00
enumerator := identifier '<-' expression | identifier '=' expression //TODO add guards, etc.
2017-09-18 23:22:28 -07:00
2017-09-11 02:07:17 -07:00
// a float_literal can still be assigned to an int in type-checking
number_literal := int_literal | float_literal
2017-09-13 22:40:05 -07:00
int_literal = ('0x' | '0b') digits
float_literal := digits ('.' digits)
digits := (DIGIT_GROUP underscore)+
2017-09-11 02:07:17 -07:00
*/
2017-09-09 01:25:11 -07:00
type TokenIter = Peekable<IntoIter<Token>>;
#[derive(Debug, PartialEq)]
2017-09-11 02:07:17 -07:00
pub struct ParseError {
pub msg: String,
}
impl ParseError {
fn new<T>(msg: &str) -> ParseResult<T> {
Err(ParseError { msg: msg.to_string() })
}
}
pub type ParseResult<T> = Result<T, ParseError>;
#[derive(Debug)]
2017-09-17 05:06:58 -07:00
pub struct ParseRecord {
production_name: String,
next_token: String,
2018-02-10 15:10:06 -08:00
level: u32,
2017-09-17 05:06:58 -07:00
}
2017-09-08 16:42:42 -07:00
struct Parser {
2017-09-09 01:25:11 -07:00
tokens: TokenIter,
parse_record: Vec<ParseRecord>,
parse_level: u32,
restrictions: ParserRestrictions,
}
struct ParserRestrictions {
no_struct_literal: bool
2017-09-09 01:25:11 -07:00
}
impl Parser {
fn new(input: Vec<Token>) -> Parser {
Parser {
tokens: input.into_iter().peekable(),
parse_record: vec![],
parse_level: 0,
restrictions: ParserRestrictions { no_struct_literal: false }
}
2017-09-09 01:25:11 -07:00
}
2017-09-11 02:07:17 -07:00
fn peek(&mut self) -> TokenType {
self.tokens.peek().map(|ref t| { t.token_type.clone() }).unwrap_or(TokenType::EOF)
2017-09-09 01:27:15 -07:00
}
fn peek_with_token_offset(&mut self) -> Token {
2018-03-02 15:21:48 -08:00
self.tokens.peek().map(|t: &Token| { t.clone()}).unwrap_or(Token { token_type: TokenType::EOF, offset: (0,0)})
}
2017-09-11 02:07:17 -07:00
fn next(&mut self) -> TokenType {
self.tokens.next().map(|ref t| { t.token_type.clone() }).unwrap_or(TokenType::EOF)
2017-09-09 01:25:11 -07:00
}
2017-09-08 16:42:42 -07:00
}
macro_rules! print_token_pattern {
($tokenpattern:pat) => { stringify!($tokenpattern) }
}
2017-09-11 02:07:17 -07:00
macro_rules! expect {
($self:expr, $token_type:pat) => { expect!($self, $token_type if true) };
($self:expr, $token_type:pat if $cond:expr) => {
2017-09-13 22:40:05 -07:00
match $self.peek() {
$token_type if $cond => $self.next(),
2017-09-30 14:41:37 -07:00
tok => {
let msg = format!("Expected {}, got {:?}", print_token_pattern!($token_type), tok);
2017-09-30 14:41:37 -07:00
return Err(ParseError { msg })
}
2017-09-13 22:40:05 -07:00
}
2017-09-11 02:07:17 -07:00
}
2017-09-09 00:31:15 -07:00
}
2017-09-11 03:21:07 -07:00
#[derive(Debug, PartialEq)]
2017-10-01 12:55:28 -07:00
pub struct AST(pub Vec<Statement>);
2017-09-08 16:42:42 -07:00
2017-10-08 13:51:56 -07:00
#[derive(Debug, PartialEq, Clone)]
2017-09-08 16:42:42 -07:00
pub enum Statement {
2017-09-28 00:06:08 -07:00
ExpressionStatement(Expression),
2017-09-08 16:42:42 -07:00
Declaration(Declaration),
}
2018-05-06 23:09:03 -07:00
type Block = Vec<Statement>;
2017-09-13 23:04:45 -07:00
type ParamName = Rc<String>;
2018-04-24 16:30:17 -07:00
type InterfaceName = Rc<String>; //should be a singleton I think??
2017-10-08 20:55:05 -07:00
type FormalParam = (ParamName, Option<TypeName>);
2017-09-13 23:04:45 -07:00
2017-10-08 13:51:56 -07:00
#[derive(Debug, PartialEq, Clone)]
2017-09-08 16:42:42 -07:00
pub enum Declaration {
FuncSig(Signature),
2018-05-06 23:09:03 -07:00
FuncDecl(Signature, Block),
2018-02-12 00:51:53 -08:00
TypeDecl(TypeSingletonName, TypeBody), //should have TypeSingletonName in it
2018-02-12 00:25:48 -08:00
TypeAlias(Rc<String>, Rc<String>), //should have TypeSingletonName in it, or maybe just String, not sure
2017-09-17 06:04:24 -07:00
Binding {
name: Rc<String>,
constant: bool,
expr: Expression,
2017-10-03 03:49:07 -07:00
},
Impl {
type_name: TypeName,
2018-04-24 16:30:17 -07:00
interface_name: Option<InterfaceName>,
2017-10-03 03:49:07 -07:00
block: Vec<Declaration>,
},
2018-04-24 16:30:17 -07:00
Interface {
2018-02-22 03:26:32 -08:00
name: Rc<String>,
2018-02-21 22:06:56 -08:00
signatures: Vec<Signature>
}
2017-09-11 15:42:49 -07:00
}
#[derive(Debug, PartialEq, Clone)]
pub struct Signature {
2017-10-09 02:26:59 -07:00
pub name: Rc<String>,
pub params: Vec<FormalParam>,
pub type_anno: Option<TypeName>,
}
2017-10-08 13:51:56 -07:00
#[derive(Debug, PartialEq, Clone)]
2017-10-01 12:55:28 -07:00
pub struct TypeBody(pub Vec<Variant>);
2017-09-13 22:40:05 -07:00
2017-10-08 13:51:56 -07:00
#[derive(Debug, PartialEq, Clone)]
2017-09-13 22:40:05 -07:00
pub enum Variant {
UnitStruct(Rc<String>),
2017-10-08 19:30:52 -07:00
TupleStruct(Rc<String>, Vec<TypeName>),
Record(Rc<String>, Vec<(Rc<String>, TypeName)>),
2017-09-08 16:42:42 -07:00
}
2017-10-08 13:51:56 -07:00
#[derive(Debug, PartialEq, Clone)]
2017-10-08 19:30:52 -07:00
pub struct Expression(pub ExpressionType, pub Option<TypeName>);
2017-09-27 22:27:50 -07:00
2017-10-08 13:51:56 -07:00
#[derive(Debug, PartialEq, Clone)]
2017-10-08 19:30:52 -07:00
pub enum TypeName {
Tuple(Vec<TypeName>),
2018-02-12 00:25:48 -08:00
Singleton(TypeSingletonName)
}
#[derive(Debug, PartialEq, Clone)]
pub struct TypeSingletonName {
pub name: Rc<String>,
pub params: Vec<TypeName>,
2017-09-28 23:55:10 -07:00
}
2017-09-27 22:27:50 -07:00
2017-10-08 13:51:56 -07:00
#[derive(Debug, PartialEq, Clone)]
2017-09-27 22:27:50 -07:00
pub enum ExpressionType {
2018-05-12 01:44:03 -07:00
NatLiteral(u64),
2017-09-08 16:42:42 -07:00
FloatLiteral(f64),
2017-09-16 15:57:48 -07:00
StringLiteral(Rc<String>),
2017-09-17 04:31:27 -07:00
BoolLiteral(bool),
BinExp(BinOp, Box<Expression>, Box<Expression>),
PrefixExp(PrefixOp, Box<Expression>),
2017-10-06 20:28:07 -07:00
TupleLiteral(Vec<Expression>),
Value(Rc<String>),
NamedStruct {
name: Rc<String>,
fields: Vec<(Rc<String>, Expression)>,
},
Call {
f: Box<Expression>,
2017-10-08 22:52:05 -07:00
arguments: Vec<Expression>,
},
Index {
indexee: Box<Expression>,
indexers: Vec<Expression>,
2017-09-18 23:22:28 -07:00
},
2018-05-06 23:09:03 -07:00
IfExpression(Box<Expression>, Block, Option<Block>),
2017-10-08 22:02:58 -07:00
MatchExpression(Box<Expression>, Vec<MatchArm>),
WhileExpression {
condition: Option<Box<Expression>>,
body: Block,
},
ForExpression {
2018-05-13 01:40:14 -07:00
enumerators: Vec<Enumerator>,
body: Box<ForBody>,
},
2018-03-04 02:11:22 -08:00
Lambda {
params: Vec<FormalParam>,
2018-05-06 23:09:03 -07:00
body: Block,
2018-03-04 02:11:22 -08:00
},
2018-03-08 12:01:24 -08:00
ListLiteral(Vec<Expression>),
2017-09-12 02:30:27 -07:00
}
2018-05-13 01:40:14 -07:00
#[derive(Debug, PartialEq, Clone)]
pub struct Enumerator {
id: Rc<String>,
generator: Expression,
}
#[derive(Debug, PartialEq, Clone)]
pub enum ForBody {
MonadicReturn(Expression),
StatementBlock(Block),
}
2017-10-08 13:51:56 -07:00
#[derive(Debug, PartialEq, Clone)]
2017-09-20 21:05:08 -07:00
pub struct MatchArm {
pat: Pattern,
expr: Expression,
}
2017-10-08 13:51:56 -07:00
#[derive(Debug, PartialEq, Clone)]
2017-09-21 16:00:14 -07:00
pub struct Pattern(Rc<String>);
2017-09-20 21:05:08 -07:00
macro_rules! parse_method {
($name:ident(&mut $self:ident) -> $type:ty $body:block) => {
fn $name(&mut $self) -> $type {
let next_token = $self.peek_with_token_offset();
2017-09-17 05:06:58 -07:00
let record = ParseRecord {
production_name: stringify!($name).to_string(),
2018-03-02 22:11:25 -08:00
next_token: format!("{}", next_token.to_string_with_metadata()),
2018-02-10 15:10:06 -08:00
level: $self.parse_level,
2017-09-17 05:06:58 -07:00
};
2018-02-10 15:10:06 -08:00
$self.parse_level += 1;
$self.parse_record.push(record);
2018-02-10 15:10:06 -08:00
let result = { $body };
if $self.parse_level != 0 {
$self.parse_level -= 1;
}
result
}
};
}
2017-09-28 23:55:10 -07:00
macro_rules! delimited {
2018-05-13 02:50:43 -07:00
($self:expr, $start:pat, $parse_fn:ident, $( $delim:pat )|+, $end:pat, nonstrict) => {
delimited!($self, $start, $parse_fn, $( $delim )|*, $end, false)
};
2018-05-13 02:50:43 -07:00
($self:expr, $start:pat, $parse_fn:ident, $( $delim:pat )|+, $end:pat) => {
delimited!($self, $start, $parse_fn, $( $delim )|*, $end, true)
};
2018-05-13 02:50:43 -07:00
($self:expr, $start:pat, $parse_fn:ident, $( $delim:pat )|+, $end:pat, $strictness:expr) => {
2017-09-28 23:55:10 -07:00
{
expect!($self, $start);
let mut acc = vec![];
loop {
2017-09-30 13:46:50 -07:00
let peek = $self.peek();
match peek {
$end | EOF => break,
_ => (),
}
if !$strictness {
match peek {
$( $delim )|* => { $self.next(); continue },
_ => ()
}
}
acc.push($self.$parse_fn()?);
match $self.peek() {
$( $delim )|* => { $self.next(); continue },
_ if $strictness => break,
_ => continue,
};
}
expect!($self, $end);
acc
2017-09-28 23:55:10 -07:00
}
};
2017-09-28 23:55:10 -07:00
}
2017-09-11 02:07:17 -07:00
impl Parser {
parse_method!(program(&mut self) -> ParseResult<AST> {
let mut statements = Vec::new();
loop {
match self.peek() {
EOF => break,
Newline | Semicolon => {
self.next();
continue;
},
_ => statements.push(self.statement()?),
}
}
Ok(AST(statements))
});
2017-09-11 02:07:17 -07:00
parse_method!(statement(&mut self) -> ParseResult<Statement> {
2017-09-11 02:07:17 -07:00
//TODO handle error recovery here
match self.peek() {
Keyword(Type) => self.type_declaration().map(|decl| { Statement::Declaration(decl) }),
Keyword(Func)=> self.func_declaration().map(|func| { Statement::Declaration(func) }),
2017-09-17 06:04:24 -07:00
Keyword(Var) | Keyword(Const) => self.binding_declaration().map(|decl| Statement::Declaration(decl)),
2018-04-24 16:30:17 -07:00
Keyword(Interface) => self.interface_declaration().map(|decl| Statement::Declaration(decl)),
2017-10-03 03:49:07 -07:00
Keyword(Impl) => self.impl_declaration().map(|decl| Statement::Declaration(decl)),
2017-09-28 00:06:08 -07:00
_ => self.expression().map(|expr| { Statement::ExpressionStatement(expr) } ),
2017-09-11 02:07:17 -07:00
}
});
2017-09-11 02:07:17 -07:00
2017-10-04 22:02:31 -07:00
parse_method!(type_declaration(&mut self) -> ParseResult<Declaration> {
expect!(self, Keyword(Type));
2017-10-04 22:02:31 -07:00
self.type_declaration_body()
});
parse_method!(type_declaration_body(&mut self) -> ParseResult<Declaration> {
if let Keyword(Alias) = self.peek() {
self.type_alias()
} else {
2018-02-12 00:51:53 -08:00
let name = self.type_singleton_name()?;
expect!(self, Operator(ref c) if **c == "=");
2017-10-04 22:02:31 -07:00
let body = self.type_body()?;
Ok(Declaration::TypeDecl(name, body))
}
});
parse_method!(type_alias(&mut self) -> ParseResult<Declaration> {
expect!(self, Keyword(Alias));
2017-09-13 22:40:05 -07:00
let alias = self.identifier()?;
expect!(self, Operator(ref c) if **c == "=");
2017-09-13 22:40:05 -07:00
let original = self.identifier()?;
Ok(Declaration::TypeAlias(alias, original))
});
2017-09-13 22:40:05 -07:00
parse_method!(type_body(&mut self) -> ParseResult<TypeBody> {
2017-10-08 18:47:57 -07:00
let mut variants = Vec::new();
variants.push(self.variant_specifier()?);
loop {
if let Pipe = self.peek() {
self.next();
variants.push(self.variant_specifier()?);
} else {
break;
}
}
Ok(TypeBody(variants))
});
parse_method!(variant_specifier(&mut self) -> ParseResult<Variant> {
2017-10-08 19:02:52 -07:00
use self::Variant::*;
let name = self.identifier()?;
match self.peek() {
LParen => {
2018-05-13 02:50:43 -07:00
let tuple_members = delimited!(self, LParen, type_name, Comma, RParen);
2017-10-08 19:02:52 -07:00
Ok(TupleStruct(name, tuple_members))
},
LCurlyBrace => {
2018-05-13 02:50:43 -07:00
let typed_identifier_list = delimited!(self, LCurlyBrace, typed_identifier, Comma, RCurlyBrace);
2017-10-08 19:02:52 -07:00
Ok(Record(name, typed_identifier_list))
},
_ => Ok(UnitStruct(name))
2017-10-08 19:02:52 -07:00
}
});
2017-10-08 19:30:52 -07:00
parse_method!(typed_identifier(&mut self) -> ParseResult<(Rc<String>, TypeName)> {
2017-10-08 19:02:52 -07:00
let identifier = self.identifier()?;
expect!(self, Colon);
2017-10-08 19:02:52 -07:00
let type_name = self.type_name()?;
Ok((identifier, type_name))
});
2017-09-11 02:07:17 -07:00
parse_method!(func_declaration(&mut self) -> ParseResult<Declaration> {
let signature = self.signature()?;
if let LCurlyBrace = self.peek() {
2018-05-13 02:50:43 -07:00
let statements = delimited!(self, LCurlyBrace, statement, Newline | Semicolon, RCurlyBrace, nonstrict);
Ok(Declaration::FuncDecl(signature, statements))
} else {
Ok(Declaration::FuncSig(signature))
}
});
parse_method!(signature(&mut self) -> ParseResult<Signature> {
expect!(self, Keyword(Func));
2017-09-11 20:37:19 -07:00
let name = self.identifier()?;
2018-05-13 02:50:43 -07:00
let params = delimited!(self, LParen, formal_param, Comma, RParen);
let type_anno = match self.peek() {
Colon => Some(self.type_anno()?),
_ => None,
};
Ok(Signature { name, params, type_anno })
});
2017-09-11 20:37:19 -07:00
2017-10-08 20:55:05 -07:00
parse_method!(formal_param(&mut self) -> ParseResult<FormalParam> {
let name = self.identifier()?;
let ty = match self.peek() {
Colon => Some(self.type_anno()?),
_ => None
};
Ok((name, ty))
});
2017-09-11 02:07:17 -07:00
2017-09-17 06:04:24 -07:00
parse_method!(binding_declaration(&mut self) -> ParseResult<Declaration> {
let constant = match self.next() {
Keyword(Var) => false,
Keyword(Const) => true,
_ => return ParseError::new("Expected 'var' or 'const'"),
};
let name = self.identifier()?;
expect!(self, Operator(ref o) if **o == "=");
2017-09-17 06:04:24 -07:00
let expr = self.expression()?;
Ok(Declaration::Binding { name, constant, expr })
});
2018-04-24 16:30:17 -07:00
parse_method!(interface_declaration(&mut self) -> ParseResult<Declaration> {
expect!(self, Keyword(Interface));
2018-02-21 22:06:56 -08:00
let name = self.identifier()?;
let signatures = self.signature_block()?;
2018-04-24 16:30:17 -07:00
Ok(Declaration::Interface { name, signatures })
2018-02-21 22:06:56 -08:00
});
parse_method!(signature_block(&mut self) -> ParseResult<Vec<Signature>> {
2018-05-13 02:50:43 -07:00
Ok(delimited!(self, LCurlyBrace, signature, Newline | Semicolon, RCurlyBrace, nonstrict))
2017-10-03 03:49:07 -07:00
});
parse_method!(impl_declaration(&mut self) -> ParseResult<Declaration> {
expect!(self, Keyword(Impl));
2017-10-08 19:30:52 -07:00
let first = self.type_name()?;
2017-10-03 03:49:07 -07:00
let second = if let Keyword(For) = self.peek() {
self.next();
2017-10-08 19:30:52 -07:00
Some(self.type_name()?)
2017-10-03 03:49:07 -07:00
} else {
None
};
2017-10-08 14:24:02 -07:00
let block = self.decl_block()?;
let result = match (first, second) {
2017-10-08 19:30:52 -07:00
(first, Some(second)) => {
match first {
2018-02-12 00:25:48 -08:00
TypeName::Singleton(TypeSingletonName { ref name, ref params }) if params.len() == 0 =>
2018-04-24 16:30:17 -07:00
Declaration::Impl { type_name: second, interface_name: Some(name.clone()), block },
_ => return ParseError::new(&format!("Invalid name for an interface")),
2017-10-08 19:30:52 -07:00
}
},
2018-04-24 16:30:17 -07:00
(first, None) => Declaration::Impl { type_name: first, interface_name: None, block }
2017-10-08 14:24:02 -07:00
};
Ok(result)
});
parse_method!(decl_block(&mut self) -> ParseResult<Vec<Declaration>> {
2018-05-13 02:50:43 -07:00
Ok(delimited!(self, LCurlyBrace, func_declaration, Newline | Semicolon, RCurlyBrace, nonstrict))
2017-10-03 03:49:07 -07:00
});
parse_method!(expression(&mut self) -> ParseResult<Expression> {
let mut expr_body = self.precedence_expr(BinOp::min_precedence())?;
let type_anno = match self.peek() {
2017-09-28 23:55:10 -07:00
Colon => Some(self.type_anno()?),
_ => None
};
2017-10-01 00:50:13 -07:00
if let Some(_) = expr_body.1 {
2017-09-30 23:30:02 -07:00
return ParseError::new("Bad parse state");
2017-09-27 22:27:50 -07:00
}
expr_body.1 = type_anno;
Ok(expr_body)
});
2017-10-08 19:30:52 -07:00
parse_method!(type_anno(&mut self) -> ParseResult<TypeName> {
expect!(self, Colon);
self.type_name()
});
2017-10-08 19:30:52 -07:00
parse_method!(type_name(&mut self) -> ParseResult<TypeName> {
use self::TypeName::*;
2017-09-28 23:55:10 -07:00
Ok(match self.peek() {
2018-05-13 02:50:43 -07:00
LParen => Tuple(delimited!(self, LParen, type_name, Comma, RParen)),
2018-02-12 00:51:53 -08:00
_ => Singleton(self.type_singleton_name()?),
})
});
parse_method!(type_singleton_name(&mut self) -> ParseResult<TypeSingletonName> {
Ok(TypeSingletonName {
name: self.identifier()?,
params: match self.peek() {
2018-05-13 02:50:43 -07:00
LAngleBracket => delimited!(self, LAngleBracket, type_name, Comma, RAngleBracket),
2018-02-12 00:51:53 -08:00
_ => vec![],
}
2017-09-28 23:55:10 -07:00
})
});
// this implements Pratt parsing, see http://journal.stuffwithstuff.com/2011/03/19/pratt-parsers-expression-parsing-made-easy/
fn precedence_expr(&mut self, precedence: i32) -> ParseResult<Expression> {
2017-09-17 05:06:58 -07:00
let record = ParseRecord {
production_name: "precedence_expr".to_string(),
2018-03-02 22:11:25 -08:00
next_token: format!("{}", self.peek_with_token_offset().to_string_with_metadata()),
2018-02-10 15:10:06 -08:00
level: self.parse_level,
2017-09-17 05:06:58 -07:00
};
2018-02-10 17:45:00 -08:00
self.parse_level += 1;
2017-09-17 05:06:58 -07:00
self.parse_record.push(record);
2017-09-17 17:44:06 -07:00
let mut lhs = self.prefix_expr()?;
loop {
2017-09-17 05:12:20 -07:00
let new_precedence = match self.peek() {
Operator(op) => BinOp::get_precedence(&*op),
Period => BinOp::get_precedence("."),
2018-02-26 02:27:36 -08:00
Pipe => BinOp::get_precedence("|"),
2018-03-17 19:12:58 -07:00
Slash => BinOp::get_precedence("/"),
_ => break,
};
2017-09-17 05:12:20 -07:00
if precedence >= new_precedence {
break;
}
let sigil = match self.next() {
Operator(op) => op,
2017-09-17 04:26:44 -07:00
Period => Rc::new(".".to_string()),
2018-02-26 02:27:36 -08:00
Pipe => Rc::new("|".to_string()),
2018-05-11 01:39:31 -07:00
Slash => Rc::new("/".to_string()),
_ => unreachable!(),
};
let rhs = self.precedence_expr(new_precedence)?;
let operation = BinOp::from_sigil(sigil.as_ref());
lhs = Expression(ExpressionType::BinExp(operation, bx!(lhs), bx!(rhs)), None);
}
2018-02-10 17:45:00 -08:00
self.parse_level -= 1;
2017-09-12 02:30:27 -07:00
Ok(lhs)
2017-09-11 02:07:17 -07:00
}
2017-09-17 17:44:06 -07:00
parse_method!(prefix_expr(&mut self) -> ParseResult<Expression> {
match self.peek() {
Operator(ref op) if PrefixOp::is_prefix(&*op) => {
let sigil = match self.next() {
2017-09-17 17:44:06 -07:00
Operator(op) => op,
_ => unreachable!(),
};
let expr = self.primary()?;
2017-09-27 22:27:50 -07:00
Ok(Expression(
ExpressionType::PrefixExp(PrefixOp::from_sigil(sigil.as_str()), bx!(expr)),
2017-09-27 22:27:50 -07:00
None))
2017-09-17 17:44:06 -07:00
},
_ => self.call_expr()
2017-09-17 17:44:06 -07:00
}
});
parse_method!(call_expr(&mut self) -> ParseResult<Expression> {
2018-03-06 02:51:45 -08:00
let index = self.index_expr()?;
Ok(if let LParen = self.peek() {
2018-05-13 02:50:43 -07:00
let arguments = delimited!(self, LParen, expression, Comma, RParen);
2018-03-06 02:51:45 -08:00
Expression(ExpressionType::Call { f: bx!(index), arguments }, None) //TODO fix this none
} else {
index
})
});
parse_method!(index_expr(&mut self) -> ParseResult<Expression> {
let primary = self.primary()?;
Ok(if let LSquareBracket = self.peek() {
2018-05-13 02:50:43 -07:00
let indexers = delimited!(self, LSquareBracket, expression, Comma, RSquareBracket);
2018-03-06 02:51:45 -08:00
Expression(ExpressionType::Index {
indexee: bx!(Expression(primary.0, None)),
indexers,
}, None)
} else {
primary
})
});
parse_method!(primary(&mut self) -> ParseResult<Expression> {
2017-09-13 03:46:16 -07:00
match self.peek() {
2018-03-04 02:11:22 -08:00
LCurlyBrace => self.curly_brace_expr(),
2017-09-13 03:46:16 -07:00
LParen => self.paren_expr(),
2018-03-08 12:01:24 -08:00
LSquareBracket => self.list_expr(),
2017-09-18 23:22:28 -07:00
Keyword(Kw::If) => self.if_expr(),
2017-09-20 20:30:30 -07:00
Keyword(Kw::Match) => self.match_expr(),
2017-10-08 22:02:58 -07:00
Keyword(Kw::For) => self.for_expr(),
Keyword(Kw::While) => self.while_expr(),
Identifier(_) => self.identifier_expr(),
2017-09-13 03:46:16 -07:00
_ => self.literal(),
}
});
2017-09-13 03:46:16 -07:00
2018-03-08 12:01:24 -08:00
parse_method!(list_expr(&mut self) -> ParseResult<Expression> {
2018-05-13 02:50:43 -07:00
let exprs = delimited!(self, LSquareBracket, expression, Comma, RSquareBracket);
2018-03-08 12:01:24 -08:00
Ok(Expression(ExpressionType::ListLiteral(exprs), None))
});
2018-03-04 02:11:22 -08:00
parse_method!(curly_brace_expr(&mut self) -> ParseResult<Expression> {
self.lambda_expr()
});
parse_method!(lambda_expr(&mut self) -> ParseResult<Expression> {
expect!(self, LCurlyBrace);
2018-05-13 02:50:43 -07:00
let params = delimited!(self, Pipe, formal_param, Comma, Pipe);
2018-03-04 02:11:22 -08:00
let mut body = Vec::new();
loop {
match self.peek() {
EOF | RCurlyBrace => break,
Newline | Semicolon => {
self.next();
continue;
},
_ => body.push(self.statement()?),
}
}
expect!(self, RCurlyBrace);
2018-03-04 02:11:22 -08:00
Ok(Expression(ExpressionType::Lambda { params, body }, None)) //TODO need to handle types somehow
});
parse_method!(paren_expr(&mut self) -> ParseResult<Expression> {
2017-10-06 20:28:07 -07:00
use self::ExpressionType::*;
let old_struct_value = self.restrictions.no_struct_literal;
self.restrictions.no_struct_literal = false;
2018-05-13 01:43:29 -07:00
let output = {
2018-05-13 02:50:43 -07:00
let mut inner = delimited!(self, LParen, expression, Comma, RParen);
match inner.len() {
0 => Ok(Expression(TupleLiteral(vec![]), None)),
1 => Ok(inner.pop().unwrap()),
_ => Ok(Expression(TupleLiteral(inner), None)),
}
2018-05-13 01:43:29 -07:00
};
self.restrictions.no_struct_literal = old_struct_value;
output
});
2017-09-11 15:42:49 -07:00
2017-09-18 23:22:28 -07:00
parse_method!(identifier_expr(&mut self) -> ParseResult<Expression> {
2017-09-27 22:27:50 -07:00
use self::ExpressionType::*;
let identifier = self.identifier()?;
2017-10-08 22:52:05 -07:00
Ok(match self.peek() {
LCurlyBrace if !self.restrictions.no_struct_literal => {
2017-10-14 13:54:17 -07:00
let fields = self.record_block()?;
Expression(NamedStruct { name: identifier, fields }, None)
},
_ => Expression(Value(identifier), None)
2017-10-08 22:52:05 -07:00
})
2017-09-18 23:22:28 -07:00
});
2017-10-14 13:54:17 -07:00
parse_method!(record_block(&mut self) -> ParseResult<Vec<(Rc<String>, Expression)>> {
2018-05-13 02:50:43 -07:00
Ok(delimited!(self, LCurlyBrace, record_entry, Comma, RCurlyBrace))
2017-10-14 13:54:17 -07:00
});
parse_method!(record_entry(&mut self) -> ParseResult<(Rc<String>, Expression)> {
let field_name = self.identifier()?;
expect!(self, Colon);
2017-10-14 13:54:17 -07:00
let value = self.expression()?;
Ok((field_name, value))
});
2017-09-18 23:22:28 -07:00
parse_method!(if_expr(&mut self) -> ParseResult<Expression> {
expect!(self, Keyword(Kw::If));
2018-05-12 20:51:30 -07:00
let condition = {
self.restrictions.no_struct_literal = true;
let x = self.expression();
self.restrictions.no_struct_literal = false;
2018-05-12 20:51:30 -07:00
x?
};
2017-09-18 23:22:28 -07:00
let then_clause = self.block()?;
let else_clause = self.else_clause()?;
Ok(Expression(ExpressionType::IfExpression(bx!(condition), then_clause, else_clause), None))
2017-09-18 23:22:28 -07:00
});
2018-05-06 23:09:03 -07:00
parse_method!(else_clause(&mut self) -> ParseResult<Option<Block>> {
2017-09-18 23:22:28 -07:00
Ok(if let Keyword(Kw::Else) = self.peek() {
self.next();
Some(self.block()?)
} else {
None
})
});
2018-05-06 23:09:03 -07:00
parse_method!(block(&mut self) -> ParseResult<Block> {
2018-05-13 02:50:43 -07:00
Ok(delimited!(self, LCurlyBrace, statement, Newline | Semicolon, RCurlyBrace, nonstrict))
2017-09-18 23:22:28 -07:00
});
2017-09-20 20:30:30 -07:00
parse_method!(match_expr(&mut self) -> ParseResult<Expression> {
expect!(self, Keyword(Kw::Match));
2017-09-20 20:30:30 -07:00
let expr = self.expression()?;
2017-09-30 14:11:38 -07:00
//TODO abstract these errors into the delimited macro
//expect!(self, LCurlyBrace, "Expected '{'");
2017-09-20 20:30:30 -07:00
let body = self.match_body()?;
2017-09-30 14:11:38 -07:00
//expect!(self, RCurlyBrace, "Expected '}'");
Ok(Expression(ExpressionType::MatchExpression(bx!(expr), body), None))
2017-09-20 21:05:08 -07:00
});
parse_method!(match_body(&mut self) -> ParseResult<Vec<MatchArm>> {
2018-05-13 02:50:43 -07:00
Ok(delimited!(self, LCurlyBrace, match_arm, Comma, RCurlyBrace))
2017-09-30 14:11:38 -07:00
});
parse_method!(match_arm(&mut self) -> ParseResult<MatchArm> {
let pat = self.pattern()?;
expect!(self, Operator(ref c) if **c == "=>");
2017-09-30 14:11:38 -07:00
let expr = self.expression()?;
Ok(MatchArm { pat, expr })
2017-09-21 16:00:14 -07:00
});
parse_method!(pattern(&mut self) -> ParseResult<Pattern> {
let identifier = self.identifier()?;
Ok(Pattern(identifier))
2017-09-20 20:30:30 -07:00
});
parse_method!(while_expr(&mut self) -> ParseResult<Expression> {
use self::ExpressionType::*;
expect!(self, Keyword(Kw::While));
let condition = {
self.restrictions.no_struct_literal = true;
let x = self.while_cond();
self.restrictions.no_struct_literal = false;
x?.map(|expr| bx!(expr))
};
let body = self.block()?;
Ok(Expression(WhileExpression {condition, body}, None))
});
parse_method!(while_cond(&mut self) -> ParseResult<Option<Expression>> {
Ok(match self.peek() {
LCurlyBrace => None,
_ => Some(self.expression()?),
})
});
2017-10-08 22:02:58 -07:00
parse_method!(for_expr(&mut self) -> ParseResult<Expression> {
expect!(self, Keyword(Kw::For));
2018-05-13 01:40:14 -07:00
let enumerators = if let LCurlyBrace = self.peek() {
2018-05-13 02:50:43 -07:00
delimited!(self, LCurlyBrace, enumerator, Comma | Newline, RCurlyBrace)
2018-05-13 01:40:14 -07:00
} else {
let single_enum = {
self.restrictions.no_struct_literal = true;
let s = self.enumerator();
self.restrictions.no_struct_literal = false;
s?
};
vec![single_enum]
};
let body = Box::new(self.for_expr_body()?);
Ok(Expression(ExpressionType::ForExpression { enumerators, body }, None))
});
parse_method!(enumerator(&mut self) -> ParseResult<Enumerator> {
let id = self.identifier()?;
expect!(self, Operator(ref c) if **c == "<-");
2018-05-13 01:40:14 -07:00
let generator = self.expression()?;
Ok(Enumerator { id, generator })
});
parse_method!(for_expr_body(&mut self) -> ParseResult<ForBody> {
use self::ForBody::*;
Ok(match self.peek() {
LCurlyBrace => {
2018-05-13 02:50:43 -07:00
let statements = delimited!(self, LCurlyBrace, statement, Newline | Semicolon, RCurlyBrace, nonstrict);
2018-05-13 01:40:14 -07:00
StatementBlock(statements)
},
Keyword(Kw::Return) => {
self.next();
MonadicReturn(self.expression()?)
},
_ => return ParseError::new("for expressions must end in a block or 'return'"),
})
2017-10-08 22:02:58 -07:00
});
parse_method!(identifier(&mut self) -> ParseResult<Rc<String>> {
2017-09-11 15:42:49 -07:00
match self.next() {
Identifier(s) => Ok(s),
p => ParseError::new(&format!("Expected an identifier, got {:?}", p)),
}
});
2017-09-11 02:07:17 -07:00
parse_method!(literal(&mut self) -> ParseResult<Expression> {
2017-09-27 22:27:50 -07:00
use self::ExpressionType::*;
2017-09-11 02:07:17 -07:00
match self.peek() {
2018-01-08 06:12:45 -08:00
DigitGroup(_) | HexLiteral(_) | BinNumberSigil | Period => self.number_literal(),
2017-09-27 22:27:50 -07:00
Keyword(Kw::True) => {
self.next();
Ok(Expression(BoolLiteral(true), None))
},
Keyword(Kw::False) => {
self.next();
Ok(Expression(BoolLiteral(false), None))
},
2017-09-16 15:57:48 -07:00
StrLiteral(s) => {
self.next();
2017-09-27 22:27:50 -07:00
Ok(Expression(StringLiteral(s), None))
2017-09-16 15:57:48 -07:00
}
e => ParseError::new(&format!("Expected a literal expression, got {:?}", e)),
2017-09-11 02:07:17 -07:00
}
});
parse_method!(number_literal(&mut self) -> ParseResult<Expression> {
2017-09-11 02:07:17 -07:00
match self.peek() {
2018-01-08 06:12:45 -08:00
HexLiteral(_) | BinNumberSigil => self.int_literal(),
2017-09-11 02:07:17 -07:00
_ => self.float_literal(),
}
});
2017-09-11 02:07:17 -07:00
parse_method!(int_literal(&mut self) -> ParseResult<Expression> {
2017-09-27 22:27:50 -07:00
use self::ExpressionType::*;
2017-09-11 02:07:17 -07:00
match self.next() {
BinNumberSigil => {
2017-09-11 23:27:15 -07:00
let digits = self.digits()?;
let n = parse_binary(digits)?;
2018-05-12 01:44:03 -07:00
Ok(Expression(NatLiteral(n), None))
2017-09-11 02:07:17 -07:00
},
2018-01-08 06:12:45 -08:00
HexLiteral(text) => {
2018-02-11 16:35:38 -08:00
let digits: String = text.chars().filter(|c| c.is_digit(16)).collect();
let n = parse_hex(digits)?;
2018-05-12 01:44:03 -07:00
Ok(Expression(NatLiteral(n), None))
2017-09-11 02:07:17 -07:00
},
_ => return ParseError::new("Expected '0x' or '0b'"),
}
});
2017-09-11 02:07:17 -07:00
parse_method!(float_literal(&mut self) -> ParseResult<Expression> {
2017-09-27 22:27:50 -07:00
use self::ExpressionType::*;
2017-09-11 02:38:27 -07:00
let mut digits = self.digits()?;
if let TokenType::Period = self.peek() {
self.next();
digits.push_str(".");
digits.push_str(&self.digits()?);
match digits.parse::<f64>() {
2017-09-27 22:27:50 -07:00
Ok(f) => Ok(Expression(FloatLiteral(f), None)),
2017-09-16 17:44:06 -07:00
Err(e) => ParseError::new(&format!("Float failed to parse with error: {}", e)),
2017-09-11 02:38:27 -07:00
}
} else {
match digits.parse::<u64>() {
2018-05-12 01:44:03 -07:00
Ok(d) => Ok(Expression(NatLiteral(d), None)),
2017-09-16 17:44:06 -07:00
Err(e) => ParseError::new(&format!("Integer failed to parse with error: {}", e)),
2017-09-11 02:38:27 -07:00
}
2017-09-11 02:07:17 -07:00
}
});
2017-09-11 02:07:17 -07:00
parse_method!(digits(&mut self) -> ParseResult<String> {
2017-09-11 02:07:17 -07:00
let mut ds = String::new();
loop {
2017-09-11 02:38:27 -07:00
match self.peek() {
Underscore => { self.next(); continue; },
DigitGroup(ref s) => { self.next(); ds.push_str(s)},
2017-09-11 02:07:48 -07:00
_ => break,
2017-09-11 02:07:17 -07:00
}
}
Ok(ds)
});
2017-09-11 02:07:17 -07:00
}
2017-09-09 00:31:15 -07:00
2017-09-11 23:27:15 -07:00
fn parse_binary(digits: String) -> ParseResult<u64> {
let mut result: u64 = 0;
let mut multiplier = 1;
for d in digits.chars().rev() {
match d {
'1' => result += multiplier,
'0' => (),
_ => return ParseError::new("Encountered a character not '1' or '0 while parsing a binary literal"),
}
multiplier = match multiplier.checked_mul(2) {
Some(m) => m,
None => return ParseError::new("This binary expression will overflow")
}
2017-09-11 23:27:15 -07:00
}
Ok(result)
}
2018-01-08 05:57:36 -08:00
fn parse_hex(digits: String) -> ParseResult<u64> {
let mut result: u64 = 0;
let mut multiplier: u64 = 1;
for d in digits.chars().rev() {
match d.to_digit(16) {
Some(n) => result += n as u64 * multiplier,
None => return ParseError::new("Encountered a non-hex digit in a hex literal"),
}
multiplier = match multiplier.checked_mul(16) {
Some(m) => m,
None => return ParseError::new("This hex expression will overflow")
}
2018-01-08 05:57:36 -08:00
}
Ok(result)
}
2017-09-16 14:29:22 -07:00
pub fn parse(input: Vec<Token>) -> (Result<AST, ParseError>, Vec<String>) {
2017-09-09 00:31:15 -07:00
let mut parser = Parser::new(input);
let ast = parser.program();
2017-09-17 05:06:58 -07:00
let trace = parser.parse_record.into_iter().map(|r| {
2018-02-10 15:10:06 -08:00
let mut indent = String::new();
2018-02-22 03:26:32 -08:00
for _ in 0..r.level {
2018-02-10 15:10:06 -08:00
indent.push(' ');
}
2018-03-02 22:11:25 -08:00
format!("{}Production `{}`, token: {}", indent, r.production_name, r.next_token)
2017-09-17 05:06:58 -07:00
}).collect();
(ast, trace)
2017-08-29 05:08:09 -07:00
}
2017-09-11 03:21:07 -07:00
#[cfg(test)]
mod parse_tests {
2017-09-28 00:06:08 -07:00
use ::std::rc::Rc;
2018-05-13 01:40:14 -07:00
use super::{AST, Expression, Statement, PrefixOp, BinOp, TypeBody, Variant, Enumerator, ForBody, parse, tokenize};
2017-09-11 03:21:07 -07:00
use super::Statement::*;
2017-09-13 22:40:05 -07:00
use super::Declaration::*;
use super::Signature;
2017-10-08 19:30:52 -07:00
use super::TypeName::*;
2018-02-12 00:51:53 -08:00
use super::TypeSingletonName;
2017-09-28 00:06:08 -07:00
use super::ExpressionType::*;
use super::Variant::*;
2018-05-13 01:40:14 -07:00
use super::ForBody::*;
2017-09-12 00:48:37 -07:00
2017-09-13 22:40:05 -07:00
macro_rules! rc {
2017-09-13 22:47:25 -07:00
($string:tt) => { Rc::new(stringify!($string).to_string()) }
2017-09-13 22:40:05 -07:00
}
2017-09-12 00:48:37 -07:00
macro_rules! parse_test {
2017-09-16 15:57:48 -07:00
($string:expr, $correct:expr) => { assert_eq!(parse(tokenize($string)).0.unwrap(), $correct) }
2017-09-12 00:48:37 -07:00
}
macro_rules! parse_error {
($string:expr) => { assert!(parse(tokenize($string)).0.is_err()) }
}
2017-10-10 21:02:32 -07:00
macro_rules! val {
($var:expr) => { Value(Rc::new($var.to_string())) }
2017-09-13 20:49:17 -07:00
}
2017-09-28 00:06:08 -07:00
macro_rules! exprstatement {
2017-09-29 19:10:37 -07:00
($expr_type:expr) => { Statement::ExpressionStatement(Expression($expr_type, None)) };
($expr_type:expr, $type_anno:expr) => { Statement::ExpressionStatement(Expression($expr_type, Some($type_anno))) };
2017-09-28 00:06:08 -07:00
}
2017-09-29 19:10:37 -07:00
macro_rules! ty {
2018-02-12 00:51:53 -08:00
($name:expr) => { Singleton(tys!($name)) }
}
macro_rules! tys {
($name:expr) => { TypeSingletonName { name: Rc::new($name.to_string()), params: vec![] } };
2017-09-29 19:10:37 -07:00
}
2017-09-12 00:48:37 -07:00
2018-03-06 01:06:36 -08:00
/* new style of test macros */
macro_rules! single_expr {
($exprtype:expr) => { AST(vec![Statement::ExpressionStatement(Expression($exprtype, None))]) };
($exprtype:expr, $type:expr) => { AST(vec![Statement::ExpressionStatement(Expression($exprtype, $type))]) }
}
2018-03-06 01:31:31 -08:00
macro_rules! ex {
($expr_type:expr) => { Expression($expr_type, None) }
}
2018-03-06 01:06:36 -08:00
macro_rules! binexp {
($op:expr, $lhs:expr, $rhs:expr) => { BinExp(BinOp::from_sigil($op), bx!(Expression($lhs, None)), bx!(Expression($rhs, None))) }
}
macro_rules! prefexp {
($op:expr, $lhs:expr) => { PrefixExp(PrefixOp::from_sigil($op), bx!(Expression($lhs, None))) }
}
2018-03-06 01:31:31 -08:00
macro_rules! exst {
($expr_type:expr) => { Statement::ExpressionStatement(Expression($expr_type, None)) };
($expr_type:expr, $type_anno:expr) => { Statement::ExpressionStatement(Expression($expr_type, Some($type_anno))) };
($op:expr, $lhs:expr, $rhs:expr) => { Statement::ExpressionStatement(ex!(binexp!($op, $lhs, $rhs))) };
}
2018-03-06 01:06:36 -08:00
2017-09-11 03:21:07 -07:00
#[test]
2017-09-13 03:46:16 -07:00
fn parsing_number_literals_and_binexps() {
2018-03-06 01:06:36 -08:00
parse_test! { ".2", single_expr!(FloatLiteral(0.2)) };
parse_test! { "8.1", single_expr!(FloatLiteral(8.1)) };
2018-02-11 16:35:38 -08:00
2018-05-12 01:44:03 -07:00
parse_test! { "0b010", single_expr!(NatLiteral(2)) };
parse_test! { "0b0_1_0_", single_expr!(NatLiteral(2)) }
2018-02-11 16:35:38 -08:00
2018-05-12 01:44:03 -07:00
parse_test! {"0xff", single_expr!(NatLiteral(255)) };
parse_test! {"0xf_f_", single_expr!(NatLiteral(255)) };
2018-02-11 16:35:38 -08:00
2018-05-12 01:44:03 -07:00
parse_test!("0xf_f_+1", AST(vec![exprstatement!(binexp!("+", NatLiteral(255), NatLiteral(1)))]));
2018-02-11 16:35:38 -08:00
2018-03-06 01:06:36 -08:00
parse_test! {"3; 4; 4.3", AST(
2018-05-12 01:44:03 -07:00
vec![exprstatement!(NatLiteral(3)), exprstatement!(NatLiteral(4)),
2018-03-06 01:06:36 -08:00
exprstatement!(FloatLiteral(4.3))])
};
parse_test!("1 + 2 * 3", AST(vec!
[
2018-05-12 01:44:03 -07:00
exprstatement!(binexp!("+", NatLiteral(1), binexp!("*", NatLiteral(2), NatLiteral(3))))
]));
parse_test!("1 * 2 + 3", AST(vec!
[
2018-05-12 01:44:03 -07:00
exprstatement!(binexp!("+", binexp!("*", NatLiteral(1), NatLiteral(2)), NatLiteral(3)))
]));
2017-09-12 15:52:23 -07:00
2018-05-12 01:44:03 -07:00
parse_test!("1 && 2", AST(vec![exprstatement!(binexp!("&&", NatLiteral(1), NatLiteral(2)))]));
2017-09-12 15:52:23 -07:00
2017-09-28 00:06:08 -07:00
parse_test!("1 + 2 * 3 + 4", AST(vec![exprstatement!(
2017-09-28 00:45:36 -07:00
binexp!("+",
2018-05-12 01:44:03 -07:00
binexp!("+", NatLiteral(1), binexp!("*", NatLiteral(2), NatLiteral(3))),
NatLiteral(4)))]));
2017-09-12 15:52:23 -07:00
2017-09-13 03:46:16 -07:00
parse_test!("(1 + 2) * 3", AST(vec!
2018-05-12 01:44:03 -07:00
[exprstatement!(binexp!("*", binexp!("+", NatLiteral(1), NatLiteral(2)), NatLiteral(3)))]));
2017-09-17 04:26:44 -07:00
2017-09-28 00:06:08 -07:00
parse_test!(".1 + .2", AST(vec![exprstatement!(binexp!("+", FloatLiteral(0.1), FloatLiteral(0.2)))]));
2018-05-12 01:44:03 -07:00
parse_test!("1 / 2", AST(vec![exprstatement!(binexp!("/", NatLiteral(1), NatLiteral(2)))]));
2017-09-11 03:21:07 -07:00
}
2017-09-13 03:46:16 -07:00
2017-10-06 20:28:07 -07:00
#[test]
fn parsing_tuples() {
parse_test!("()", AST(vec![exprstatement!(TupleLiteral(vec![]))]));
parse_test!("(\"hella\", 34)", AST(vec![exprstatement!(
TupleLiteral(
2018-05-12 01:44:03 -07:00
vec![ex!(StringLiteral(rc!(hella))), ex!(NatLiteral(34))]
2017-10-06 20:28:07 -07:00
)
)]));
parse_test!("((1+2), \"slough\")", AST(vec![exprstatement!(TupleLiteral(vec![
2018-05-12 01:44:03 -07:00
ex!(binexp!("+", NatLiteral(1), NatLiteral(2))),
2017-10-06 20:28:07 -07:00
ex!(StringLiteral(rc!(slough))),
]))]))
}
2017-09-13 20:49:17 -07:00
#[test]
fn parsing_identifiers() {
2017-10-10 21:02:32 -07:00
parse_test!("a", AST(vec![exprstatement!(val!("a"))]));
parse_test!("a + b", AST(vec![exprstatement!(binexp!("+", val!("a"), val!("b")))]));
//parse_test!("a[b]", AST(vec![Expression(
//parse_test!("a[]", <- TODO THIS NEEDS TO FAIL
//parse_test!(damn()[a] ,<- TODO needs to succeed
parse_test!("a[b,c]", AST(vec![exprstatement!(Index { indexee: bx!(ex!(val!("a"))), indexers: vec![ex!(val!("b")), ex!(val!("c"))]} )]));
parse_test!("None", AST(vec![exprstatement!(val!("None"))]));
2017-10-14 13:54:17 -07:00
parse_test!("Pandas { a: x + y }", AST(vec![
exprstatement!(NamedStruct { name: rc!(Pandas), fields: vec![(rc!(a), ex!(binexp!("+", val!("x"), val!("y"))))]})
]));
2017-09-13 20:49:17 -07:00
}
2017-09-13 22:40:05 -07:00
2017-09-17 02:38:11 -07:00
#[test]
2017-09-17 06:04:24 -07:00
fn parsing_complicated_operators() {
2017-10-10 21:02:32 -07:00
parse_test!("a <- b", AST(vec![exprstatement!(binexp!("<-", val!("a"), val!("b")))]));
parse_test!("a || b", AST(vec![exprstatement!(binexp!("||", val!("a"), val!("b")))]));
parse_test!("a<>b", AST(vec![exprstatement!(binexp!("<>", val!("a"), val!("b")))]));
2017-09-28 00:06:08 -07:00
parse_test!("a.b.c.d", AST(vec![exprstatement!(binexp!(".",
binexp!(".",
2017-10-10 21:02:32 -07:00
binexp!(".", val!("a"), val!("b")),
val!("c")),
val!("d")))]));
2018-05-12 01:44:03 -07:00
parse_test!("-3", AST(vec![exprstatement!(prefexp!("-", NatLiteral(3)))]));
2017-09-28 00:06:08 -07:00
parse_test!("-0.2", AST(vec![exprstatement!(prefexp!("-", FloatLiteral(0.2)))]));
2018-05-12 01:44:03 -07:00
parse_test!("!3", AST(vec![exprstatement!(prefexp!("!", NatLiteral(3)))]));
2017-10-10 21:02:32 -07:00
parse_test!("a <- -b", AST(vec![exprstatement!(binexp!("<-", val!("a"), prefexp!("-", val!("b"))))]));
parse_test!("a <--b", AST(vec![exprstatement!(binexp!("<--", val!("a"), val!("b")))]));
2017-09-17 02:38:11 -07:00
}
2017-09-13 23:37:49 -07:00
#[test]
fn parsing_functions() {
parse_test!("fn oi()", AST(vec![Declaration(FuncSig(Signature { name: rc!(oi), params: vec![], type_anno: None }))]));
parse_test!("oi()", AST(vec![exprstatement!(Call { f: bx!(ex!(val!("oi"))), arguments: vec![] })]));
2017-09-28 00:06:08 -07:00
parse_test!("oi(a, 2 + 2)", AST(vec![exprstatement!(Call
{ f: bx!(ex!(val!("oi"))),
2018-05-12 01:44:03 -07:00
arguments: vec![ex!(val!("a")), ex!(binexp!("+", NatLiteral(2), NatLiteral(2)))]
2017-09-15 03:49:47 -07:00
})]));
parse_error!("a(b,,c)");
2017-10-08 20:55:05 -07:00
2017-10-08 21:25:51 -07:00
parse_test!("fn a(b, c: Int): Int", AST(vec![Declaration(
FuncSig(Signature { name: rc!(a), params: vec![
2017-10-08 20:55:05 -07:00
(rc!(b), None), (rc!(c), Some(ty!("Int")))
2017-10-08 21:25:51 -07:00
], type_anno: Some(ty!("Int")) }))]));
parse_test!("fn a(x) { x() }", AST(vec![Declaration(
FuncDecl(Signature { name: rc!(a), params: vec![(rc!(x),None)], type_anno: None },
vec![exprstatement!(Call { f: bx!(ex!(val!("x"))), arguments: vec![] })]))]));
parse_test!("fn a(x) {\n x() }", AST(vec![Declaration(
FuncDecl(Signature { name: rc!(a), params: vec![(rc!(x),None)], type_anno: None },
vec![exprstatement!(Call { f: bx!(ex!(val!("x"))), arguments: vec![] })]))]));
let multiline = r#"
fn a(x) {
x()
}
"#;
parse_test!(multiline, AST(vec![Declaration(
FuncDecl(Signature { name: rc!(a), params: vec![(rc!(x),None)], type_anno: None },
vec![exprstatement!(Call { f: bx!(ex!(val!("x"))), arguments: vec![] })]))]));
let multiline2 = r#"
fn a(x) {
x()
}
"#;
parse_test!(multiline2, AST(vec![Declaration(
FuncDecl(Signature { name: rc!(a), params: vec![(rc!(x),None)], type_anno: None },
vec![exprstatement!(Call { f: bx!(ex!(val!("x"))), arguments: vec![] })]))]));
2017-09-13 23:37:49 -07:00
}
2017-09-17 04:31:27 -07:00
#[test]
2017-09-17 06:04:24 -07:00
fn parsing_bools() {
2017-09-28 00:06:08 -07:00
parse_test!("false", AST(vec![exprstatement!(BoolLiteral(false))]));
parse_test!("true", AST(vec![exprstatement!(BoolLiteral(true))]));
2017-09-17 04:31:27 -07:00
}
2017-09-16 15:57:48 -07:00
#[test]
fn parsing_strings() {
2017-09-28 00:06:08 -07:00
parse_test!(r#""hello""#, AST(vec![exprstatement!(StringLiteral(rc!(hello)))]));
2017-09-16 15:57:48 -07:00
}
2017-09-13 22:40:05 -07:00
#[test]
fn parsing_types() {
2018-02-12 00:51:53 -08:00
parse_test!("type Yolo = Yolo", AST(vec![Declaration(TypeDecl(tys!("Yolo"), TypeBody(vec![UnitStruct(rc!(Yolo))])))]));
2017-10-04 22:02:31 -07:00
parse_test!("type alias Sex = Drugs", AST(vec![Declaration(TypeAlias(rc!(Sex), rc!(Drugs)))]));
2018-02-12 01:45:36 -08:00
parse_test!("type Sanchez = Miguel | Alejandro(Int, Option<a>) | Esperanza { a: Int, b: String }",
2018-02-12 00:51:53 -08:00
AST(vec![Declaration(TypeDecl(tys!("Sanchez"), TypeBody(vec![
UnitStruct(rc!(Miguel)),
TupleStruct(rc!(Alejandro), vec![
2018-02-12 00:51:53 -08:00
Singleton(TypeSingletonName { name: rc!(Int), params: vec![] }),
Singleton(TypeSingletonName { name: rc!(Option), params: vec![Singleton(TypeSingletonName { name: rc!(a), params: vec![] })] }),
]),
2018-02-12 01:45:36 -08:00
Record(rc!(Esperanza), vec![
2018-02-12 00:51:53 -08:00
(rc!(a), Singleton(TypeSingletonName { name: rc!(Int), params: vec![] })),
(rc!(b), Singleton(TypeSingletonName { name: rc!(String), params: vec![] })),
])])))]));
2018-02-12 01:45:36 -08:00
parse_test!("type Jorge<a> = Diego | Kike(a)", AST(vec![
Declaration(TypeDecl(
TypeSingletonName { name: rc!(Jorge), params: vec![Singleton(TypeSingletonName { name: rc!(a), params: vec![] })] },
TypeBody(vec![UnitStruct(rc!(Diego)), TupleStruct(rc!(Kike), vec![Singleton(TypeSingletonName { name: rc!(a), params: vec![] })])]))
)]));
2017-09-13 22:40:05 -07:00
}
2017-09-17 06:04:24 -07:00
#[test]
fn parsing_bindings() {
2018-05-12 01:44:03 -07:00
parse_test!("var a = 10", AST(vec![Declaration(Binding { name: rc!(a), constant: false, expr: ex!(NatLiteral(10)) } )]));
parse_test!("const a = 2 + 2", AST(vec![Declaration(Binding { name: rc!(a), constant: true, expr: ex!(binexp!("+", NatLiteral(2), NatLiteral(2))) }) ]));
2017-09-17 06:04:24 -07:00
}
2017-09-18 23:22:28 -07:00
#[test]
fn parsing_block_expressions() {
2017-09-28 00:06:08 -07:00
parse_test!("if a() { b(); c() }", AST(vec![exprstatement!(
IfExpression(bx!(ex!(Call { f: bx!(ex!(val!("a"))), arguments: vec![]})),
vec![exprstatement!(Call { f: bx!(ex!(val!("b"))), arguments: vec![]}), exprstatement!(Call { f: bx!(ex!(val!("c"))), arguments: vec![] })],
2017-09-28 00:06:08 -07:00
None)
)]));
2017-09-18 23:22:28 -07:00
parse_test!(r#"
if true {
const a = 10
b
} else {
c
2017-09-28 00:06:08 -07:00
}"#,
AST(vec![exprstatement!(IfExpression(bx!(ex!(BoolLiteral(true))),
2018-05-12 01:44:03 -07:00
vec![Declaration(Binding { name: rc!(a), constant: true, expr: ex!(NatLiteral(10)) }),
exprstatement!(val!(rc!(b)))],
Some(vec![exprstatement!(val!(rc!(c)))])))])
2017-09-18 23:22:28 -07:00
);
parse_test!("if a { b } else { c }", AST(vec![exprstatement!(
IfExpression(bx!(ex!(val!("a"))),
vec![exprstatement!(val!("b"))],
Some(vec![exprstatement!(val!("c"))])))]));
parse_test!("if (A {a: 1}) { b } else { c }", AST(vec![exprstatement!(
2018-05-12 01:44:03 -07:00
IfExpression(bx!(ex!(NamedStruct { name: rc!(A), fields: vec![(rc!(a), ex!(NatLiteral(1)))]})),
vec![exprstatement!(val!("b"))],
Some(vec![exprstatement!(val!("c"))])))]));
parse_error!("if A {a: 1} { b } else { c }");
2017-09-18 23:22:28 -07:00
}
2018-02-21 22:06:56 -08:00
#[test]
2018-04-24 16:30:17 -07:00
fn parsing_interfaces() {
parse_test!("interface Unglueable { fn unglue(a: Glue); fn mar(): Glue }", AST(vec![
Declaration(Interface {
2018-02-22 03:26:32 -08:00
name: rc!(Unglueable),
2018-02-21 22:06:56 -08:00
signatures: vec![
Signature { name: rc!(unglue), params: vec![(rc!(a), Some(Singleton(TypeSingletonName { name: rc!(Glue), params: vec![] })))], type_anno: None },
Signature { name: rc!(mar), params: vec![], type_anno: Some(Singleton(TypeSingletonName { name: rc!(Glue), params: vec![] })) },
]
})
]));
}
2017-09-28 00:45:36 -07:00
2017-10-08 14:24:02 -07:00
#[test]
fn parsing_impls() {
parse_test!("impl Heh { fn yolo(); fn swagg(); }", AST(vec![
Declaration(Impl {
2017-10-08 19:39:41 -07:00
type_name: ty!("Heh"),
2018-04-24 16:30:17 -07:00
interface_name: None,
2017-10-08 14:24:02 -07:00
block: vec![
FuncSig(Signature { name: rc!(yolo), params: vec![], type_anno: None }),
FuncSig(Signature { name: rc!(swagg), params: vec![], type_anno: None })
2017-10-08 14:24:02 -07:00
] })]));
parse_test!("impl Mondai for Lollerino { fn yolo(); fn swagg(); }", AST(vec![
Declaration(Impl {
2017-10-08 19:39:41 -07:00
type_name: ty!("Lollerino"),
2018-04-24 16:30:17 -07:00
interface_name: Some(rc!(Mondai)),
2017-10-08 14:24:02 -07:00
block: vec![
FuncSig(Signature { name: rc!(yolo), params: vec![], type_anno: None}),
FuncSig(Signature { name: rc!(swagg), params: vec![], type_anno: None })
2017-10-08 14:24:02 -07:00
] })]));
2017-10-08 19:39:41 -07:00
parse_test!("impl Option<WTFMate> { fn oi() }", AST(vec![
Declaration(Impl {
2018-02-12 00:51:53 -08:00
type_name: Singleton(TypeSingletonName { name: rc!(Option), params: vec![ty!("WTFMate")]}),
2018-04-24 16:30:17 -07:00
interface_name: None,
2017-10-08 19:39:41 -07:00
block: vec![
FuncSig(Signature { name: rc!(oi), params: vec![], type_anno: None }),
2017-10-08 19:39:41 -07:00
]
})]));
2017-10-08 14:24:02 -07:00
}
2017-09-28 00:45:36 -07:00
#[test]
fn parsing_type_annotations() {
parse_test!("const a = b : Int", AST(vec![
Declaration(Binding { name: rc!(a), constant: true, expr:
2017-10-10 21:02:32 -07:00
Expression(val!("b"), Some(ty!("Int"))) })]));
2017-09-28 00:45:36 -07:00
2017-09-29 19:10:37 -07:00
parse_test!("a : Int", AST(vec![
2017-10-10 21:02:32 -07:00
exprstatement!(val!("a"), ty!("Int"))
2017-09-29 19:10:37 -07:00
]));
parse_test!("a : Option<Int>", AST(vec![
2018-02-12 00:51:53 -08:00
exprstatement!(val!("a"), Singleton(TypeSingletonName { name: rc!(Option), params: vec![ty!("Int")] }))
2017-09-29 19:10:37 -07:00
]));
2017-09-28 00:45:36 -07:00
2017-09-29 19:10:37 -07:00
parse_test!("a : KoreanBBQSpecifier<Kimchi, Option<Bulgogi> >", AST(vec![
2018-02-12 00:51:53 -08:00
exprstatement!(val!("a"), Singleton(TypeSingletonName { name: rc!(KoreanBBQSpecifier), params: vec![
ty!("Kimchi"), Singleton(TypeSingletonName { name: rc!(Option), params: vec![ty!("Bulgogi")] })
] }))
2017-09-29 19:10:37 -07:00
]));
2017-09-30 01:14:49 -07:00
parse_test!("a : (Int, Yolo<a>)", AST(vec![
2017-10-10 21:02:32 -07:00
exprstatement!(val!("a"), Tuple(
2018-02-12 00:51:53 -08:00
vec![ty!("Int"), Singleton(TypeSingletonName {
2017-09-30 01:14:49 -07:00
name: rc!(Yolo), params: vec![ty!("a")]
2018-02-12 00:51:53 -08:00
})]))]));
2017-09-28 00:45:36 -07:00
}
2018-03-04 02:11:22 -08:00
#[test]
fn parsing_lambdas() {
2018-03-06 01:31:31 -08:00
parse_test! { "{|x| x + 1}", single_expr!(
2018-05-12 01:44:03 -07:00
Lambda { params: vec![(rc!(x), None)], body: vec![exst!("+", val!("x"), NatLiteral(1))] }
2018-03-06 01:31:31 -08:00
) }
2018-03-04 02:11:22 -08:00
parse_test!("{ |x: Int, y| a;b;c;}", AST(vec![
exprstatement!(Lambda {
params: vec![(rc!(x), Some(ty!("Int"))), (rc!(y), None)],
2018-03-06 01:31:31 -08:00
body: vec![exst!(val!("a")), exst!(val!("b")), exst!(val!("c"))]
2018-03-04 02:11:22 -08:00
})
]));
2018-03-06 00:56:19 -08:00
parse_test!("{|x| y}(1)", AST(vec![
exprstatement!(Call { f: bx!(ex!(
Lambda { params: vec![(rc!(x), None)], body: vec![exprstatement!(val!("y"))] })),
2018-05-12 01:44:03 -07:00
arguments: vec![ex!(NatLiteral(1))] })]));
2018-03-04 02:11:22 -08:00
}
2018-03-08 12:01:24 -08:00
#[test]
fn list_literals() {
parse_test! {
"[1,2]", AST(vec![
2018-05-12 01:44:03 -07:00
exprstatement!(ListLiteral(vec![ex!(NatLiteral(1)), ex!(NatLiteral(2))]))])
2018-03-08 12:01:24 -08:00
};
}
#[test]
2018-05-13 01:40:14 -07:00
fn while_expr() {
parse_test! {
"while { }", AST(vec![
exprstatement!(WhileExpression { condition: None, body: vec![] })])
}
2018-05-13 01:40:14 -07:00
parse_test! {
"while a == b { }", AST(vec![
exprstatement!(WhileExpression { condition: Some(bx![ex![binexp!("==", val!("a"), val!("b"))]]), body: vec![] })])
}
}
#[test]
fn for_expr() {
parse_test! {
"for { a <- maybeValue } return 1", AST(vec![
exprstatement!(ForExpression {
enumerators: vec![Enumerator { id: rc!(a), generator: ex!(val!("maybeValue")) }],
body: bx!(MonadicReturn(ex!(NatLiteral(1))))
})])
}
parse_test! {
"for n <- someRange { f(n); }", AST(vec![
exprstatement!(ForExpression { enumerators: vec![Enumerator { id: rc!(n), generator: ex!(val!("someRange"))}],
body: bx!(ForBody::StatementBlock(vec![exprstatement!(Call { f: bx![ex!(val!("f"))], arguments: vec![ex!(val!("n"))] })]))
})])
}
}
2017-09-11 03:21:07 -07:00
}