2020-11-28 19:53:51 +01:00
|
|
|
// This implements the grammar of Lox as described starting in the
|
|
|
|
// Crafting Interpreters chapter "Representing Code". Note that the
|
2020-12-06 14:21:06 +01:00
|
|
|
// upstream Java implementation works around Java being bad at value
|
2020-11-28 19:53:51 +01:00
|
|
|
// classes by writing a code generator for Java.
|
|
|
|
//
|
|
|
|
// My Rust implementation skips this step because it's unnecessary, we
|
|
|
|
// have real types.
|
2020-12-06 14:43:43 +01:00
|
|
|
use crate::errors::{Error, ErrorKind};
|
2020-11-28 19:53:51 +01:00
|
|
|
use crate::scanner::{Token, TokenKind};
|
|
|
|
|
|
|
|
// AST
|
|
|
|
|
2020-12-31 14:31:34 +01:00
|
|
|
#[derive(Debug)]
|
|
|
|
pub struct Assign<'a> {
|
|
|
|
pub name: Token<'a>,
|
|
|
|
pub value: Box<Expr<'a>>,
|
|
|
|
}
|
|
|
|
|
2020-11-28 19:53:51 +01:00
|
|
|
#[derive(Debug)]
|
2020-12-06 15:49:44 +01:00
|
|
|
pub struct Binary<'a> {
|
2020-12-19 13:01:16 +01:00
|
|
|
pub left: Box<Expr<'a>>,
|
|
|
|
pub operator: Token<'a>,
|
|
|
|
pub right: Box<Expr<'a>>,
|
2020-11-28 19:53:51 +01:00
|
|
|
}
|
|
|
|
|
2021-01-06 18:35:05 +01:00
|
|
|
#[derive(Debug)]
|
|
|
|
pub struct Logical<'a> {
|
|
|
|
pub left: Box<Expr<'a>>,
|
|
|
|
pub operator: Token<'a>,
|
|
|
|
pub right: Box<Expr<'a>>,
|
|
|
|
}
|
|
|
|
|
2020-11-28 19:53:51 +01:00
|
|
|
#[derive(Debug)]
|
2020-12-19 13:01:16 +01:00
|
|
|
pub struct Grouping<'a>(pub Box<Expr<'a>>);
|
2020-11-28 19:53:51 +01:00
|
|
|
|
2020-12-19 13:01:16 +01:00
|
|
|
/// Literal value appearing directly in the source code.
#[derive(Debug, Clone, PartialEq)]
pub enum Literal {
    /// `true` or `false`.
    Boolean(bool),
    /// Numeric literal.
    Number(f64),
    /// String literal.
    String(String),
    /// `nil`.
    Nil,
}
|
|
|
|
|
|
|
|
#[derive(Debug)]
|
2020-12-06 15:49:44 +01:00
|
|
|
pub struct Unary<'a> {
|
2020-12-19 13:01:16 +01:00
|
|
|
pub operator: Token<'a>,
|
|
|
|
pub right: Box<Expr<'a>>,
|
2020-12-06 14:21:06 +01:00
|
|
|
}
|
2020-11-28 19:53:51 +01:00
|
|
|
|
2021-01-11 18:29:20 +01:00
|
|
|
#[derive(Debug)]
|
|
|
|
pub struct Call<'a> {
|
|
|
|
pub callee: Box<Expr<'a>>,
|
|
|
|
pub paren: Token<'a>,
|
|
|
|
pub args: Vec<Expr<'a>>,
|
|
|
|
}
|
|
|
|
|
2020-12-31 14:31:34 +01:00
|
|
|
// Not to be confused with `Var`, which is for assignment.
|
2020-12-22 15:44:25 +01:00
|
|
|
#[derive(Debug)]
|
|
|
|
pub struct Variable<'a>(pub Token<'a>);
|
|
|
|
|
2020-11-28 19:53:51 +01:00
|
|
|
#[derive(Debug)]
|
2020-12-06 15:49:44 +01:00
|
|
|
pub enum Expr<'a> {
|
2020-12-31 14:31:34 +01:00
|
|
|
Assign(Assign<'a>),
|
2020-11-28 19:53:51 +01:00
|
|
|
Binary(Binary<'a>),
|
|
|
|
Grouping(Grouping<'a>),
|
|
|
|
Literal(Literal),
|
2020-12-06 14:21:06 +01:00
|
|
|
Unary(Unary<'a>),
|
2021-01-11 18:29:20 +01:00
|
|
|
Call(Call<'a>),
|
2020-12-22 15:44:25 +01:00
|
|
|
Variable(Variable<'a>),
|
2021-01-06 18:35:05 +01:00
|
|
|
Logical(Logical<'a>),
|
2020-11-28 19:53:51 +01:00
|
|
|
}
|
|
|
|
|
2020-12-31 15:59:19 +01:00
|
|
|
// Variable assignment. Not to be confused with `Variable`, which is
|
|
|
|
// for access.
|
2020-12-22 15:44:25 +01:00
|
|
|
#[derive(Debug)]
|
|
|
|
pub struct Var<'a> {
|
|
|
|
pub name: Token<'a>,
|
|
|
|
pub initialiser: Option<Expr<'a>>,
|
|
|
|
}
|
|
|
|
|
2021-01-03 16:26:26 +01:00
|
|
|
#[derive(Debug)]
|
|
|
|
pub struct If<'a> {
|
|
|
|
pub condition: Expr<'a>,
|
|
|
|
pub then_branch: Box<Statement<'a>>,
|
|
|
|
pub else_branch: Option<Box<Statement<'a>>>,
|
|
|
|
}
|
|
|
|
|
2021-01-06 18:49:20 +01:00
|
|
|
#[derive(Debug)]
|
|
|
|
pub struct While<'a> {
|
|
|
|
pub condition: Expr<'a>,
|
|
|
|
pub body: Box<Statement<'a>>,
|
|
|
|
}
|
|
|
|
|
2020-12-31 16:05:58 +01:00
|
|
|
/// A sequence of statements; used for `{ ... }` blocks, function
/// bodies and the parsed program as a whole.
pub type Block<'a> = Vec<Statement<'a>>;
|
|
|
|
|
2021-01-14 03:02:50 +01:00
|
|
|
#[derive(Debug)]
|
|
|
|
pub struct Function<'a> {
|
|
|
|
pub name: Token<'a>,
|
|
|
|
pub params: Vec<Token<'a>>,
|
|
|
|
pub body: Block<'a>,
|
|
|
|
}
|
|
|
|
|
2020-12-21 00:13:22 +01:00
|
|
|
#[derive(Debug)]
|
2020-12-31 15:59:19 +01:00
|
|
|
pub enum Statement<'a> {
|
|
|
|
Expr(Expr<'a>),
|
|
|
|
Print(Expr<'a>),
|
2020-12-22 15:44:25 +01:00
|
|
|
Var(Var<'a>),
|
2020-12-31 16:05:58 +01:00
|
|
|
Block(Block<'a>),
|
2021-01-03 16:26:26 +01:00
|
|
|
If(If<'a>),
|
2021-01-06 18:49:20 +01:00
|
|
|
While(While<'a>),
|
2021-01-14 03:02:50 +01:00
|
|
|
Function(Function<'a>),
|
2020-12-21 00:13:22 +01:00
|
|
|
}
|
|
|
|
|
2020-11-28 19:53:51 +01:00
|
|
|
// Parser
|
|
|
|
|
|
|
|
/*
|
2020-12-21 00:13:22 +01:00
|
|
|
program → declaration* EOF ;
|
|
|
|
|
2021-01-14 03:02:50 +01:00
|
|
|
declaration → funDecl
|
|
|
|
| varDecl
|
2020-12-21 00:13:22 +01:00
|
|
|
| statement ;
|
2020-12-20 23:55:40 +01:00
|
|
|
|
2021-01-14 03:02:50 +01:00
|
|
|
funDecl → "fun" function ;
|
|
|
|
function → IDENTIFIER "(" parameters? ")" block ;
|
|
|
|
parameters → IDENTIFIER ( "," IDENTIFIER )* ;
|
|
|
|
|
|
|
|
|
2020-12-20 23:55:40 +01:00
|
|
|
statement → exprStmt
|
2021-01-06 23:57:37 +01:00
|
|
|
| forStmt
|
2021-01-03 16:26:26 +01:00
|
|
|
| ifStmt
|
|
|
|
| printStmt
|
2021-01-06 18:49:20 +01:00
|
|
|
| whileStmt
|
2021-01-03 16:26:26 +01:00
|
|
|
| block ;
|
2020-12-20 23:55:40 +01:00
|
|
|
|
2021-01-06 23:57:37 +01:00
|
|
|
forStmt → "for" "(" ( varDecl | exprStmt | ";" )
|
|
|
|
expression? ";"
|
|
|
|
expression? ")" statement ;
|
|
|
|
|
2021-01-06 18:49:20 +01:00
|
|
|
whileStmt → "while" "(" expression ")" statement ;
|
|
|
|
|
2020-12-20 23:55:40 +01:00
|
|
|
exprStmt → expression ";" ;
|
2021-01-03 16:26:26 +01:00
|
|
|
|
|
|
|
ifStmt → "if" "(" expression ")" statement
|
|
|
|
( "else" statement )? ;
|
|
|
|
|
2020-12-20 23:55:40 +01:00
|
|
|
printStmt → "print" expression ";" ;
|
|
|
|
|
2020-12-31 14:31:34 +01:00
|
|
|
expression → assignment ;
|
|
|
|
assignment → IDENTIFIER "=" assignment
|
2021-01-06 18:35:05 +01:00
|
|
|
| logic_or ;
|
|
|
|
logic_or → logic_and ( "or" logic_and )* ;
|
|
|
|
logic_and → equality ( "and" equality )* ;
|
2020-11-28 19:53:51 +01:00
|
|
|
equality → comparison ( ( "!=" | "==" ) comparison )* ;
|
|
|
|
comparison → term ( ( ">" | ">=" | "<" | "<=" ) term )* ;
|
|
|
|
term → factor ( ( "-" | "+" ) factor )* ;
|
|
|
|
factor → unary ( ( "/" | "*" ) unary )* ;
|
2021-01-11 18:29:20 +01:00
|
|
|
unary → ( "!" | "-" ) unary | call ;
|
|
|
|
call → primary ( "(" arguments? ")" )* ;
|
|
|
|
arguments → expression ( "," expression )* ;
|
2020-11-28 19:53:51 +01:00
|
|
|
primary        → NUMBER | STRING | "true" | "false" | "nil"
               | "(" expression ")" | IDENTIFIER ;
|
|
|
|
*/
|
|
|
|
|
|
|
|
struct Parser<'a> {
|
|
|
|
tokens: Vec<Token<'a>>,
|
|
|
|
current: usize,
|
|
|
|
}
|
|
|
|
|
2020-12-06 14:43:43 +01:00
|
|
|
type ExprResult<'a> = Result<Expr<'a>, Error>;
|
2020-12-20 23:55:40 +01:00
|
|
|
type StmtResult<'a> = Result<Statement<'a>, Error>;
|
2020-12-06 14:43:43 +01:00
|
|
|
|
2020-11-28 19:53:51 +01:00
|
|
|
impl<'a> Parser<'a> {
|
|
|
|
// recursive-descent parser functions
|
|
|
|
|
2020-12-31 15:59:19 +01:00
|
|
|
fn declaration(&mut self) -> StmtResult<'a> {
|
2021-01-14 03:02:50 +01:00
|
|
|
if self.match_token(&TokenKind::Fun) {
|
|
|
|
return self.function();
|
|
|
|
}
|
|
|
|
|
2021-01-14 02:00:54 +01:00
|
|
|
if self.match_token(&TokenKind::Var) {
|
2020-12-22 15:44:25 +01:00
|
|
|
return self.var_declaration();
|
|
|
|
}
|
|
|
|
|
2020-12-31 15:59:19 +01:00
|
|
|
self.statement()
|
2020-12-21 00:13:22 +01:00
|
|
|
}
|
|
|
|
|
2021-01-14 03:02:50 +01:00
|
|
|
fn function(&mut self) -> StmtResult<'a> {
|
|
|
|
let name = self.identifier("Expected function name.")?;
|
|
|
|
|
|
|
|
self.consume(
|
|
|
|
&TokenKind::LeftParen,
|
|
|
|
ErrorKind::ExpectedToken("Expect '(' after function name."),
|
|
|
|
)?;
|
|
|
|
|
|
|
|
let mut params = vec![];
|
|
|
|
|
|
|
|
if !self.check_token(&TokenKind::RightParen) {
|
|
|
|
loop {
|
|
|
|
if params.len() >= 255 {
|
|
|
|
return Err(Error {
|
|
|
|
line: self.peek().line,
|
|
|
|
kind: ErrorKind::InternalError("255 parameter limit exceeded.".into()),
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
params.push(self.identifier("Expected parameter name.")?);
|
|
|
|
|
|
|
|
if !self.match_token(&TokenKind::Comma) {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
self.consume(
|
|
|
|
&TokenKind::RightParen,
|
|
|
|
ErrorKind::ExpectedToken("Expect ')' after parameters."),
|
|
|
|
)?;
|
|
|
|
|
|
|
|
self.consume(
|
|
|
|
&TokenKind::LeftBrace,
|
|
|
|
ErrorKind::ExpectedToken("Expect '{' before function body."),
|
|
|
|
)?;
|
|
|
|
|
|
|
|
Ok(Statement::Function(Function {
|
|
|
|
name,
|
|
|
|
params,
|
|
|
|
body: self.block_statement()?,
|
|
|
|
}))
|
|
|
|
}
|
|
|
|
|
2020-12-31 15:59:19 +01:00
|
|
|
fn var_declaration(&mut self) -> StmtResult<'a> {
|
2020-12-22 15:44:25 +01:00
|
|
|
// Since `TokenKind::Identifier` carries data, we can't use
|
|
|
|
// `consume`.
|
2021-01-14 02:50:28 +01:00
|
|
|
let mut var = Var {
|
|
|
|
name: self.identifier("Expected variable name.")?,
|
|
|
|
initialiser: None,
|
|
|
|
};
|
2020-12-22 15:44:25 +01:00
|
|
|
|
2021-01-14 02:50:28 +01:00
|
|
|
if self.match_token(&TokenKind::Equal) {
|
|
|
|
var.initialiser = Some(self.expression()?);
|
2020-12-22 15:44:25 +01:00
|
|
|
}
|
|
|
|
|
2021-01-14 02:50:28 +01:00
|
|
|
self.consume(&TokenKind::Semicolon, ErrorKind::ExpectedSemicolon)?;
|
|
|
|
Ok(Statement::Var(var))
|
2020-12-22 15:44:25 +01:00
|
|
|
}
|
|
|
|
|
2020-12-20 23:55:40 +01:00
|
|
|
fn statement(&mut self) -> StmtResult<'a> {
|
2021-01-14 02:00:54 +01:00
|
|
|
if self.match_token(&TokenKind::Print) {
|
2020-12-20 23:55:40 +01:00
|
|
|
self.print_statement()
|
2021-01-14 02:00:54 +01:00
|
|
|
} else if self.match_token(&TokenKind::LeftBrace) {
|
2021-01-14 03:02:50 +01:00
|
|
|
Ok(Statement::Block(self.block_statement()?))
|
2021-01-14 02:00:54 +01:00
|
|
|
} else if self.match_token(&TokenKind::If) {
|
2021-01-03 16:26:26 +01:00
|
|
|
self.if_statement()
|
2021-01-14 02:00:54 +01:00
|
|
|
} else if self.match_token(&TokenKind::While) {
|
2021-01-06 18:49:20 +01:00
|
|
|
self.while_statement()
|
2021-01-14 02:00:54 +01:00
|
|
|
} else if self.match_token(&TokenKind::For) {
|
2021-01-06 23:57:37 +01:00
|
|
|
self.for_statement()
|
2020-12-20 23:55:40 +01:00
|
|
|
} else {
|
|
|
|
self.expr_statement()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fn print_statement(&mut self) -> StmtResult<'a> {
|
|
|
|
let expr = self.expression()?;
|
|
|
|
self.consume(&TokenKind::Semicolon, ErrorKind::ExpectedSemicolon)?;
|
|
|
|
Ok(Statement::Print(expr))
|
|
|
|
}
|
|
|
|
|
2021-01-14 03:02:50 +01:00
|
|
|
fn block_statement(&mut self) -> Result<Block<'a>, Error> {
|
2020-12-31 16:05:58 +01:00
|
|
|
let mut block: Block<'a> = vec![];
|
|
|
|
|
|
|
|
while !self.check_token(&TokenKind::RightBrace) && !self.is_at_end() {
|
|
|
|
block.push(self.declaration()?);
|
|
|
|
}
|
|
|
|
|
|
|
|
self.consume(&TokenKind::RightBrace, ErrorKind::ExpectedClosingBrace)?;
|
|
|
|
|
2021-01-14 03:02:50 +01:00
|
|
|
Ok(block)
|
2020-12-31 16:05:58 +01:00
|
|
|
}
|
|
|
|
|
2021-01-03 16:26:26 +01:00
|
|
|
fn if_statement(&mut self) -> StmtResult<'a> {
|
|
|
|
self.consume(
|
|
|
|
&TokenKind::LeftParen,
|
|
|
|
ErrorKind::ExpectedToken("Expected '(' after 'if'"),
|
|
|
|
)?;
|
|
|
|
let condition = self.expression()?;
|
|
|
|
self.consume(
|
|
|
|
&TokenKind::RightParen,
|
|
|
|
ErrorKind::ExpectedToken("Expected ')' after condition"),
|
|
|
|
)?;
|
|
|
|
|
|
|
|
let then_branch = Box::new(self.statement()?);
|
|
|
|
|
|
|
|
let mut stmt = If {
|
|
|
|
condition,
|
|
|
|
then_branch,
|
|
|
|
else_branch: Option::None,
|
|
|
|
};
|
|
|
|
|
2021-01-14 02:00:54 +01:00
|
|
|
if self.match_token(&TokenKind::Else) {
|
2021-01-03 16:26:26 +01:00
|
|
|
stmt.else_branch = Some(Box::new(self.statement()?));
|
|
|
|
}
|
|
|
|
|
|
|
|
Ok(Statement::If(stmt))
|
|
|
|
}
|
|
|
|
|
2021-01-06 18:49:20 +01:00
|
|
|
fn while_statement(&mut self) -> StmtResult<'a> {
|
|
|
|
self.consume(
|
|
|
|
&TokenKind::LeftParen,
|
|
|
|
ErrorKind::ExpectedToken("Expected '(' after 'while'"),
|
|
|
|
)?;
|
|
|
|
|
|
|
|
let condition = self.expression()?;
|
|
|
|
|
|
|
|
self.consume(
|
|
|
|
&TokenKind::RightParen,
|
|
|
|
ErrorKind::ExpectedToken("Expected ')' after 'while'"),
|
|
|
|
)?;
|
|
|
|
|
|
|
|
Ok(Statement::While(While {
|
|
|
|
condition,
|
|
|
|
body: Box::new(self.statement()?),
|
|
|
|
}))
|
|
|
|
}
|
|
|
|
|
2021-01-06 23:57:37 +01:00
|
|
|
fn for_statement(&mut self) -> StmtResult<'a> {
|
|
|
|
// Parsing of clauses ...
|
|
|
|
self.consume(
|
|
|
|
&TokenKind::LeftParen,
|
|
|
|
ErrorKind::ExpectedToken("Expected '(' after 'for'"),
|
|
|
|
)?;
|
|
|
|
|
2021-01-14 02:00:54 +01:00
|
|
|
let initialiser = if self.match_token(&TokenKind::Semicolon) {
|
2021-01-06 23:57:37 +01:00
|
|
|
None
|
2021-01-14 02:00:54 +01:00
|
|
|
} else if self.match_token(&TokenKind::Var) {
|
2021-01-06 23:57:37 +01:00
|
|
|
Some(self.var_declaration()?)
|
|
|
|
} else {
|
|
|
|
Some(self.expr_statement()?)
|
|
|
|
};
|
|
|
|
|
|
|
|
let condition = if self.check_token(&TokenKind::Semicolon) {
|
|
|
|
// unspecified condition => infinite loop
|
|
|
|
Expr::Literal(Literal::Boolean(true))
|
|
|
|
} else {
|
|
|
|
self.expression()?
|
|
|
|
};
|
|
|
|
|
|
|
|
self.consume(&TokenKind::Semicolon, ErrorKind::ExpectedSemicolon)?;
|
|
|
|
|
|
|
|
let increment = if self.check_token(&TokenKind::RightParen) {
|
|
|
|
None
|
|
|
|
} else {
|
|
|
|
Some(self.expression()?)
|
|
|
|
};
|
|
|
|
|
|
|
|
self.consume(
|
|
|
|
&TokenKind::RightParen,
|
|
|
|
ErrorKind::ExpectedToken("Expected ')' after for clauses"),
|
|
|
|
)?;
|
|
|
|
|
|
|
|
let mut body = self.statement()?;
|
|
|
|
|
|
|
|
// ... desugaring to while
|
|
|
|
|
|
|
|
if let Some(inc) = increment {
|
|
|
|
body = Statement::Block(vec![body, Statement::Expr(inc)]);
|
|
|
|
}
|
|
|
|
|
|
|
|
body = Statement::While(While {
|
|
|
|
condition,
|
|
|
|
body: Box::new(body),
|
|
|
|
});
|
|
|
|
|
|
|
|
if let Some(init) = initialiser {
|
|
|
|
body = Statement::Block(vec![init, body]);
|
|
|
|
}
|
|
|
|
|
|
|
|
Ok(body)
|
|
|
|
}
|
|
|
|
|
2020-12-20 23:55:40 +01:00
|
|
|
fn expr_statement(&mut self) -> StmtResult<'a> {
|
|
|
|
let expr = self.expression()?;
|
|
|
|
self.consume(&TokenKind::Semicolon, ErrorKind::ExpectedSemicolon)?;
|
|
|
|
Ok(Statement::Expr(expr))
|
|
|
|
}
|
|
|
|
|
2020-12-06 14:43:43 +01:00
|
|
|
fn expression(&mut self) -> ExprResult<'a> {
|
2020-12-31 14:31:34 +01:00
|
|
|
self.assignment()
|
|
|
|
}
|
|
|
|
|
|
|
|
fn assignment(&mut self) -> ExprResult<'a> {
|
2021-01-06 18:35:05 +01:00
|
|
|
let expr = self.logic_or()?;
|
2020-12-31 14:31:34 +01:00
|
|
|
|
2021-01-14 02:00:54 +01:00
|
|
|
if self.match_token(&TokenKind::Equal) {
|
2020-12-31 14:31:34 +01:00
|
|
|
let equals = self.previous().clone();
|
|
|
|
let value = self.assignment()?;
|
|
|
|
|
|
|
|
if let Expr::Variable(Variable(name)) = expr {
|
|
|
|
return Ok(Expr::Assign(Assign {
|
|
|
|
name,
|
|
|
|
value: Box::new(value),
|
|
|
|
}));
|
|
|
|
}
|
|
|
|
|
|
|
|
return Err(Error {
|
|
|
|
line: equals.line,
|
|
|
|
kind: ErrorKind::InvalidAssignmentTarget(format!("{:?}", equals)),
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
Ok(expr)
|
2020-11-28 19:53:51 +01:00
|
|
|
}
|
|
|
|
|
2021-01-06 18:35:05 +01:00
|
|
|
fn logic_or(&mut self) -> ExprResult<'a> {
|
|
|
|
let mut expr = self.logic_and()?;
|
|
|
|
|
2021-01-14 02:00:54 +01:00
|
|
|
while self.match_token(&TokenKind::Or) {
|
2021-01-06 18:35:05 +01:00
|
|
|
expr = Expr::Logical(Logical {
|
|
|
|
left: Box::new(expr),
|
|
|
|
operator: self.previous().clone(),
|
|
|
|
right: Box::new(self.logic_and()?),
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
Ok(expr)
|
|
|
|
}
|
|
|
|
|
|
|
|
fn logic_and(&mut self) -> ExprResult<'a> {
|
|
|
|
let mut expr = self.equality()?;
|
|
|
|
|
2021-01-14 02:00:54 +01:00
|
|
|
while self.match_token(&TokenKind::And) {
|
2021-01-06 18:35:05 +01:00
|
|
|
expr = Expr::Logical(Logical {
|
|
|
|
left: Box::new(expr),
|
|
|
|
operator: self.previous().clone(),
|
|
|
|
right: Box::new(self.equality()?),
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
Ok(expr)
|
|
|
|
}
|
|
|
|
|
2020-12-06 14:43:43 +01:00
|
|
|
fn equality(&mut self) -> ExprResult<'a> {
|
2020-12-06 14:21:06 +01:00
|
|
|
self.binary_operator(
|
|
|
|
&[TokenKind::BangEqual, TokenKind::EqualEqual],
|
|
|
|
Self::comparison,
|
|
|
|
)
|
2020-11-28 19:53:51 +01:00
|
|
|
}
|
|
|
|
|
2020-12-06 14:43:43 +01:00
|
|
|
fn comparison(&mut self) -> ExprResult<'a> {
|
2020-12-06 14:21:06 +01:00
|
|
|
self.binary_operator(
|
|
|
|
&[
|
|
|
|
TokenKind::Greater,
|
|
|
|
TokenKind::GreaterEqual,
|
|
|
|
TokenKind::Less,
|
|
|
|
TokenKind::LessEqual,
|
|
|
|
],
|
|
|
|
Self::term,
|
|
|
|
)
|
|
|
|
}
|
|
|
|
|
2020-12-06 14:43:43 +01:00
|
|
|
fn term(&mut self) -> ExprResult<'a> {
|
|
|
|
self.binary_operator(&[TokenKind::Minus, TokenKind::Plus], Self::factor)
|
2020-12-06 14:21:06 +01:00
|
|
|
}
|
|
|
|
|
2020-12-06 14:43:43 +01:00
|
|
|
fn factor(&mut self) -> ExprResult<'a> {
|
|
|
|
self.binary_operator(&[TokenKind::Slash, TokenKind::Star], Self::unary)
|
2020-12-06 14:21:06 +01:00
|
|
|
}
|
|
|
|
|
2020-12-06 14:43:43 +01:00
|
|
|
fn unary(&mut self) -> ExprResult<'a> {
|
2021-01-14 02:00:54 +01:00
|
|
|
if self.match_token(&TokenKind::Bang) || self.match_token(&TokenKind::Minus) {
|
2020-12-06 14:43:43 +01:00
|
|
|
return Ok(Expr::Unary(Unary {
|
2020-12-06 18:03:09 +01:00
|
|
|
operator: self.previous().clone(),
|
2020-12-06 14:43:43 +01:00
|
|
|
right: Box::new(self.unary()?),
|
|
|
|
}));
|
2020-12-06 14:21:06 +01:00
|
|
|
}
|
|
|
|
|
2021-01-11 18:29:20 +01:00
|
|
|
return self.call();
|
|
|
|
}
|
|
|
|
|
|
|
|
fn call(&mut self) -> ExprResult<'a> {
|
|
|
|
let mut expr = self.primary()?;
|
|
|
|
|
|
|
|
loop {
|
2021-01-14 02:00:54 +01:00
|
|
|
if self.match_token(&TokenKind::LeftParen) {
|
2021-01-11 18:29:20 +01:00
|
|
|
expr = self.finish_call(expr)?;
|
|
|
|
} else {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
Ok(expr)
|
|
|
|
}
|
|
|
|
|
|
|
|
fn finish_call(&mut self, callee: Expr<'a>) -> ExprResult<'a> {
|
|
|
|
let mut args = vec![];
|
|
|
|
|
|
|
|
if !self.check_token(&TokenKind::RightParen) {
|
|
|
|
loop {
|
|
|
|
// TODO(tazjin): Check for max args count
|
|
|
|
args.push(self.expression()?);
|
2021-01-14 02:00:54 +01:00
|
|
|
if !self.match_token(&TokenKind::Comma) {
|
2021-01-11 18:29:20 +01:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
let paren = self.consume(
|
|
|
|
&TokenKind::RightParen,
|
|
|
|
ErrorKind::ExpectedToken("Expect ')' after arguments."),
|
|
|
|
)?;
|
|
|
|
|
|
|
|
Ok(Expr::Call(Call {
|
|
|
|
args,
|
|
|
|
callee: Box::new(callee),
|
|
|
|
paren,
|
|
|
|
}))
|
2020-12-06 14:21:06 +01:00
|
|
|
}
|
|
|
|
|
2020-12-06 14:43:43 +01:00
|
|
|
fn primary(&mut self) -> ExprResult<'a> {
|
2020-12-06 14:21:06 +01:00
|
|
|
let next = self.advance();
|
|
|
|
let literal = match next.kind {
|
|
|
|
TokenKind::True => Literal::Boolean(true),
|
|
|
|
TokenKind::False => Literal::Boolean(false),
|
|
|
|
TokenKind::Nil => Literal::Nil,
|
|
|
|
TokenKind::Number(num) => Literal::Number(num),
|
|
|
|
TokenKind::String(string) => Literal::String(string),
|
|
|
|
|
|
|
|
TokenKind::LeftParen => {
|
2020-12-06 15:28:16 +01:00
|
|
|
let expr = self.expression()?;
|
|
|
|
self.consume(&TokenKind::RightParen, ErrorKind::UnmatchedParens)?;
|
|
|
|
return Ok(Expr::Grouping(Grouping(Box::new(expr))));
|
2020-12-06 14:21:06 +01:00
|
|
|
}
|
|
|
|
|
2020-12-22 15:44:25 +01:00
|
|
|
TokenKind::Identifier(_) => return Ok(Expr::Variable(Variable(next))),
|
|
|
|
|
2020-12-06 18:03:09 +01:00
|
|
|
unexpected => {
|
|
|
|
eprintln!("encountered {:?}", unexpected);
|
|
|
|
return Err(Error {
|
|
|
|
line: next.line,
|
|
|
|
kind: ErrorKind::ExpectedExpression(next.lexeme.into_iter().collect()),
|
|
|
|
});
|
|
|
|
}
|
2020-12-06 14:21:06 +01:00
|
|
|
};
|
|
|
|
|
2020-12-06 14:43:43 +01:00
|
|
|
Ok(Expr::Literal(literal))
|
2020-11-28 19:53:51 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
// internal helpers
|
2020-12-06 14:21:06 +01:00
|
|
|
|
2021-01-14 02:50:28 +01:00
|
|
|
fn identifier(&mut self, err: &'static str) -> Result<Token<'a>, Error> {
|
|
|
|
if let TokenKind::Identifier(_) = self.peek().kind {
|
|
|
|
Ok(self.advance())
|
|
|
|
} else {
|
|
|
|
Err(Error {
|
|
|
|
line: self.peek().line,
|
|
|
|
kind: ErrorKind::ExpectedToken(err),
|
|
|
|
})
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-12-06 14:21:06 +01:00
|
|
|
/// Check if the next token is in `oneof`, and advance if it is.
|
2021-01-14 02:00:54 +01:00
|
|
|
fn match_token(&mut self, token: &TokenKind) -> bool {
|
|
|
|
if self.check_token(token) {
|
|
|
|
self.advance();
|
|
|
|
return true;
|
2020-11-28 19:53:51 +01:00
|
|
|
}
|
|
|
|
|
2021-01-14 02:00:54 +01:00
|
|
|
false
|
2020-11-28 19:53:51 +01:00
|
|
|
}
|
|
|
|
|
2020-12-06 14:21:06 +01:00
|
|
|
/// Return the next token and advance parser state.
|
|
|
|
fn advance(&mut self) -> Token<'a> {
|
2020-11-28 19:53:51 +01:00
|
|
|
if !self.is_at_end() {
|
|
|
|
self.current += 1;
|
|
|
|
}
|
|
|
|
|
2020-12-06 18:03:09 +01:00
|
|
|
return self.previous().clone();
|
2020-11-28 19:53:51 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
fn is_at_end(&self) -> bool {
|
|
|
|
self.check_token(&TokenKind::Eof)
|
|
|
|
}
|
|
|
|
|
2020-12-06 14:21:06 +01:00
|
|
|
/// Is the next token `token`?
|
2020-11-28 19:53:51 +01:00
|
|
|
fn check_token(&self, token: &TokenKind) -> bool {
|
|
|
|
self.peek().kind == *token
|
|
|
|
}
|
|
|
|
|
2020-12-06 14:21:06 +01:00
|
|
|
fn peek(&self) -> &Token<'a> {
|
2020-11-28 19:53:51 +01:00
|
|
|
&self.tokens[self.current]
|
|
|
|
}
|
|
|
|
|
2020-12-06 18:03:09 +01:00
|
|
|
fn previous(&self) -> &Token<'a> {
|
|
|
|
&self.tokens[self.current - 1]
|
2020-12-06 14:21:06 +01:00
|
|
|
}
|
|
|
|
|
2021-01-11 18:29:20 +01:00
|
|
|
fn consume(&mut self, kind: &TokenKind, err: ErrorKind) -> Result<Token<'a>, Error> {
|
2020-12-06 15:28:16 +01:00
|
|
|
if self.check_token(kind) {
|
2020-12-22 15:44:25 +01:00
|
|
|
return Ok(self.advance());
|
2020-12-06 15:28:16 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
Err(Error {
|
|
|
|
line: self.peek().line,
|
|
|
|
kind: err,
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
2020-12-06 18:03:09 +01:00
|
|
|
fn synchronise(&mut self) {
|
|
|
|
self.advance();
|
|
|
|
|
|
|
|
while !self.is_at_end() {
|
|
|
|
if self.previous().kind == TokenKind::Semicolon {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
match self.peek().kind {
|
|
|
|
TokenKind::Class
|
|
|
|
| TokenKind::Fun
|
|
|
|
| TokenKind::Var
|
|
|
|
| TokenKind::For
|
|
|
|
| TokenKind::If
|
|
|
|
| TokenKind::While
|
|
|
|
| TokenKind::Print
|
|
|
|
| TokenKind::Return => return,
|
|
|
|
|
|
|
|
_ => {
|
|
|
|
self.advance();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-12-06 14:21:06 +01:00
|
|
|
fn binary_operator(
|
|
|
|
&mut self,
|
|
|
|
oneof: &[TokenKind],
|
2020-12-06 14:43:43 +01:00
|
|
|
each: fn(&mut Parser<'a>) -> ExprResult<'a>,
|
|
|
|
) -> ExprResult<'a> {
|
|
|
|
let mut expr = each(self)?;
|
2020-12-06 14:21:06 +01:00
|
|
|
|
2021-01-14 02:00:54 +01:00
|
|
|
while oneof.iter().any(|t| self.match_token(t)) {
|
2020-12-06 14:21:06 +01:00
|
|
|
expr = Expr::Binary(Binary {
|
|
|
|
left: Box::new(expr),
|
2020-12-06 18:03:09 +01:00
|
|
|
operator: self.previous().clone(),
|
2020-12-06 14:43:43 +01:00
|
|
|
right: Box::new(each(self)?),
|
2020-12-06 14:21:06 +01:00
|
|
|
})
|
|
|
|
}
|
|
|
|
|
2020-12-06 14:43:43 +01:00
|
|
|
return Ok(expr);
|
2020-11-28 19:53:51 +01:00
|
|
|
}
|
|
|
|
}
|
2020-12-06 15:49:44 +01:00
|
|
|
|
2020-12-31 16:05:58 +01:00
|
|
|
pub fn parse<'a>(tokens: Vec<Token<'a>>) -> Result<Block<'a>, Vec<Error>> {
|
2020-12-06 15:49:44 +01:00
|
|
|
let mut parser = Parser { tokens, current: 0 };
|
2020-12-31 16:05:58 +01:00
|
|
|
let mut program: Block<'a> = vec![];
|
2020-12-06 18:03:09 +01:00
|
|
|
let mut errors: Vec<Error> = vec![];
|
|
|
|
|
|
|
|
while !parser.is_at_end() {
|
2020-12-21 00:13:22 +01:00
|
|
|
match parser.declaration() {
|
2020-12-06 18:03:09 +01:00
|
|
|
Err(err) => {
|
|
|
|
errors.push(err);
|
|
|
|
parser.synchronise();
|
|
|
|
}
|
2020-12-21 00:13:22 +01:00
|
|
|
Ok(decl) => {
|
|
|
|
program.push(decl);
|
2020-12-06 18:03:09 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2020-12-06 15:49:44 +01:00
|
|
|
|
2020-12-20 23:55:40 +01:00
|
|
|
if errors.is_empty() {
|
|
|
|
Ok(program)
|
|
|
|
} else {
|
|
|
|
Err(errors)
|
|
|
|
}
|
2020-12-06 15:49:44 +01:00
|
|
|
}
|