2020-11-28 19:53:51 +01:00
|
|
|
// This implements the grammar of Lox as described starting in the
|
|
|
|
// Crafting Interpreters chapter "Representing Code". Note that the
|
2020-12-06 14:21:06 +01:00
|
|
|
// upstream Java implementation works around Java being bad at value
|
2020-11-28 19:53:51 +01:00
|
|
|
// classes by writing a code generator for Java.
|
|
|
|
//
|
|
|
|
// My Rust implementation skips this step because it is unnecessary:
// Rust has real value types.
|
2020-12-06 14:43:43 +01:00
|
|
|
use crate::errors::{Error, ErrorKind};
|
2020-11-28 19:53:51 +01:00
|
|
|
use crate::scanner::{Token, TokenKind};
|
|
|
|
|
|
|
|
// AST
|
|
|
|
|
|
|
|
#[derive(Debug)]
|
2020-12-06 15:49:44 +01:00
|
|
|
pub struct Binary<'a> {
|
2020-11-28 19:53:51 +01:00
|
|
|
left: Box<Expr<'a>>,
|
|
|
|
operator: Token<'a>,
|
2020-12-06 14:21:06 +01:00
|
|
|
right: Box<Expr<'a>>,
|
2020-11-28 19:53:51 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
#[derive(Debug)]
|
2020-12-06 15:49:44 +01:00
|
|
|
pub struct Grouping<'a>(Box<Expr<'a>>);
|
2020-11-28 19:53:51 +01:00
|
|
|
|
|
|
|
/// A literal value appearing directly in the source code.
///
/// `Clone` and `PartialEq` are derived so that literals can be copied
/// and compared structurally (for example in tests). Note that number
/// comparison follows `f64` semantics, i.e. `NaN` is not equal to
/// itself.
#[derive(Clone, Debug, PartialEq)]
pub enum Literal {
    /// `true` or `false`.
    Boolean(bool),

    /// A numeric literal.
    Number(f64),

    /// A string literal, stored as an owned string.
    String(String),

    /// The `nil` literal.
    Nil,
}
|
|
|
|
|
|
|
|
#[derive(Debug)]
|
2020-12-06 15:49:44 +01:00
|
|
|
pub struct Unary<'a> {
|
2020-12-06 14:21:06 +01:00
|
|
|
operator: Token<'a>,
|
|
|
|
right: Box<Expr<'a>>,
|
|
|
|
}
|
2020-11-28 19:53:51 +01:00
|
|
|
|
|
|
|
#[derive(Debug)]
|
2020-12-06 15:49:44 +01:00
|
|
|
pub enum Expr<'a> {
|
2020-11-28 19:53:51 +01:00
|
|
|
Binary(Binary<'a>),
|
|
|
|
Grouping(Grouping<'a>),
|
|
|
|
Literal(Literal),
|
2020-12-06 14:21:06 +01:00
|
|
|
Unary(Unary<'a>),
|
2020-11-28 19:53:51 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
// Parser
|
|
|
|
|
|
|
|
/*
|
|
|
|
expression → equality ;
|
|
|
|
equality → comparison ( ( "!=" | "==" ) comparison )* ;
|
|
|
|
comparison → term ( ( ">" | ">=" | "<" | "<=" ) term )* ;
|
|
|
|
term → factor ( ( "-" | "+" ) factor )* ;
|
|
|
|
factor → unary ( ( "/" | "*" ) unary )* ;
|
|
|
|
unary → ( "!" | "-" ) unary
|
|
|
|
| primary ;
|
|
|
|
primary → NUMBER | STRING | "true" | "false" | "nil"
|
|
|
|
| "(" expression ")" ;
|
|
|
|
*/
|
|
|
|
|
|
|
|
struct Parser<'a> {
|
|
|
|
tokens: Vec<Token<'a>>,
|
|
|
|
current: usize,
|
|
|
|
}
|
|
|
|
|
2020-12-06 14:43:43 +01:00
|
|
|
/// Result of a parser function: the parsed expression, or the error
/// that stopped parsing.
type ExprResult<'a> = Result<Expr<'a>, Error>;
|
|
|
|
|
2020-11-28 19:53:51 +01:00
|
|
|
impl<'a> Parser<'a> {
|
|
|
|
// recursive-descent parser functions
|
|
|
|
|
2020-12-06 14:43:43 +01:00
|
|
|
fn expression(&mut self) -> ExprResult<'a> {
|
2020-11-28 19:53:51 +01:00
|
|
|
self.equality()
|
|
|
|
}
|
|
|
|
|
2020-12-06 14:43:43 +01:00
|
|
|
fn equality(&mut self) -> ExprResult<'a> {
|
2020-12-06 14:21:06 +01:00
|
|
|
self.binary_operator(
|
|
|
|
&[TokenKind::BangEqual, TokenKind::EqualEqual],
|
|
|
|
Self::comparison,
|
|
|
|
)
|
2020-11-28 19:53:51 +01:00
|
|
|
}
|
|
|
|
|
2020-12-06 14:43:43 +01:00
|
|
|
fn comparison(&mut self) -> ExprResult<'a> {
|
2020-12-06 14:21:06 +01:00
|
|
|
self.binary_operator(
|
|
|
|
&[
|
|
|
|
TokenKind::Greater,
|
|
|
|
TokenKind::GreaterEqual,
|
|
|
|
TokenKind::Less,
|
|
|
|
TokenKind::LessEqual,
|
|
|
|
],
|
|
|
|
Self::term,
|
|
|
|
)
|
|
|
|
}
|
|
|
|
|
2020-12-06 14:43:43 +01:00
|
|
|
fn term(&mut self) -> ExprResult<'a> {
|
|
|
|
self.binary_operator(&[TokenKind::Minus, TokenKind::Plus], Self::factor)
|
2020-12-06 14:21:06 +01:00
|
|
|
}
|
|
|
|
|
2020-12-06 14:43:43 +01:00
|
|
|
fn factor(&mut self) -> ExprResult<'a> {
|
|
|
|
self.binary_operator(&[TokenKind::Slash, TokenKind::Star], Self::unary)
|
2020-12-06 14:21:06 +01:00
|
|
|
}
|
|
|
|
|
2020-12-06 14:43:43 +01:00
|
|
|
fn unary(&mut self) -> ExprResult<'a> {
|
2020-12-06 14:21:06 +01:00
|
|
|
if self.match_token(&[TokenKind::Bang, TokenKind::Minus]) {
|
2020-12-06 14:43:43 +01:00
|
|
|
return Ok(Expr::Unary(Unary {
|
2020-12-06 14:21:06 +01:00
|
|
|
operator: self.previous(),
|
2020-12-06 14:43:43 +01:00
|
|
|
right: Box::new(self.unary()?),
|
|
|
|
}));
|
2020-12-06 14:21:06 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
return self.primary();
|
|
|
|
}
|
|
|
|
|
2020-12-06 14:43:43 +01:00
|
|
|
fn primary(&mut self) -> ExprResult<'a> {
|
2020-12-06 14:21:06 +01:00
|
|
|
let next = self.advance();
|
|
|
|
let literal = match next.kind {
|
|
|
|
TokenKind::True => Literal::Boolean(true),
|
|
|
|
TokenKind::False => Literal::Boolean(false),
|
|
|
|
TokenKind::Nil => Literal::Nil,
|
|
|
|
TokenKind::Number(num) => Literal::Number(num),
|
|
|
|
TokenKind::String(string) => Literal::String(string),
|
|
|
|
|
|
|
|
TokenKind::LeftParen => {
|
2020-12-06 15:28:16 +01:00
|
|
|
let expr = self.expression()?;
|
|
|
|
self.consume(&TokenKind::RightParen, ErrorKind::UnmatchedParens)?;
|
|
|
|
return Ok(Expr::Grouping(Grouping(Box::new(expr))));
|
2020-12-06 14:21:06 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
// This branch indicates a parser bug, not invalid input.
|
|
|
|
unexpected => panic!("Parser encountered unexpected token '{:?}'", unexpected),
|
|
|
|
};
|
|
|
|
|
2020-12-06 14:43:43 +01:00
|
|
|
Ok(Expr::Literal(literal))
|
2020-11-28 19:53:51 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
// internal helpers
|
2020-12-06 14:21:06 +01:00
|
|
|
|
|
|
|
/// Check if the next token is in `oneof`, and advance if it is.
|
2020-11-28 19:53:51 +01:00
|
|
|
fn match_token(&mut self, oneof: &[TokenKind]) -> bool {
|
|
|
|
for token in oneof {
|
|
|
|
if self.check_token(token) {
|
|
|
|
self.advance();
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2020-12-06 14:21:06 +01:00
|
|
|
/// Return the next token and advance parser state.
|
|
|
|
fn advance(&mut self) -> Token<'a> {
|
2020-11-28 19:53:51 +01:00
|
|
|
if !self.is_at_end() {
|
|
|
|
self.current += 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
return self.previous();
|
|
|
|
}
|
|
|
|
|
|
|
|
fn is_at_end(&self) -> bool {
|
|
|
|
self.check_token(&TokenKind::Eof)
|
|
|
|
}
|
|
|
|
|
2020-12-06 14:21:06 +01:00
|
|
|
/// Is the next token `token`?
|
2020-11-28 19:53:51 +01:00
|
|
|
fn check_token(&self, token: &TokenKind) -> bool {
|
|
|
|
self.peek().kind == *token
|
|
|
|
}
|
|
|
|
|
2020-12-06 14:21:06 +01:00
|
|
|
fn peek(&self) -> &Token<'a> {
|
2020-11-28 19:53:51 +01:00
|
|
|
&self.tokens[self.current]
|
|
|
|
}
|
|
|
|
|
2020-12-06 14:21:06 +01:00
|
|
|
fn previous(&self) -> Token<'a> {
|
|
|
|
self.tokens[self.current - 1].clone()
|
|
|
|
}
|
|
|
|
|
2020-12-06 15:28:16 +01:00
|
|
|
fn consume(&mut self, kind: &TokenKind, err: ErrorKind) -> Result<(), Error> {
|
|
|
|
if self.check_token(kind) {
|
|
|
|
self.advance();
|
|
|
|
return Ok(());
|
|
|
|
}
|
|
|
|
|
|
|
|
Err(Error {
|
|
|
|
line: self.peek().line,
|
|
|
|
kind: err,
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
2020-12-06 14:21:06 +01:00
|
|
|
fn binary_operator(
|
|
|
|
&mut self,
|
|
|
|
oneof: &[TokenKind],
|
2020-12-06 14:43:43 +01:00
|
|
|
each: fn(&mut Parser<'a>) -> ExprResult<'a>,
|
|
|
|
) -> ExprResult<'a> {
|
|
|
|
let mut expr = each(self)?;
|
2020-12-06 14:21:06 +01:00
|
|
|
|
|
|
|
while self.match_token(oneof) {
|
|
|
|
expr = Expr::Binary(Binary {
|
|
|
|
left: Box::new(expr),
|
|
|
|
operator: self.previous(),
|
2020-12-06 14:43:43 +01:00
|
|
|
right: Box::new(each(self)?),
|
2020-12-06 14:21:06 +01:00
|
|
|
})
|
|
|
|
}
|
|
|
|
|
2020-12-06 14:43:43 +01:00
|
|
|
return Ok(expr);
|
2020-11-28 19:53:51 +01:00
|
|
|
}
|
|
|
|
}
|
2020-12-06 15:49:44 +01:00
|
|
|
|
|
|
|
pub fn parse<'a>(tokens: Vec<Token<'a>>) -> ExprResult<'a> {
|
|
|
|
let mut parser = Parser { tokens, current: 0 };
|
|
|
|
|
|
|
|
parser.expression()
|
|
|
|
}
|