2021-03-08 06:04:44 +01:00
|
|
|
use std::convert::{TryFrom, TryInto};
|
2021-03-07 21:29:59 +01:00
|
|
|
use std::path::Path;
|
|
|
|
use std::result;
|
|
|
|
|
|
|
|
use inkwell::basic_block::BasicBlock;
|
|
|
|
use inkwell::builder::Builder;
|
|
|
|
pub use inkwell::context::Context;
|
|
|
|
use inkwell::module::Module;
|
|
|
|
use inkwell::support::LLVMString;
|
|
|
|
use inkwell::types::FunctionType;
|
2021-03-08 06:04:44 +01:00
|
|
|
use inkwell::values::{AnyValueEnum, BasicValueEnum, FunctionValue};
|
2021-03-07 21:29:59 +01:00
|
|
|
use inkwell::IntPredicate;
|
|
|
|
use thiserror::Error;
|
|
|
|
|
2021-03-13 19:12:03 +01:00
|
|
|
use crate::ast::{BinaryOperator, Binding, Decl, Expr, Fun, Ident, Literal, UnaryOperator};
|
2021-03-07 21:29:59 +01:00
|
|
|
use crate::common::env::Env;
|
|
|
|
|
|
|
|
#[derive(Debug, PartialEq, Eq, Error)]
|
|
|
|
pub enum Error {
|
|
|
|
#[error("Undefined variable {0}")]
|
|
|
|
UndefinedVariable(Ident<'static>),
|
|
|
|
|
|
|
|
#[error("LLVM Error: {0}")]
|
|
|
|
LLVMError(String),
|
|
|
|
}
|
|
|
|
|
|
|
|
impl From<LLVMString> for Error {
|
|
|
|
fn from(s: LLVMString) -> Self {
|
|
|
|
Self::LLVMError(s.to_string())
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
pub type Result<T> = result::Result<T, Error>;
|
|
|
|
|
|
|
|
pub struct Codegen<'ctx, 'ast> {
|
|
|
|
context: &'ctx Context,
|
|
|
|
pub module: Module<'ctx>,
|
|
|
|
builder: Builder<'ctx>,
|
2021-03-08 06:04:44 +01:00
|
|
|
env: Env<'ast, AnyValueEnum<'ctx>>,
|
|
|
|
function_stack: Vec<FunctionValue<'ctx>>,
|
|
|
|
identifier_counter: u32,
|
2021-03-07 21:29:59 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
impl<'ctx, 'ast> Codegen<'ctx, 'ast> {
|
|
|
|
pub fn new(context: &'ctx Context, module_name: &str) -> Self {
|
|
|
|
let module = context.create_module(module_name);
|
|
|
|
let builder = context.create_builder();
|
|
|
|
Self {
|
|
|
|
context,
|
|
|
|
module,
|
|
|
|
builder,
|
|
|
|
env: Default::default(),
|
2021-03-08 06:04:44 +01:00
|
|
|
function_stack: Default::default(),
|
|
|
|
identifier_counter: 0,
|
2021-03-07 21:29:59 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn new_function<'a>(
|
|
|
|
&'a mut self,
|
|
|
|
name: &str,
|
|
|
|
ty: FunctionType<'ctx>,
|
|
|
|
) -> &'a FunctionValue<'ctx> {
|
2021-03-08 06:04:44 +01:00
|
|
|
self.function_stack
|
|
|
|
.push(self.module.add_function(name, ty, None));
|
2021-03-07 21:29:59 +01:00
|
|
|
let basic_block = self.append_basic_block("entry");
|
|
|
|
self.builder.position_at_end(basic_block);
|
2021-03-08 06:04:44 +01:00
|
|
|
self.function_stack.last().unwrap()
|
2021-03-07 21:29:59 +01:00
|
|
|
}
|
|
|
|
|
2021-03-08 06:04:44 +01:00
|
|
|
pub fn finish_function(&mut self, res: &BasicValueEnum<'ctx>) -> FunctionValue<'ctx> {
|
2021-03-07 21:29:59 +01:00
|
|
|
self.builder.build_return(Some(res));
|
2021-03-08 06:04:44 +01:00
|
|
|
self.function_stack.pop().unwrap()
|
2021-03-07 21:29:59 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
pub fn append_basic_block(&self, name: &str) -> BasicBlock<'ctx> {
|
|
|
|
self.context
|
2021-03-08 06:04:44 +01:00
|
|
|
.append_basic_block(*self.function_stack.last().unwrap(), name)
|
2021-03-07 21:29:59 +01:00
|
|
|
}
|
|
|
|
|
2021-03-08 06:04:44 +01:00
|
|
|
pub fn codegen_expr(&mut self, expr: &'ast Expr<'ast>) -> Result<AnyValueEnum<'ctx>> {
|
2021-03-07 21:29:59 +01:00
|
|
|
match expr {
|
|
|
|
Expr::Ident(id) => self
|
|
|
|
.env
|
|
|
|
.resolve(id)
|
|
|
|
.cloned()
|
|
|
|
.ok_or_else(|| Error::UndefinedVariable(id.to_owned())),
|
|
|
|
Expr::Literal(Literal::Int(i)) => {
|
|
|
|
let ty = self.context.i64_type();
|
2021-03-08 06:04:44 +01:00
|
|
|
Ok(AnyValueEnum::IntValue(ty.const_int(*i, false)))
|
2021-03-07 21:29:59 +01:00
|
|
|
}
|
|
|
|
Expr::UnaryOp { op, rhs } => {
|
|
|
|
let rhs = self.codegen_expr(rhs)?;
|
|
|
|
match op {
|
|
|
|
UnaryOperator::Not => unimplemented!(),
|
2021-03-08 06:04:44 +01:00
|
|
|
UnaryOperator::Neg => Ok(AnyValueEnum::IntValue(
|
2021-03-07 21:29:59 +01:00
|
|
|
self.builder.build_int_neg(rhs.into_int_value(), "neg"),
|
|
|
|
)),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
Expr::BinaryOp { lhs, op, rhs } => {
|
|
|
|
let lhs = self.codegen_expr(lhs)?;
|
|
|
|
let rhs = self.codegen_expr(rhs)?;
|
|
|
|
match op {
|
2021-03-08 06:04:44 +01:00
|
|
|
BinaryOperator::Add => Ok(AnyValueEnum::IntValue(self.builder.build_int_add(
|
|
|
|
lhs.into_int_value(),
|
|
|
|
rhs.into_int_value(),
|
|
|
|
"add",
|
|
|
|
))),
|
|
|
|
BinaryOperator::Sub => Ok(AnyValueEnum::IntValue(self.builder.build_int_sub(
|
|
|
|
lhs.into_int_value(),
|
|
|
|
rhs.into_int_value(),
|
|
|
|
"add",
|
|
|
|
))),
|
|
|
|
BinaryOperator::Mul => Ok(AnyValueEnum::IntValue(self.builder.build_int_sub(
|
|
|
|
lhs.into_int_value(),
|
|
|
|
rhs.into_int_value(),
|
|
|
|
"add",
|
|
|
|
))),
|
2021-03-07 21:29:59 +01:00
|
|
|
BinaryOperator::Div => {
|
2021-03-08 06:04:44 +01:00
|
|
|
Ok(AnyValueEnum::IntValue(self.builder.build_int_signed_div(
|
2021-03-07 21:29:59 +01:00
|
|
|
lhs.into_int_value(),
|
|
|
|
rhs.into_int_value(),
|
|
|
|
"add",
|
|
|
|
)))
|
|
|
|
}
|
|
|
|
BinaryOperator::Pow => unimplemented!(),
|
|
|
|
BinaryOperator::Equ => {
|
2021-03-08 06:04:44 +01:00
|
|
|
Ok(AnyValueEnum::IntValue(self.builder.build_int_compare(
|
2021-03-07 21:29:59 +01:00
|
|
|
IntPredicate::EQ,
|
|
|
|
lhs.into_int_value(),
|
|
|
|
rhs.into_int_value(),
|
|
|
|
"eq",
|
|
|
|
)))
|
|
|
|
}
|
|
|
|
BinaryOperator::Neq => todo!(),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
Expr::Let { bindings, body } => {
|
|
|
|
self.env.push();
|
2021-03-13 19:12:03 +01:00
|
|
|
for Binding { ident, body, .. } in bindings {
|
|
|
|
let val = self.codegen_expr(body)?;
|
|
|
|
self.env.set(ident, val);
|
2021-03-07 21:29:59 +01:00
|
|
|
}
|
|
|
|
let res = self.codegen_expr(body);
|
|
|
|
self.env.pop();
|
|
|
|
res
|
|
|
|
}
|
|
|
|
Expr::If {
|
|
|
|
condition,
|
|
|
|
then,
|
|
|
|
else_,
|
|
|
|
} => {
|
|
|
|
let then_block = self.append_basic_block("then");
|
|
|
|
let else_block = self.append_basic_block("else");
|
|
|
|
let join_block = self.append_basic_block("join");
|
|
|
|
let condition = self.codegen_expr(condition)?;
|
|
|
|
self.builder.build_conditional_branch(
|
|
|
|
condition.into_int_value(),
|
|
|
|
then_block,
|
|
|
|
else_block,
|
|
|
|
);
|
|
|
|
self.builder.position_at_end(then_block);
|
|
|
|
let then_res = self.codegen_expr(then)?;
|
|
|
|
self.builder.build_unconditional_branch(join_block);
|
|
|
|
|
|
|
|
self.builder.position_at_end(else_block);
|
|
|
|
let else_res = self.codegen_expr(else_)?;
|
|
|
|
self.builder.build_unconditional_branch(join_block);
|
|
|
|
|
|
|
|
self.builder.position_at_end(join_block);
|
|
|
|
let phi = self.builder.build_phi(self.context.i64_type(), "join");
|
2021-03-08 06:04:44 +01:00
|
|
|
phi.add_incoming(&[
|
|
|
|
(&BasicValueEnum::try_from(then_res).unwrap(), then_block),
|
|
|
|
(&BasicValueEnum::try_from(else_res).unwrap(), else_block),
|
|
|
|
]);
|
|
|
|
Ok(phi.as_basic_value().into())
|
|
|
|
}
|
|
|
|
Expr::Call { fun, args } => {
|
|
|
|
if let Expr::Ident(id) = &**fun {
|
|
|
|
let function = self
|
|
|
|
.module
|
|
|
|
.get_function(id.into())
|
|
|
|
.or_else(|| self.env.resolve(id)?.clone().try_into().ok())
|
|
|
|
.ok_or_else(|| Error::UndefinedVariable(id.to_owned()))?;
|
|
|
|
let args = args
|
|
|
|
.iter()
|
|
|
|
.map(|arg| Ok(self.codegen_expr(arg)?.try_into().unwrap()))
|
|
|
|
.collect::<Result<Vec<_>>>()?;
|
|
|
|
Ok(self
|
|
|
|
.builder
|
|
|
|
.build_call(function, &args, "call")
|
|
|
|
.try_as_basic_value()
|
|
|
|
.left()
|
|
|
|
.unwrap()
|
|
|
|
.into())
|
|
|
|
} else {
|
|
|
|
todo!()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
Expr::Fun(fun) => {
|
|
|
|
let Fun { args, body } = &**fun;
|
|
|
|
let fname = self.fresh_ident("f");
|
|
|
|
let cur_block = self.builder.get_insert_block().unwrap();
|
|
|
|
let env = self.env.save(); // TODO: closures
|
|
|
|
let function = self.codegen_function(&fname, args, body)?;
|
|
|
|
self.builder.position_at_end(cur_block);
|
|
|
|
self.env.restore(env);
|
|
|
|
Ok(function.into())
|
2021-03-07 21:29:59 +01:00
|
|
|
}
|
2021-03-13 19:12:03 +01:00
|
|
|
Expr::Ascription { expr, .. } => self.codegen_expr(expr),
|
2021-03-07 21:29:59 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-03-08 06:04:44 +01:00
|
|
|
pub fn codegen_function(
|
|
|
|
&mut self,
|
|
|
|
name: &str,
|
|
|
|
args: &'ast [Ident<'ast>],
|
|
|
|
body: &'ast Expr<'ast>,
|
|
|
|
) -> Result<FunctionValue<'ctx>> {
|
|
|
|
let i64_type = self.context.i64_type();
|
|
|
|
self.new_function(
|
|
|
|
name,
|
|
|
|
i64_type.fn_type(
|
|
|
|
args.iter()
|
|
|
|
.map(|_| i64_type.into())
|
|
|
|
.collect::<Vec<_>>()
|
|
|
|
.as_slice(),
|
|
|
|
false,
|
|
|
|
),
|
|
|
|
);
|
|
|
|
self.env.push();
|
|
|
|
for (i, arg) in args.iter().enumerate() {
|
|
|
|
self.env.set(
|
|
|
|
arg,
|
|
|
|
self.cur_function().get_nth_param(i as u32).unwrap().into(),
|
|
|
|
);
|
|
|
|
}
|
|
|
|
let res = self.codegen_expr(body)?.try_into().unwrap();
|
|
|
|
self.env.pop();
|
|
|
|
Ok(self.finish_function(&res))
|
|
|
|
}
|
|
|
|
|
2021-03-07 21:29:59 +01:00
|
|
|
pub fn codegen_decl(&mut self, decl: &'ast Decl<'ast>) -> Result<()> {
|
|
|
|
match decl {
|
2021-03-08 06:04:44 +01:00
|
|
|
Decl::Fun {
|
|
|
|
name,
|
|
|
|
body: Fun { args, body },
|
|
|
|
} => {
|
|
|
|
self.codegen_function(name.into(), args, body)?;
|
2021-03-07 21:29:59 +01:00
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn codegen_main(&mut self, expr: &'ast Expr<'ast>) -> Result<()> {
|
|
|
|
self.new_function("main", self.context.i64_type().fn_type(&[], false));
|
2021-03-08 06:04:44 +01:00
|
|
|
let res = self.codegen_expr(expr)?.try_into().unwrap();
|
2021-03-07 21:29:59 +01:00
|
|
|
self.finish_function(&res);
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn print_to_file<P>(&self, path: P) -> Result<()>
|
|
|
|
where
|
|
|
|
P: AsRef<Path>,
|
|
|
|
{
|
|
|
|
Ok(self.module.print_to_file(path)?)
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn binary_to_file<P>(&self, path: P) -> Result<()>
|
|
|
|
where
|
|
|
|
P: AsRef<Path>,
|
|
|
|
{
|
|
|
|
if self.module.write_bitcode_to_path(path.as_ref()) {
|
|
|
|
Ok(())
|
|
|
|
} else {
|
|
|
|
Err(Error::LLVMError(
|
|
|
|
"Error writing bitcode to output path".to_owned(),
|
|
|
|
))
|
|
|
|
}
|
|
|
|
}
|
2021-03-08 06:04:44 +01:00
|
|
|
|
|
|
|
fn fresh_ident(&mut self, prefix: &str) -> String {
|
|
|
|
self.identifier_counter += 1;
|
|
|
|
format!("{}{}", prefix, self.identifier_counter)
|
|
|
|
}
|
|
|
|
|
|
|
|
fn cur_function(&self) -> &FunctionValue<'ctx> {
|
|
|
|
self.function_stack.last().unwrap()
|
|
|
|
}
|
2021-03-07 21:29:59 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
#[cfg(test)]
|
|
|
|
mod tests {
|
|
|
|
use inkwell::execution_engine::JitFunction;
|
|
|
|
use inkwell::OptimizationLevel;
|
|
|
|
|
|
|
|
use super::*;
|
|
|
|
|
|
|
|
fn jit_eval<T>(expr: &str) -> anyhow::Result<T> {
|
|
|
|
let expr = crate::parser::expr(expr).unwrap().1;
|
|
|
|
|
|
|
|
let context = Context::create();
|
|
|
|
let mut codegen = Codegen::new(&context, "test");
|
|
|
|
let execution_engine = codegen
|
|
|
|
.module
|
|
|
|
.create_jit_execution_engine(OptimizationLevel::None)
|
|
|
|
.unwrap();
|
|
|
|
|
2021-03-08 06:04:44 +01:00
|
|
|
codegen.codegen_function("test", &[], &expr)?;
|
2021-03-07 21:29:59 +01:00
|
|
|
|
|
|
|
unsafe {
|
|
|
|
let fun: JitFunction<unsafe extern "C" fn() -> T> =
|
|
|
|
execution_engine.get_function("test")?;
|
|
|
|
Ok(fun.call())
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
#[test]
|
|
|
|
fn add_literals() {
|
|
|
|
assert_eq!(jit_eval::<i64>("1 + 2").unwrap(), 3);
|
|
|
|
}
|
|
|
|
|
|
|
|
#[test]
|
|
|
|
fn variable_shadowing() {
|
|
|
|
assert_eq!(
|
|
|
|
jit_eval::<i64>("let x = 1 in (let x = 2 in x) + x").unwrap(),
|
|
|
|
3
|
|
|
|
);
|
|
|
|
}
|
|
|
|
|
|
|
|
#[test]
|
|
|
|
fn eq() {
|
|
|
|
assert_eq!(
|
|
|
|
jit_eval::<i64>("let x = 1 in if x == 1 then 2 else 4").unwrap(),
|
|
|
|
2
|
|
|
|
);
|
|
|
|
}
|
2021-03-08 06:04:44 +01:00
|
|
|
|
|
|
|
#[test]
|
|
|
|
fn function_call() {
|
|
|
|
let res = jit_eval::<i64>("let id = fn x = x in id 1").unwrap();
|
|
|
|
assert_eq!(res, 1);
|
|
|
|
}
|
2021-03-07 21:29:59 +01:00
|
|
|
}
|