2021-08-11 14:37:26 +08:00
|
|
|
use crate::{
|
|
|
|
symbol_resolver::SymbolResolver,
|
|
|
|
top_level::{TopLevelContext, TopLevelDef},
|
|
|
|
typecheck::{
|
|
|
|
type_inferencer::PrimitiveStore,
|
|
|
|
typedef::{FunSignature, Type, TypeEnum, Unifier},
|
|
|
|
},
|
|
|
|
};
|
|
|
|
use inkwell::{
|
|
|
|
basic_block::BasicBlock,
|
|
|
|
builder::Builder,
|
|
|
|
context::Context,
|
|
|
|
module::Module,
|
|
|
|
types::{BasicType, BasicTypeEnum},
|
|
|
|
values::PointerValue,
|
|
|
|
AddressSpace,
|
|
|
|
};
|
|
|
|
use itertools::Itertools;
|
2021-08-12 13:55:15 +08:00
|
|
|
use rustpython_parser::ast::Stmt;
|
2021-08-11 14:37:26 +08:00
|
|
|
use std::collections::HashMap;
|
|
|
|
use std::sync::Arc;
|
|
|
|
|
2021-08-05 14:55:23 +08:00
|
|
|
mod expr;
|
2021-08-09 15:39:50 +08:00
|
|
|
mod stmt;
|
2021-08-11 14:37:26 +08:00
|
|
|
|
2021-08-12 13:55:15 +08:00
|
|
|
#[cfg(test)]
|
|
|
|
mod test;
|
|
|
|
|
|
|
|
pub struct CodeGenContext<'ctx, 'a> {
|
2021-08-11 14:37:26 +08:00
|
|
|
pub ctx: &'ctx Context,
|
|
|
|
pub builder: Builder<'ctx>,
|
|
|
|
pub module: Module<'ctx>,
|
2021-08-12 13:55:15 +08:00
|
|
|
pub top_level: &'a TopLevelContext,
|
2021-08-11 14:37:26 +08:00
|
|
|
pub unifier: Unifier,
|
2021-08-12 13:55:15 +08:00
|
|
|
pub resolver: Arc<dyn SymbolResolver>,
|
2021-08-11 14:37:26 +08:00
|
|
|
pub var_assignment: HashMap<String, PointerValue<'ctx>>,
|
|
|
|
pub type_cache: HashMap<Type, BasicTypeEnum<'ctx>>,
|
|
|
|
pub primitives: PrimitiveStore,
|
|
|
|
// stores the alloca for variables
|
|
|
|
pub init_bb: BasicBlock<'ctx>,
|
|
|
|
// where continue and break should go to respectively
|
|
|
|
// the first one is the test_bb, and the second one is bb after the loop
|
|
|
|
pub loop_bb: Option<(BasicBlock<'ctx>, BasicBlock<'ctx>)>,
|
|
|
|
}
|
|
|
|
|
|
|
|
pub struct CodeGenTask {
|
|
|
|
pub subst: Vec<(Type, Type)>,
|
|
|
|
pub symbol_name: String,
|
|
|
|
pub signature: FunSignature,
|
2021-08-12 13:55:15 +08:00
|
|
|
pub body: Vec<Stmt<Option<Type>>>,
|
2021-08-11 14:37:26 +08:00
|
|
|
pub unifier_index: usize,
|
2021-08-12 13:55:15 +08:00
|
|
|
pub resolver: Arc<dyn SymbolResolver>,
|
2021-08-11 14:37:26 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
fn get_llvm_type<'ctx>(
|
|
|
|
ctx: &'ctx Context,
|
|
|
|
unifier: &mut Unifier,
|
|
|
|
top_level: &TopLevelContext,
|
|
|
|
type_cache: &mut HashMap<Type, BasicTypeEnum<'ctx>>,
|
|
|
|
ty: Type,
|
|
|
|
) -> BasicTypeEnum<'ctx> {
|
|
|
|
use TypeEnum::*;
|
|
|
|
// we assume the type cache should already contain primitive types,
|
|
|
|
// and they should be passed by value instead of passing as pointer.
|
2021-08-12 16:36:23 +08:00
|
|
|
type_cache.get(&unifier.get_representative(ty)).cloned().unwrap_or_else(|| {
|
|
|
|
match &*unifier.get_ty(ty) {
|
|
|
|
TObj { obj_id, fields, .. } => {
|
|
|
|
// a struct with fields in the order of declaration
|
|
|
|
let defs = top_level.definitions.read();
|
|
|
|
let definition = defs.get(obj_id.0).unwrap();
|
|
|
|
let ty = if let TopLevelDef::Class { fields: fields_list, .. } = &*definition.read()
|
|
|
|
{
|
|
|
|
let fields = fields.borrow();
|
|
|
|
let fields = fields_list
|
|
|
|
.iter()
|
|
|
|
.map(|f| get_llvm_type(ctx, unifier, top_level, type_cache, fields[&f.0]))
|
|
|
|
.collect_vec();
|
|
|
|
ctx.struct_type(&fields, false).ptr_type(AddressSpace::Generic).into()
|
|
|
|
} else {
|
|
|
|
unreachable!()
|
|
|
|
};
|
|
|
|
ty
|
|
|
|
}
|
|
|
|
TTuple { ty } => {
|
|
|
|
// a struct with fields in the order present in the tuple
|
|
|
|
let fields = ty
|
2021-08-11 14:37:26 +08:00
|
|
|
.iter()
|
2021-08-12 16:36:23 +08:00
|
|
|
.map(|ty| get_llvm_type(ctx, unifier, top_level, type_cache, *ty))
|
2021-08-11 14:37:26 +08:00
|
|
|
.collect_vec();
|
|
|
|
ctx.struct_type(&fields, false).ptr_type(AddressSpace::Generic).into()
|
2021-08-12 16:36:23 +08:00
|
|
|
}
|
|
|
|
TList { ty } => {
|
|
|
|
// a struct with an integer and a pointer to an array
|
|
|
|
let element_type = get_llvm_type(ctx, unifier, top_level, type_cache, *ty);
|
|
|
|
let fields =
|
|
|
|
[ctx.i32_type().into(), element_type.ptr_type(AddressSpace::Generic).into()];
|
|
|
|
ctx.struct_type(&fields, false).ptr_type(AddressSpace::Generic).into()
|
|
|
|
}
|
|
|
|
TVirtual { .. } => unimplemented!(),
|
|
|
|
_ => unreachable!(),
|
2021-08-11 14:37:26 +08:00
|
|
|
}
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
2021-08-12 16:36:23 +08:00
|
|
|
pub fn gen_func<'ctx>(
|
|
|
|
context: &'ctx Context,
|
|
|
|
builder: Builder<'ctx>,
|
|
|
|
module: Module<'ctx>,
|
|
|
|
task: CodeGenTask,
|
|
|
|
top_level_ctx: Arc<TopLevelContext>,
|
|
|
|
) -> Module<'ctx> {
|
2021-08-11 14:37:26 +08:00
|
|
|
// unwrap_or(0) is for unit tests without using rayon
|
|
|
|
let (mut unifier, primitives) = {
|
|
|
|
let unifiers = top_level_ctx.unifiers.read();
|
|
|
|
let (unifier, primitives) = &unifiers[task.unifier_index];
|
|
|
|
(Unifier::from_shared_unifier(unifier), *primitives)
|
|
|
|
};
|
|
|
|
|
|
|
|
for (a, b) in task.subst.iter() {
|
|
|
|
// this should be unification between variables and concrete types
|
|
|
|
// and should not cause any problem...
|
|
|
|
unifier.unify(*a, *b).unwrap();
|
|
|
|
}
|
|
|
|
|
|
|
|
// rebuild primitive store with unique representatives
|
|
|
|
let primitives = PrimitiveStore {
|
|
|
|
int32: unifier.get_representative(primitives.int32),
|
|
|
|
int64: unifier.get_representative(primitives.int64),
|
|
|
|
float: unifier.get_representative(primitives.float),
|
|
|
|
bool: unifier.get_representative(primitives.bool),
|
|
|
|
none: unifier.get_representative(primitives.none),
|
|
|
|
};
|
|
|
|
|
|
|
|
let mut type_cache: HashMap<_, _> = [
|
2021-08-12 13:55:15 +08:00
|
|
|
(unifier.get_representative(primitives.int32), context.i32_type().into()),
|
|
|
|
(unifier.get_representative(primitives.int64), context.i64_type().into()),
|
|
|
|
(unifier.get_representative(primitives.float), context.f64_type().into()),
|
|
|
|
(unifier.get_representative(primitives.bool), context.bool_type().into()),
|
2021-08-11 14:37:26 +08:00
|
|
|
]
|
|
|
|
.iter()
|
|
|
|
.cloned()
|
|
|
|
.collect();
|
|
|
|
|
|
|
|
let params = task
|
|
|
|
.signature
|
|
|
|
.args
|
|
|
|
.iter()
|
|
|
|
.map(|arg| {
|
|
|
|
get_llvm_type(&context, &mut unifier, top_level_ctx.as_ref(), &mut type_cache, arg.ty)
|
|
|
|
})
|
|
|
|
.collect_vec();
|
|
|
|
|
|
|
|
let fn_type = if unifier.unioned(task.signature.ret, primitives.none) {
|
|
|
|
context.void_type().fn_type(¶ms, false)
|
|
|
|
} else {
|
|
|
|
get_llvm_type(
|
|
|
|
&context,
|
|
|
|
&mut unifier,
|
|
|
|
top_level_ctx.as_ref(),
|
|
|
|
&mut type_cache,
|
|
|
|
task.signature.ret,
|
|
|
|
)
|
|
|
|
.fn_type(¶ms, false)
|
|
|
|
};
|
|
|
|
|
|
|
|
let fn_val = module.add_function(&task.symbol_name, fn_type, None);
|
|
|
|
let init_bb = context.append_basic_block(fn_val, "init");
|
|
|
|
builder.position_at_end(init_bb);
|
|
|
|
let body_bb = context.append_basic_block(fn_val, "body");
|
|
|
|
|
|
|
|
let mut var_assignment = HashMap::new();
|
|
|
|
for (n, arg) in task.signature.args.iter().enumerate() {
|
|
|
|
let param = fn_val.get_nth_param(n as u32).unwrap();
|
|
|
|
let alloca = builder.build_alloca(
|
|
|
|
get_llvm_type(&context, &mut unifier, top_level_ctx.as_ref(), &mut type_cache, arg.ty),
|
|
|
|
&arg.name,
|
|
|
|
);
|
|
|
|
builder.build_store(alloca, param);
|
|
|
|
var_assignment.insert(arg.name.clone(), alloca);
|
|
|
|
}
|
|
|
|
builder.build_unconditional_branch(body_bb);
|
|
|
|
builder.position_at_end(body_bb);
|
|
|
|
|
|
|
|
let mut code_gen_context = CodeGenContext {
|
|
|
|
ctx: &context,
|
|
|
|
resolver: task.resolver,
|
|
|
|
top_level: top_level_ctx.as_ref(),
|
|
|
|
loop_bb: None,
|
|
|
|
var_assignment,
|
|
|
|
type_cache,
|
|
|
|
primitives,
|
|
|
|
init_bb,
|
|
|
|
builder,
|
|
|
|
module,
|
|
|
|
unifier,
|
|
|
|
};
|
|
|
|
|
2021-08-12 13:55:15 +08:00
|
|
|
for stmt in task.body.iter() {
|
|
|
|
code_gen_context.gen_stmt(stmt);
|
2021-08-11 14:37:26 +08:00
|
|
|
}
|
2021-08-12 13:55:15 +08:00
|
|
|
|
|
|
|
code_gen_context.module
|
2021-08-11 14:37:26 +08:00
|
|
|
}
|