2022-01-08 22:16:55 +08:00
|
|
|
use regex::Regex;
|
|
|
|
use std::{
|
|
|
|
env,
|
2022-03-22 15:39:15 +08:00
|
|
|
fs::File,
|
2022-01-08 22:16:55 +08:00
|
|
|
io::Write,
|
2022-01-09 12:06:45 +08:00
|
|
|
path::Path,
|
2022-01-08 22:16:55 +08:00
|
|
|
process::{Command, Stdio},
|
|
|
|
};
|
|
|
|
|
|
|
|
fn main() {
|
2024-07-12 21:52:55 +08:00
|
|
|
// Define relevant directories
|
|
|
|
let out_dir = env::var("OUT_DIR").unwrap();
|
|
|
|
let out_dir = Path::new(&out_dir);
|
|
|
|
let irrt_dir = Path::new("irrt");
|
|
|
|
|
|
|
|
let irrt_cpp_path = irrt_dir.join("irrt.cpp");
|
2022-01-09 10:53:58 +08:00
|
|
|
|
|
|
|
/*
|
|
|
|
* HACK: Sadly, clang doesn't let us emit generic LLVM bitcode.
|
|
|
|
* Compiling for WASM32 and filtering the output with regex is the closest we can get.
|
|
|
|
*/
|
2024-03-06 12:57:20 +08:00
|
|
|
let flags: &[&str] = &[
|
2022-01-09 10:53:58 +08:00
|
|
|
"--target=wasm32",
|
2024-07-09 13:31:29 +08:00
|
|
|
"-x",
|
|
|
|
"c++",
|
2023-11-22 13:35:56 +08:00
|
|
|
"-fno-discard-value-names",
|
2024-07-05 17:24:57 +08:00
|
|
|
"-fno-exceptions",
|
|
|
|
"-fno-rtti",
|
2024-03-06 12:57:20 +08:00
|
|
|
match env::var("PROFILE").as_deref() {
|
|
|
|
Ok("debug") => "-O0",
|
|
|
|
Ok("release") => "-O3",
|
2024-03-11 14:25:37 +08:00
|
|
|
flavor => panic!("Unknown or missing build flavor {flavor:?}"),
|
2024-03-06 12:57:20 +08:00
|
|
|
},
|
2022-01-08 22:16:55 +08:00
|
|
|
"-emit-llvm",
|
|
|
|
"-S",
|
|
|
|
"-Wall",
|
|
|
|
"-Wextra",
|
2024-07-12 20:34:06 +08:00
|
|
|
"-Werror=return-type",
|
2022-01-08 22:16:55 +08:00
|
|
|
"-o",
|
|
|
|
"-",
|
2024-07-12 21:52:55 +08:00
|
|
|
irrt_cpp_path.to_str().unwrap(),
|
2022-01-08 22:16:55 +08:00
|
|
|
];
|
2023-12-08 17:43:32 +08:00
|
|
|
|
2024-07-12 21:52:55 +08:00
|
|
|
// Tell Cargo to rerun if any file under `irrt_dir` (recursive) changes
|
|
|
|
println!("cargo:rerun-if-changed={}", irrt_dir.to_str().unwrap());
|
2023-12-08 17:43:32 +08:00
|
|
|
|
2024-07-12 21:52:55 +08:00
|
|
|
// Compile IRRT and capture the LLVM IR output
|
2024-07-07 20:03:34 +08:00
|
|
|
let output = Command::new("clang-irrt")
|
2024-03-06 12:57:20 +08:00
|
|
|
.args(flags)
|
2022-01-08 22:16:55 +08:00
|
|
|
.output()
|
|
|
|
.map(|o| {
|
|
|
|
assert!(o.status.success(), "{}", std::str::from_utf8(&o.stderr).unwrap());
|
|
|
|
o
|
|
|
|
})
|
|
|
|
.unwrap();
|
|
|
|
|
2022-03-22 16:04:48 +08:00
|
|
|
// https://github.com/rust-lang/regex/issues/244
|
|
|
|
let output = std::str::from_utf8(&output.stdout).unwrap().replace("\r\n", "\n");
|
2022-01-08 22:16:55 +08:00
|
|
|
let mut filtered_output = String::with_capacity(output.len());
|
|
|
|
|
2024-07-12 21:52:55 +08:00
|
|
|
// Filter out irrelevant IR
|
|
|
|
//
|
|
|
|
// Regex:
|
|
|
|
// - `(?ms:^define.*?\}$)` captures LLVM `define` blocks
|
|
|
|
// - `(?m:^declare.*?$)` captures LLVM `declare` lines
|
2024-07-09 21:02:20 +08:00
|
|
|
// - `(?m:^%.+?=\s*type\s*\{.+?\}$)` captures LLVM `type` declarations
|
2024-07-13 14:02:50 +08:00
|
|
|
// - `(?m:^@.+?=.+$)` captures global constants
|
|
|
|
let regex_filter = Regex::new(
|
|
|
|
r"(?ms:^define.*?\}$)|(?m:^declare.*?$)|(?m:^%.+?=\s*type\s*\{.+?\}$)|(?m:^@.+?=.+$)",
|
|
|
|
)
|
|
|
|
.unwrap();
|
2022-03-22 16:04:48 +08:00
|
|
|
for f in regex_filter.captures_iter(&output) {
|
2023-12-06 11:05:42 +08:00
|
|
|
assert_eq!(f.len(), 1);
|
2022-01-08 22:16:55 +08:00
|
|
|
filtered_output.push_str(&f[0]);
|
|
|
|
filtered_output.push('\n');
|
|
|
|
}
|
|
|
|
|
|
|
|
let filtered_output = Regex::new("(#\\d+)|(, *![0-9A-Za-z.]+)|(![0-9A-Za-z.]+)|(!\".*?\")")
|
|
|
|
.unwrap()
|
|
|
|
.replace_all(&filtered_output, "");
|
|
|
|
|
2024-07-12 21:52:55 +08:00
|
|
|
// For debugging
|
|
|
|
// Doing `DEBUG_DUMP_IRRT=1 cargo build -p nac3core` dumps the LLVM IR generated
|
|
|
|
const DEBUG_DUMP_IRRT: &str = "DEBUG_DUMP_IRRT";
|
|
|
|
println!("cargo:rerun-if-env-changed={DEBUG_DUMP_IRRT}");
|
|
|
|
if env::var(DEBUG_DUMP_IRRT).is_ok() {
|
|
|
|
let mut file = File::create(out_dir.join("irrt.ll")).unwrap();
|
2022-03-22 15:39:15 +08:00
|
|
|
file.write_all(output.as_bytes()).unwrap();
|
2024-07-12 21:52:55 +08:00
|
|
|
|
|
|
|
let mut file = File::create(out_dir.join("irrt-filtered.ll")).unwrap();
|
2022-03-22 15:39:15 +08:00
|
|
|
file.write_all(filtered_output.as_bytes()).unwrap();
|
|
|
|
}
|
|
|
|
|
2024-07-12 21:52:55 +08:00
|
|
|
// Assemble the emitted and filtered IR to .bc
|
|
|
|
// That .bc will be integrated into nac3core's codegen
|
2023-11-25 20:15:29 +08:00
|
|
|
let mut llvm_as = Command::new("llvm-as-irrt")
|
2022-01-08 22:16:55 +08:00
|
|
|
.stdin(Stdio::piped())
|
|
|
|
.arg("-o")
|
2024-07-12 21:52:55 +08:00
|
|
|
.arg(out_dir.join("irrt.bc"))
|
2022-01-08 22:16:55 +08:00
|
|
|
.spawn()
|
|
|
|
.unwrap();
|
|
|
|
llvm_as.stdin.as_mut().unwrap().write_all(filtered_output.as_bytes()).unwrap();
|
2023-12-08 17:43:32 +08:00
|
|
|
assert!(llvm_as.wait().unwrap().success());
|
2022-01-08 22:16:55 +08:00
|
|
|
}
|