mirror of
https://github.com/pseXperiments/clookup.git
synced 2026-01-08 03:33:51 -05:00
82 lines
3.4 KiB
Rust
82 lines
3.4 KiB
Rust
extern crate bindgen;
|
|
extern crate cc;
|
|
|
|
use std::{env, path::PathBuf, process::Command};
|
|
|
|
use bindgen::CargoCallbacks;
|
|
use regex::Regex;
|
|
|
|
fn main() {
|
|
// Tell cargo to invalidate the built crate whenever files of interest changes.
|
|
println!("cargo:rerun-if-changed=cuda-sumcheck/sumcheck/src/gpu/cuda/kernels/multilinear.cu");
|
|
println!("cargo:rerun-if-changed=cuda-sumcheck/sumcheck/src/gpu/cuda/kernels/sumcheck.cu");
|
|
|
|
let out_dir = PathBuf::from(env::var("OUT_DIR").unwrap());
|
|
|
|
// Specify the desired architecture version.
|
|
let arch = "compute_86"; // For example, using SM 8.6 (Ampere architecture).
|
|
let code = "sm_86"; // For the same SM 8.6 (Ampere architecture).
|
|
let compiler = "clang-16"; // Compiler for nvcc
|
|
let language_std = "c++20"; // Language standard in which device functions are written
|
|
|
|
// build the cuda kernels
|
|
let cuda_src = [
|
|
"cuda-sumcheck/sumcheck/src/gpu/cuda/kernels/multilinear.cu",
|
|
"cuda-sumcheck/sumcheck/src/gpu/cuda/kernels/sumcheck.cu",
|
|
]
|
|
.map(|path| PathBuf::from(path));
|
|
let ptx_file = ["multilinear.ptx", "sumcheck.ptx"].map(|file| out_dir.join(file));
|
|
|
|
for (cuda_src, ptx_file) in cuda_src.into_iter().zip(ptx_file) {
|
|
let nvcc_status = Command::new("nvcc")
|
|
.arg("-ptx")
|
|
.arg("-o")
|
|
.arg(&ptx_file)
|
|
.arg(&cuda_src)
|
|
.arg(format!("-arch={}", arch))
|
|
.arg(format!("-code={}", code))
|
|
.arg(format!("-ccbin={}", compiler))
|
|
.arg(format!("-std={}", language_std))
|
|
.arg("-allow-unsupported-compiler") // workaround to use clang-16 compiler with nvcc
|
|
.arg("--expt-relaxed-constexpr")
|
|
.status()
|
|
.unwrap();
|
|
|
|
assert!(
|
|
nvcc_status.success(),
|
|
"Failed to compile CUDA source to PTX."
|
|
);
|
|
}
|
|
|
|
// The bindgen::Builder is the main entry point
|
|
// to bindgen, and lets you build up options for
|
|
// the resulting bindings.
|
|
let bindings = bindgen::Builder::default()
|
|
// The input header we would like to generate
|
|
// bindings for.
|
|
.header("cuda-sumcheck/sumcheck/src/gpu/cuda/includes/wrapper.h")
|
|
// Tell cargo to invalidate the built crate whenever any of the
|
|
// included header files changed.
|
|
.parse_callbacks(Box::new(CargoCallbacks))
|
|
// we use "no_copy" and "no_debug" here because we don't know if we can safely generate them for our structs in C code (they may contain raw pointers)
|
|
.no_copy("*")
|
|
.no_debug("*")
|
|
// Finish the builder and generate the bindings.
|
|
.generate()
|
|
// Unwrap the Result and panic on failure.
|
|
.expect("Unable to generate bindings");
|
|
|
|
// we need to make modifications to the generated code
|
|
let generated_bindings = bindings.to_string();
|
|
|
|
// Regex to find raw pointers to float and replace them with CudaSlice<f32>
|
|
// You can copy this regex to add/modify other types of pointers, for example "*mut i32"
|
|
let pointer_regex = Regex::new(r"\*mut f32").unwrap();
|
|
let modified_bindings = pointer_regex.replace_all(&generated_bindings, "CudaSlice<f32>");
|
|
|
|
// Write the bindings to the $OUT_DIR/bindings.rs file.
|
|
let out_path = PathBuf::from(env::var("OUT_DIR").unwrap());
|
|
std::fs::write(out_path.join("bindings.rs"), modified_bindings.as_bytes())
|
|
.expect("Failed to write bindings");
|
|
}
|