charon_driver/driver.rs
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261
//! Run the rustc compiler with our custom options and hooks.
use crate::translate::translate_crate_to_ullbc;
use crate::CharonFailure;
use charon_lib::options::CliOpts;
use charon_lib::transform::TransformCtx;
use rustc_driver::{Callbacks, Compilation};
use rustc_interface::Config;
use rustc_interface::{interface::Compiler, Queries};
use rustc_middle::util::Providers;
use rustc_session::config::{OutputType, OutputTypes, Polonius};
use std::ops::Deref;
use std::sync::atomic::{AtomicBool, Ordering};
use std::{env, fmt};
/// Helper that runs the compiler and catches its fatal errors.
fn run_compiler_with_callbacks(
args: Vec<String>,
callbacks: &mut (dyn Callbacks + Send),
) -> Result<(), CharonFailure> {
rustc_driver::catch_fatal_errors(|| rustc_driver::RunCompiler::new(&args, callbacks).run())
.map_err(|_| CharonFailure::RustcError)?
.map_err(|_| CharonFailure::RustcError)?;
Ok(())
}
/// Tweak options to get usable MIR even for foreign crates.
fn set_mir_options(config: &mut Config) {
config.opts.unstable_opts.always_encode_mir = true;
config.opts.unstable_opts.mir_opt_level = Some(0);
config.opts.unstable_opts.mir_emit_retag = true;
let disabled_mir_passes = ["CheckAlignment"];
for pass in disabled_mir_passes {
config
.opts
.unstable_opts
.mir_enable_passes
.push((pass.to_owned(), false));
}
}
/// Don't even try to codegen. This avoids errors due to checking if the output filename is
/// available (despite the fact that we won't emit it because we stop compilation early).
fn set_no_codegen(config: &mut Config) {
config.opts.unstable_opts.no_codegen = true;
// Only emit metadata.
config.opts.output_types = OutputTypes::new(&[(OutputType::Metadata, None)]);
}
/// Always compile in release mode: in effect, we want to analyze the released
/// code. Also, rustc inserts a lot of dynamic checks in debug mode, that we
/// have to clean. Full list of `--release` flags:
/// https://doc.rust-lang.org/cargo/reference/profiles.html#release
fn set_release_mode(config: &mut Config) {
let cg = &mut config.opts.cg;
cg.opt_level = "3".into();
cg.overflow_checks = Some(false);
config.opts.debug_assertions = false;
}
// We use a static to be able to pass data to `override_queries`.
static SKIP_BORROWCK: AtomicBool = AtomicBool::new(false);
fn set_skip_borrowck() {
SKIP_BORROWCK.store(true, Ordering::SeqCst);
}
fn skip_borrowck_if_set(providers: &mut Providers) {
if SKIP_BORROWCK.load(Ordering::SeqCst) {
providers.mir_borrowck = |tcx, def_id| {
let (input_body, _promoted) = tcx.mir_promoted(def_id);
let input_body = &input_body.borrow();
// Empty result, which is what is used for tainted or custom_mir bodies.
let result = rustc_middle::mir::BorrowCheckResult {
concrete_opaque_types: Default::default(),
closure_requirements: None,
used_mut_upvars: Default::default(),
tainted_by_errors: input_body.tainted_by_errors,
};
tcx.arena.alloc(result)
}
}
}
fn setup_compiler(config: &mut Config, options: &CliOpts, do_translate: bool) {
if do_translate {
if options.skip_borrowck {
// We use a static to be able to pass data to `override_queries`.
set_skip_borrowck();
}
config.override_queries = Some(|_sess, providers| {
skip_borrowck_if_set(providers);
// TODO: catch the MIR in-flight to avoid stealing issues?
// providers.mir_built = |tcx, def_id| {
// let mir = (rustc_interface::DEFAULT_QUERY_PROVIDERS.mir_built)(tcx, def_id);
// let mut mir = mir.steal();
// // use the mir
// tcx.alloc_steal_mir(mir)
// };
});
set_release_mode(config);
set_no_codegen(config);
if options.use_polonius {
config.opts.unstable_opts.polonius = Polonius::Legacy;
}
}
set_mir_options(config);
}
/// Run the rustc driver with our custom hooks. Returns `None` if the crate was not compiled with
/// charon (e.g. because it was a dependency). Otherwise returns the translated crate, ready for
/// post-processing transformations.
pub fn run_rustc_driver(options: &CliOpts) -> Result<Option<TransformCtx>, CharonFailure> {
// Retreive the command-line arguments pased to `charon_driver`. The first arg is the path to
// the current executable, we skip it.
let mut compiler_args: Vec<String> = env::args().skip(1).collect();
// When called using cargo, we tell cargo to use `charon-driver` by setting the `RUSTC_WRAPPER`
// env var. This uses `charon-driver` for all the crates being compiled.
// We may however not want to be calling charon on all crates; `CARGO_PRIMARY_PACKAGE` tells us
// whether the crate was specifically selected or is a dependency.
let is_workspace_dependency =
env::var("CHARON_USING_CARGO").is_ok() && !env::var("CARGO_PRIMARY_PACKAGE").is_ok();
// Determines if we are being invoked to build a crate for the "target" architecture, in
// contrast to the "host" architecture. Host crates are for build scripts and proc macros and
// still need to be built like normal; target crates need to be processed by Charon.
//
// Currently, we detect this by checking for "--target=", which is never set for host crates.
// This matches what Miri does, which hopefully makes it reliable enough. This relies on us
// always invoking cargo itself with `--target`, which `charon` ensures.
let is_target = arg_values(&compiler_args, "--target").next().is_some();
// Whether this is the crate we want to translate.
let is_selected_crate = !is_workspace_dependency && is_target;
let output = if !is_selected_crate {
trace!("Skipping charon; running compiler normally instead.");
// Run the compiler normally.
run_compiler_with_callbacks(compiler_args, &mut RunCompilerNormallyCallbacks { options })?;
None
} else {
for extra_flag in options.rustc_args.iter().cloned() {
compiler_args.push(extra_flag);
}
// Call the Rust compiler with our custom callback.
let mut callback = CharonCallbacks {
options,
transform_ctx: None,
};
run_compiler_with_callbacks(compiler_args, &mut callback)?;
// If `transform_ctx` is not set here, there was a fatal error.
let ctx = callback.transform_ctx.ok_or(CharonFailure::RustcError)?;
Some(ctx)
};
Ok(output)
}
/// The callbacks for Charon
pub struct CharonCallbacks<'a> {
options: &'a CliOpts,
/// This is to be filled during the extraction; it contains the translated crate.
transform_ctx: Option<TransformCtx>,
}
impl<'a> Callbacks for CharonCallbacks<'a> {
fn config(&mut self, config: &mut Config) {
setup_compiler(config, self.options, true);
}
/// The MIR is modified in place: borrow-checking requires the "promoted" MIR, which causes the
/// "built" MIR (which results from the conversion to HIR to MIR) to become unaccessible.
/// Because we require built MIR at the moment, we hook ourselves before MIR-based analysis
/// passes.
fn after_expansion<'tcx>(
&mut self,
compiler: &Compiler,
queries: &'tcx Queries<'tcx>,
) -> Compilation {
// Set up our own `DefId` debug routine.
rustc_hir::def_id::DEF_ID_DEBUG
.swap(&(def_id_debug as fn(_, &mut fmt::Formatter<'_>) -> _));
let transform_ctx = queries.global_ctxt().unwrap().get_mut().enter(|tcx| {
translate_crate_to_ullbc::translate(&self.options, tcx, compiler.sess.sysroot.clone())
});
self.transform_ctx = Some(transform_ctx);
Compilation::Continue
}
fn after_analysis<'tcx>(
&mut self,
_: &rustc_interface::interface::Compiler,
_: &'tcx Queries<'tcx>,
) -> Compilation {
// Don't continue to codegen etc.
Compilation::Stop
}
}
/// Dummy callbacks used to run the compiler normally when we shouldn't be analyzing the crate.
pub struct RunCompilerNormallyCallbacks<'a> {
options: &'a CliOpts,
}
impl<'a> Callbacks for RunCompilerNormallyCallbacks<'a> {
fn config(&mut self, config: &mut Config) {
setup_compiler(config, self.options, false);
}
}
/// Returns the values of the command-line options that match `find_arg`. The options are built-in
/// to be of the form `--arg=value` or `--arg value`.
fn arg_values<'a, T: Deref<Target = str>>(
args: &'a [T],
needle: &'a str,
) -> impl Iterator<Item = &'a str> {
struct ArgFilter<'a, T> {
args: std::slice::Iter<'a, T>,
needle: &'a str,
}
impl<'a, T: Deref<Target = str>> Iterator for ArgFilter<'a, T> {
type Item = &'a str;
fn next(&mut self) -> Option<Self::Item> {
while let Some(arg) = self.args.next() {
let mut split_arg = arg.splitn(2, '=');
if split_arg.next() == Some(self.needle) {
return match split_arg.next() {
// `--arg=value` form
arg @ Some(_) => arg,
// `--arg value` form
None => self.args.next().map(|x| x.deref()),
};
}
}
None
}
}
ArgFilter {
args: args.iter(),
needle,
}
}
/// Custom `DefId` debug routine that doesn't print unstable values like ids and hashes.
fn def_id_debug(def_id: rustc_hir::def_id::DefId, f: &mut fmt::Formatter<'_>) -> fmt::Result {
rustc_middle::ty::tls::with_opt(|opt_tcx| {
if let Some(tcx) = opt_tcx {
let crate_name = if def_id.is_local() {
tcx.crate_name(rustc_hir::def_id::LOCAL_CRATE)
} else {
tcx.cstore_untracked().crate_name(def_id.krate)
};
write!(
f,
"{}{}",
crate_name,
tcx.def_path(def_id).to_string_no_crate_verbose()
)?;
} else {
write!(f, "<can't access `tcx` to print `DefId` path>")?;
}
Ok(())
})
}