1 //! Main evaluator loop and setting up the initial stack frame.
8 use rustc_hir::def_id::DefId;
9 use rustc_middle::ty::{
11 layout::{LayoutCx, LayoutOf},
14 use rustc_target::spec::abi::Abi;
16 use rustc_session::config::EntryFnType;
18 use std::collections::HashSet;
22 #[derive(Copy, Clone, Debug, PartialEq)]
23 pub enum AlignmentCheck {
24 /// Do not check alignment.
26 /// Check alignment "symbolically", i.e., using only the requested alignment for an allocation and not its real base address.
28 /// Check alignment on the actual physical integer address.
32 #[derive(Copy, Clone, Debug, PartialEq)]
33 pub enum RejectOpWith {
34 /// Isolated op is rejected with an abort of the machine.
37 /// If not Abort, miri returns an error for an isolated op.
38 /// Following options determine if user should be warned about such error.
39 /// Do not print warning about rejected isolated op.
42 /// Print a warning about rejected isolated op, with backtrace.
45 /// Print a warning about rejected isolated op, without backtrace.
46 WarningWithoutBacktrace,
49 #[derive(Copy, Clone, Debug, PartialEq)]
51 /// Reject an op requiring communication with the host. By
52 /// default, miri rejects the op with an abort. If not, it returns
53 /// an error code, and prints a warning about it. Warning levels
54 /// are controlled by `RejectOpWith` enum.
57 /// Execute op requiring communication with the host, i.e. disable isolation.
61 #[derive(Copy, Clone, PartialEq, Eq)]
62 pub enum BacktraceStyle {
63 /// Prints a terser backtrace which ideally only contains relevant information.
65 /// Prints a backtrace with all possible information.
67 /// Prints only the frame that the error occurs in.
71 /// Configuration needed to spawn a Miri instance.
73 pub struct MiriConfig {
74 /// Determine if validity checking is enabled.
76 /// Determines if Stacked Borrows is enabled.
77 pub stacked_borrows: bool,
78 /// Controls alignment checking.
79 pub check_alignment: AlignmentCheck,
80 /// Controls integer and float validity initialization checking.
81 pub allow_uninit_numbers: bool,
82 /// Controls how we treat ptr2int and int2ptr transmutes.
83 pub allow_ptr_int_transmute: bool,
84 /// Controls function [ABI](Abi) checking.
86 /// Action for an op requiring communication with the host.
87 pub isolated_op: IsolatedOp,
88 /// Determines if memory leaks should be ignored.
89 pub ignore_leaks: bool,
90 /// Environment variables that should always be isolated from the host.
91 pub excluded_env_vars: Vec<String>,
92 /// Environment variables that should always be forwarded from the host.
93 pub forwarded_env_vars: Vec<String>,
94 /// Command-line arguments passed to the interpreted program.
95 pub args: Vec<String>,
96 /// The seed to use when non-determinism or randomness are required (e.g. ptr-to-int cast, `getrandom()`).
97 pub seed: Option<u64>,
98 /// The stacked borrows pointer ids to report about
99 pub tracked_pointer_tags: HashSet<PtrId>,
100 /// The stacked borrows call IDs to report about
101 pub tracked_call_ids: HashSet<CallId>,
102 /// The allocation ids to report about.
103 pub tracked_alloc_ids: HashSet<AllocId>,
104 /// Whether to track raw pointers in stacked borrows.
106 /// Determine if data race detection should be enabled
107 pub data_race_detector: bool,
108 /// Rate of spurious failures for compare_exchange_weak atomic operations,
109 /// between 0.0 and 1.0, defaulting to 0.8 (80% chance of failure).
110 pub cmpxchg_weak_failure_rate: f64,
111 /// If `Some`, enable the `measureme` profiler, writing results to a file
112 /// with the specified prefix.
113 pub measureme_out: Option<String>,
114 /// Panic when unsupported functionality is encountered.
115 pub panic_on_unsupported: bool,
116 /// Which style to use for printing backtraces.
117 pub backtrace_style: BacktraceStyle,
118 /// Which provenance to use for int2ptr casts
119 pub provenance_mode: ProvenanceMode,
120 /// Whether to ignore any output by the program. This is helpful when debugging miri
121 /// as its messages don't get intermingled with the program messages.
122 pub mute_stdout_stderr: bool,
125 impl Default for MiriConfig {
126 fn default() -> MiriConfig {
129 stacked_borrows: true,
130 check_alignment: AlignmentCheck::Int,
131 allow_uninit_numbers: false,
132 allow_ptr_int_transmute: false,
134 isolated_op: IsolatedOp::Reject(RejectOpWith::Abort),
136 excluded_env_vars: vec![],
137 forwarded_env_vars: vec![],
140 tracked_pointer_tags: HashSet::default(),
141 tracked_call_ids: HashSet::default(),
142 tracked_alloc_ids: HashSet::default(),
144 data_race_detector: true,
145 cmpxchg_weak_failure_rate: 0.8,
147 panic_on_unsupported: false,
148 backtrace_style: BacktraceStyle::Short,
149 provenance_mode: ProvenanceMode::Legacy,
150 mute_stdout_stderr: false,
155 /// Returns a freshly created `InterpCx`, along with an `MPlaceTy` representing
156 /// the location where the return value of the `start` function will be
158 /// Public because this is also used by `priroda`.
159 pub fn create_ecx<'mir, 'tcx: 'mir>(
162 entry_type: EntryFnType,
164 ) -> InterpResult<'tcx, (InterpCx<'mir, 'tcx, Evaluator<'mir, 'tcx>>, MPlaceTy<'tcx, Tag>)> {
165 let param_env = ty::ParamEnv::reveal_all();
166 let layout_cx = LayoutCx { tcx, param_env };
167 let mut ecx = InterpCx::new(
169 rustc_span::source_map::DUMMY_SP,
171 Evaluator::new(config, layout_cx),
174 // Capture the current interpreter stack state (which should be empty) so that we can emit
175 // allocation-tracking and tag-tracking diagnostics for allocations which are part of the
176 // early runtime setup.
177 let info = ecx.preprocess_diagnostics();
179 // Some parts of initialization require a full `InterpCx`.
180 Evaluator::late_init(&mut ecx, config)?;
182 // Make sure we have MIR. We check MIR for some stable monomorphic function in libcore.
183 let sentinel = ecx.try_resolve_path(&["core", "ascii", "escape_default"]);
184 if !matches!(sentinel, Some(s) if tcx.is_mir_available(s.def.def_id())) {
186 "the current sysroot was built without `-Zalways-encode-mir`, or libcore seems missing. \
187 Use `cargo miri setup` to prepare a sysroot that is suitable for Miri."
191 // Setup first stack frame.
192 let entry_instance = ty::Instance::mono(tcx, entry_id);
194 // First argument is constructed later, because it's skipped if the entry function uses #[start].
196 // Second argument (argc): length of `config.args`.
197 let argc = Scalar::from_machine_usize(u64::try_from(config.args.len()).unwrap(), &ecx);
198 // Third argument (`argv`): created from `config.args`.
200 // Put each argument in memory, collect pointers.
201 let mut argvs = Vec::<Immediate<Tag>>::new();
202 for arg in config.args.iter() {
203 // Make space for `0` terminator.
204 let size = u64::try_from(arg.len()).unwrap().checked_add(1).unwrap();
205 let arg_type = tcx.mk_array(tcx.types.u8, size);
207 ecx.allocate(ecx.layout_of(arg_type)?, MiriMemoryKind::Machine.into())?;
208 ecx.write_os_str_to_c_str(OsStr::new(arg), arg_place.ptr, size)?;
209 ecx.mark_immutable(&*arg_place);
210 argvs.push(arg_place.to_ref(&ecx));
212 // Make an array with all these pointers, in the Miri memory.
213 let argvs_layout = ecx.layout_of(
214 tcx.mk_array(tcx.mk_imm_ptr(tcx.types.u8), u64::try_from(argvs.len()).unwrap()),
216 let argvs_place = ecx.allocate(argvs_layout, MiriMemoryKind::Machine.into())?;
217 for (idx, arg) in argvs.into_iter().enumerate() {
218 let place = ecx.mplace_field(&argvs_place, idx)?;
219 ecx.write_immediate(arg, &place.into())?;
221 ecx.mark_immutable(&*argvs_place);
222 // A pointer to that place is the 3rd argument for main.
223 let argv = argvs_place.to_ref(&ecx);
224 // Store `argc` and `argv` for macOS `_NSGetArg{c,v}`.
227 ecx.allocate(ecx.machine.layouts.isize, MiriMemoryKind::Machine.into())?;
228 ecx.write_scalar(argc, &argc_place.into())?;
229 ecx.mark_immutable(&*argc_place);
230 ecx.machine.argc = Some(*argc_place);
232 let argv_place = ecx.allocate(
233 ecx.layout_of(tcx.mk_imm_ptr(tcx.types.unit))?,
234 MiriMemoryKind::Machine.into(),
236 ecx.write_immediate(argv, &argv_place.into())?;
237 ecx.mark_immutable(&*argv_place);
238 ecx.machine.argv = Some(*argv_place);
240 // Store command line as UTF-16 for Windows `GetCommandLineW`.
242 // Construct a command string with all the arguments.
243 let cmd_utf16: Vec<u16> = args_to_utf16_command_string(config.args.iter());
245 let cmd_type = tcx.mk_array(tcx.types.u16, u64::try_from(cmd_utf16.len()).unwrap());
247 ecx.allocate(ecx.layout_of(cmd_type)?, MiriMemoryKind::Machine.into())?;
248 ecx.machine.cmd_line = Some(*cmd_place);
249 // Store the UTF-16 string. We just allocated so we know the bounds are fine.
250 for (idx, &c) in cmd_utf16.iter().enumerate() {
251 let place = ecx.mplace_field(&cmd_place, idx)?;
252 ecx.write_scalar(Scalar::from_u16(c), &place.into())?;
254 ecx.mark_immutable(&*cmd_place);
259 // Return place (in static memory so that it does not count as leak).
260 let ret_place = ecx.allocate(ecx.machine.layouts.isize, MiriMemoryKind::Machine.into())?;
261 // Call start function.
264 EntryFnType::Main => {
265 let start_id = tcx.lang_items().start_fn().unwrap();
266 let main_ret_ty = tcx.fn_sig(entry_id).output();
267 let main_ret_ty = main_ret_ty.no_bound_vars().unwrap();
268 let start_instance = ty::Instance::resolve(
270 ty::ParamEnv::reveal_all(),
272 tcx.mk_substs(::std::iter::once(ty::subst::GenericArg::from(main_ret_ty))),
277 let main_ptr = ecx.create_fn_alloc_ptr(FnVal::Instance(entry_instance));
282 &[Scalar::from_pointer(main_ptr, &ecx).into(), argc.into(), argv],
284 StackPopCleanup::Root { cleanup: true },
287 EntryFnType::Start => {
291 &[argc.into(), argv],
293 StackPopCleanup::Root { cleanup: true },
298 // Emit any diagnostics related to the setup process for the runtime, so that when the
299 // interpreter loop starts there are no unprocessed diagnostics.
300 ecx.process_diagnostics(info);
305 /// Evaluates the entry function specified by `entry_id`.
306 /// Returns `Some(return_code)` if program execution completed.
307 /// Returns `None` if an evaluation error occurred.
308 pub fn eval_entry<'tcx>(
311 entry_type: EntryFnType,
314 // Copy setting before we move `config`.
315 let ignore_leaks = config.ignore_leaks;
317 let (mut ecx, ret_place) = match create_ecx(tcx, entry_id, entry_type, &config) {
320 err.print_backtrace();
321 panic!("Miri initialization error: {}", err.kind())
325 // Perform the main execution.
326 let res: InterpResult<'_, i64> = (|| {
329 let info = ecx.preprocess_diagnostics();
330 match ecx.schedule()? {
331 SchedulingAction::ExecuteStep => {
332 assert!(ecx.step()?, "a terminated thread was scheduled for execution");
334 SchedulingAction::ExecuteTimeoutCallback => {
336 ecx.machine.communicate(),
337 "scheduler callbacks require disabled isolation, but the code \
338 that created the callback did not check it"
340 ecx.run_timeout_callback()?;
342 SchedulingAction::ExecuteDtors => {
343 // This will either enable the thread again (so we go back
344 // to `ExecuteStep`), or determine that this thread is done
346 ecx.schedule_next_tls_dtor_for_active_thread()?;
348 SchedulingAction::Stop => {
352 ecx.process_diagnostics(info);
354 let return_code = ecx.read_scalar(&ret_place.into())?.to_machine_isize(&ecx)?;
359 // Execution of the program has halted so any memory access we do here
360 // cannot produce a real data race. If we do not do something to disable
361 // data race detection here, some uncommon combination of errors will
362 // cause a data race to be detected:
363 // https://github.com/rust-lang/miri/issues/2020
364 ecx.allow_data_races_mut(|ecx| EnvVars::cleanup(ecx).unwrap());
366 // Process the result.
370 // Check for thread leaks.
371 if !ecx.have_all_terminated() {
373 "the main thread terminated without waiting for all remaining threads",
375 tcx.sess.note_without_error("pass `-Zmiri-ignore-leaks` to disable this check");
378 // Check for memory leaks.
379 info!("Additonal static roots: {:?}", ecx.machine.static_roots);
380 let leaks = ecx.leak_report(&ecx.machine.static_roots);
382 tcx.sess.err("the evaluated program leaked memory");
383 tcx.sess.note_without_error("pass `-Zmiri-ignore-leaks` to disable this check");
384 // Ignore the provided return code - let the reported error
385 // determine the return code.
391 Err(e) => report_error(&ecx, e),
395 /// Turns an array of arguments into a Windows command line string.
397 /// The string will be UTF-16 encoded and NUL terminated.
399 /// Panics if the zeroth argument contains the `"` character because doublequotes
400 /// in argv[0] cannot be encoded using the standard command line parsing rules.
403 /// * [Parsing C++ command-line arguments](https://docs.microsoft.com/en-us/cpp/cpp/main-function-command-line-args?view=msvc-160#parsing-c-command-line-arguments)
404 /// * [The C/C++ Parameter Parsing Rules](https://daviddeley.com/autohotkey/parameters/parameters.htm#WINCRULES)
405 fn args_to_utf16_command_string<I, T>(mut args: I) -> Vec<u16>
407 I: Iterator<Item = T>,
410 // Parse argv[0]. Slashes aren't escaped. Literal double quotes are not allowed.
412 let arg0 = if let Some(arg0) = args.next() {
417 let arg0 = arg0.as_ref();
418 if arg0.contains('"') {
419 panic!("argv[0] cannot contain a doublequote (\") character");
421 // Always surround argv[0] with quotes.
422 let mut s = String::new();
430 // Build the other arguments.
432 let arg = arg.as_ref();
435 cmd.push_str("\"\"");
436 } else if !arg.bytes().any(|c| matches!(c, b'"' | b'\t' | b' ')) {
437 // No quote, tab, or space -- no escaping required.
440 // Spaces and tabs are escaped by surrounding them in quotes.
441 // Quotes are themselves escaped by using backslashes when in a
443 // Backslashes only need to be escaped when one or more are directly
444 // followed by a quote. Otherwise they are taken literally.
447 let mut chars = arg.chars().peekable();
449 let mut nslashes = 0;
450 while let Some(&'\\') = chars.peek() {
457 cmd.extend(iter::repeat('\\').take(nslashes * 2 + 1));
461 cmd.extend(iter::repeat('\\').take(nslashes));
465 cmd.extend(iter::repeat('\\').take(nslashes * 2));
474 if cmd.contains('\0') {
475 panic!("interior null in command line arguments");
477 cmd.encode_utf16().chain(iter::once(0)).collect()
484 #[should_panic(expected = "argv[0] cannot contain a doublequote (\") character")]
485 fn windows_argv0_panic_on_quote() {
486 args_to_utf16_command_string(["\""].iter());
489 fn windows_argv0_no_escape() {
490 // Ensure that a trailing backslash in argv[0] is not escaped.
491 let cmd = String::from_utf16_lossy(&args_to_utf16_command_string(
492 [r"C:\Program Files\", "arg1", "arg 2", "arg \" 3"].iter(),
494 assert_eq!(cmd.trim_end_matches('\0'), r#""C:\Program Files\" arg1 "arg 2" "arg \" 3""#);