2 use std::ffi::{OsStr, OsString};
4 use std::path::{Path, PathBuf};
7 use std::os::unix::ffi::{OsStrExt, OsStringExt};
9 use std::os::windows::ffi::{OsStrExt, OsStringExt};
11 use rustc_middle::ty::layout::LayoutOf;
12 use rustc_target::abi::{Align, Size};
16 /// Represent how path separator conversion should be done.
17 pub enum PathConversion {
23 pub fn os_str_to_bytes<'a, 'tcx>(os_str: &'a OsStr) -> InterpResult<'tcx, &'a [u8]> {
28 pub fn os_str_to_bytes<'a, 'tcx>(os_str: &'a OsStr) -> InterpResult<'tcx, &'a [u8]> {
29 // On non-unix platforms the best we can do to transform bytes from/to OS strings is to do the
30 // intermediate transformation into strings. Which invalidates non-utf8 paths that are actually
34 .map(|s| s.as_bytes())
35 .ok_or_else(|| err_unsup_format!("{:?} is not a valid utf-8 string", os_str).into())
39 pub fn bytes_to_os_str<'a, 'tcx>(bytes: &'a [u8]) -> InterpResult<'tcx, &'a OsStr> {
40 Ok(OsStr::from_bytes(bytes))
43 pub fn bytes_to_os_str<'a, 'tcx>(bytes: &'a [u8]) -> InterpResult<'tcx, &'a OsStr> {
44 let s = std::str::from_utf8(bytes)
45 .map_err(|_| err_unsup_format!("{:?} is not a valid utf-8 string", bytes))?;
49 impl<'mir, 'tcx: 'mir> EvalContextExt<'mir, 'tcx> for crate::MiriInterpCx<'mir, 'tcx> {}
50 pub trait EvalContextExt<'mir, 'tcx: 'mir>: crate::MiriInterpCxExt<'mir, 'tcx> {
51 /// Helper function to read an OsString from a null-terminated sequence of bytes, which is what
52 /// the Unix APIs usually handle.
53 fn read_os_str_from_c_str<'a>(
55 ptr: Pointer<Option<Provenance>>,
56 ) -> InterpResult<'tcx, &'a OsStr>
61 let this = self.eval_context_ref();
62 let bytes = this.read_c_str(ptr)?;
63 bytes_to_os_str(bytes)
66 /// Helper function to read an OsString from a 0x0000-terminated sequence of u16,
67 /// which is what the Windows APIs usually handle.
68 fn read_os_str_from_wide_str<'a>(
70 ptr: Pointer<Option<Provenance>>,
71 ) -> InterpResult<'tcx, OsString>
77 pub fn u16vec_to_osstring<'tcx>(u16_vec: Vec<u16>) -> InterpResult<'tcx, OsString> {
78 Ok(OsString::from_wide(&u16_vec[..]))
81 pub fn u16vec_to_osstring<'tcx>(u16_vec: Vec<u16>) -> InterpResult<'tcx, OsString> {
82 let s = String::from_utf16(&u16_vec[..])
83 .map_err(|_| err_unsup_format!("{:?} is not a valid utf-16 string", u16_vec))?;
87 let u16_vec = self.eval_context_ref().read_wide_str(ptr)?;
88 u16vec_to_osstring(u16_vec)
91 /// Helper function to write an OsStr as a null-terminated sequence of bytes, which is what
92 /// the Unix APIs usually handle. This function returns `Ok((false, length))` without trying
93 /// to write if `size` is not large enough to fit the contents of `os_string` plus a null
94 /// terminator. It returns `Ok((true, length))` if the writing process was successful. The
95 /// string length returned does include the null terminator.
96 fn write_os_str_to_c_str(
99 ptr: Pointer<Option<Provenance>>,
101 ) -> InterpResult<'tcx, (bool, u64)> {
102 let bytes = os_str_to_bytes(os_str)?;
103 // If `size` is smaller or equal than `bytes.len()`, writing `bytes` plus the required null
104 // terminator to memory using the `ptr` pointer would cause an out-of-bounds access.
105 let string_length = u64::try_from(bytes.len()).unwrap();
106 let string_length = string_length.checked_add(1).unwrap();
107 if size < string_length {
108 return Ok((false, string_length));
110 self.eval_context_mut()
111 .write_bytes_ptr(ptr, bytes.iter().copied().chain(iter::once(0u8)))?;
112 Ok((true, string_length))
115 /// Helper function to write an OsStr as a 0x0000-terminated u16-sequence, which is what
116 /// the Windows APIs usually handle. This function returns `Ok((false, length))` without trying
117 /// to write if `size` is not large enough to fit the contents of `os_string` plus a null
118 /// terminator. It returns `Ok((true, length))` if the writing process was successful. The
119 /// string length returned does include the null terminator. Length is measured in units of
121 fn write_os_str_to_wide_str(
124 ptr: Pointer<Option<Provenance>>,
126 ) -> InterpResult<'tcx, (bool, u64)> {
128 fn os_str_to_u16vec<'tcx>(os_str: &OsStr) -> InterpResult<'tcx, Vec<u16>> {
129 Ok(os_str.encode_wide().collect())
132 fn os_str_to_u16vec<'tcx>(os_str: &OsStr) -> InterpResult<'tcx, Vec<u16>> {
133 // On non-Windows platforms the best we can do to transform Vec<u16> from/to OS strings is to do the
134 // intermediate transformation into strings. Which invalidates non-utf8 paths that are actually
138 .map(|s| s.encode_utf16().collect())
139 .ok_or_else(|| err_unsup_format!("{:?} is not a valid utf-8 string", os_str).into())
142 let u16_vec = os_str_to_u16vec(os_str)?;
143 // If `size` is smaller or equal than `bytes.len()`, writing `bytes` plus the required
144 // 0x0000 terminator to memory would cause an out-of-bounds access.
145 let string_length = u64::try_from(u16_vec.len()).unwrap();
146 let string_length = string_length.checked_add(1).unwrap();
147 if size < string_length {
148 return Ok((false, string_length));
151 // Store the UTF-16 string.
152 let size2 = Size::from_bytes(2);
153 let this = self.eval_context_mut();
155 .get_ptr_alloc_mut(ptr, size2 * string_length, Align::from_bytes(2).unwrap())?
156 .unwrap(); // not a ZST, so we will get a result
157 for (offset, wchar) in u16_vec.into_iter().chain(iter::once(0x0000)).enumerate() {
158 let offset = u64::try_from(offset).unwrap();
159 alloc.write_scalar(alloc_range(size2 * offset, size2), Scalar::from_u16(wchar))?;
161 Ok((true, string_length))
164 /// Allocate enough memory to store the given `OsStr` as a null-terminated sequence of bytes.
165 fn alloc_os_str_as_c_str(
168 memkind: MemoryKind<MiriMemoryKind>,
169 ) -> InterpResult<'tcx, Pointer<Option<Provenance>>> {
170 let size = u64::try_from(os_str.len()).unwrap().checked_add(1).unwrap(); // Make space for `0` terminator.
171 let this = self.eval_context_mut();
173 let arg_type = this.tcx.mk_array(this.tcx.types.u8, size);
174 let arg_place = this.allocate(this.layout_of(arg_type).unwrap(), memkind)?;
175 assert!(self.write_os_str_to_c_str(os_str, arg_place.ptr, size).unwrap().0);
179 /// Allocate enough memory to store the given `OsStr` as a null-terminated sequence of `u16`.
180 fn alloc_os_str_as_wide_str(
183 memkind: MemoryKind<MiriMemoryKind>,
184 ) -> InterpResult<'tcx, Pointer<Option<Provenance>>> {
185 let size = u64::try_from(os_str.len()).unwrap().checked_add(1).unwrap(); // Make space for `0x0000` terminator.
186 let this = self.eval_context_mut();
188 let arg_type = this.tcx.mk_array(this.tcx.types.u16, size);
189 let arg_place = this.allocate(this.layout_of(arg_type).unwrap(), memkind)?;
190 assert!(self.write_os_str_to_wide_str(os_str, arg_place.ptr, size).unwrap().0);
194 /// Read a null-terminated sequence of bytes, and perform path separator conversion if needed.
195 fn read_path_from_c_str<'a>(
197 ptr: Pointer<Option<Provenance>>,
198 ) -> InterpResult<'tcx, Cow<'a, Path>>
203 let this = self.eval_context_ref();
204 let os_str = this.read_os_str_from_c_str(ptr)?;
206 Ok(match this.convert_path_separator(Cow::Borrowed(os_str), PathConversion::TargetToHost) {
207 Cow::Borrowed(x) => Cow::Borrowed(Path::new(x)),
208 Cow::Owned(y) => Cow::Owned(PathBuf::from(y)),
212 /// Read a null-terminated sequence of `u16`s, and perform path separator conversion if needed.
213 fn read_path_from_wide_str(
215 ptr: Pointer<Option<Provenance>>,
216 ) -> InterpResult<'tcx, PathBuf> {
217 let this = self.eval_context_ref();
218 let os_str = this.read_os_str_from_wide_str(ptr)?;
221 .convert_path_separator(Cow::Owned(os_str), PathConversion::TargetToHost)
226 /// Write a Path to the machine memory (as a null-terminated sequence of bytes),
227 /// adjusting path separators if needed.
228 fn write_path_to_c_str(
231 ptr: Pointer<Option<Provenance>>,
233 ) -> InterpResult<'tcx, (bool, u64)> {
234 let this = self.eval_context_mut();
236 .convert_path_separator(Cow::Borrowed(path.as_os_str()), PathConversion::HostToTarget);
237 this.write_os_str_to_c_str(&os_str, ptr, size)
240 /// Write a Path to the machine memory (as a null-terminated sequence of `u16`s),
241 /// adjusting path separators if needed.
242 fn write_path_to_wide_str(
245 ptr: Pointer<Option<Provenance>>,
247 ) -> InterpResult<'tcx, (bool, u64)> {
248 let this = self.eval_context_mut();
250 .convert_path_separator(Cow::Borrowed(path.as_os_str()), PathConversion::HostToTarget);
251 this.write_os_str_to_wide_str(&os_str, ptr, size)
254 /// Allocate enough memory to store a Path as a null-terminated sequence of bytes,
255 /// adjusting path separators if needed.
256 fn alloc_path_as_c_str(
259 memkind: MemoryKind<MiriMemoryKind>,
260 ) -> InterpResult<'tcx, Pointer<Option<Provenance>>> {
261 let this = self.eval_context_mut();
263 .convert_path_separator(Cow::Borrowed(path.as_os_str()), PathConversion::HostToTarget);
264 this.alloc_os_str_as_c_str(&os_str, memkind)
267 fn convert_path_separator<'a>(
269 os_str: Cow<'a, OsStr>,
270 direction: PathConversion,
271 ) -> Cow<'a, OsStr> {
272 let this = self.eval_context_ref();
273 let target_os = &this.tcx.sess.target.os;
275 return if target_os == "windows" {
276 // Windows-on-Windows, all fine.
279 // Unix target, Windows host.
280 let (from, to) = match direction {
281 PathConversion::HostToTarget => ('\\', '/'),
282 PathConversion::TargetToHost => ('/', '\\'),
284 let converted = os_str
286 .map(|wchar| if wchar == from as u16 { to as u16 } else { wchar })
287 .collect::<Vec<_>>();
288 Cow::Owned(OsString::from_wide(&converted))
291 return if target_os == "windows" {
292 // Windows target, Unix host.
293 let (from, to) = match direction {
294 PathConversion::HostToTarget => ('/', '\\'),
295 PathConversion::TargetToHost => ('\\', '/'),
297 let converted = os_str
300 .map(|&wchar| if wchar == from as u8 { to as u8 } else { wchar })
301 .collect::<Vec<_>>();
302 Cow::Owned(OsString::from_vec(converted))
304 // Unix-on-Unix, all is fine.