//! The virtual memory representation of the MIR interpreter.

use std::borrow::Cow;
use std::convert::{TryFrom, TryInto};
use std::fmt;
use std::iter;
use std::ops::{Deref, Range};
use std::ptr;

use rustc_ast::Mutability;
use rustc_data_structures::intern::Interned;
use rustc_data_structures::sorted_map::SortedMap;
use rustc_span::DUMMY_SP;
use rustc_target::abi::{Align, HasDataLayout, Size};

use super::{
    read_target_uint, write_target_uint, AllocId, InterpError, InterpResult, Pointer, Provenance,
    ResourceExhaustionInfo, Scalar, ScalarMaybeUninit, ScalarSizeMismatch, UndefinedBehaviorInfo,
    UninitBytesAccess, UnsupportedOpInfo,
};
use crate::ty;

/// This type represents an Allocation in the Miri/CTFE core engine.
///
/// Its public API is rather low-level, working directly with allocation offsets and a custom error
/// type to account for the lack of an `AllocId` on this level. The Miri/CTFE core engine `memory`
/// module provides higher-level access.
#[derive(Clone, Debug, Eq, PartialEq, PartialOrd, Ord, Hash, TyEncodable, TyDecodable)]
#[derive(HashStable)]
pub struct Allocation<Tag = AllocId, Extra = ()> {
    /// The actual bytes of the allocation.
    /// Note that the bytes of a pointer represent the offset of the pointer.
    bytes: Box<[u8]>,
    /// Maps from byte addresses to extra data for each pointer.
    /// Only the first byte of a pointer is inserted into the map; i.e.,
    /// every entry in this map applies to `pointer_size` consecutive bytes starting
    /// at the given offset.
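    /// For example, with 8-byte pointers, an entry at offset 16 applies to bytes `16..24`.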
    relocations: Relocations<Tag>,
    /// Denotes which part of this allocation is initialized.
    init_mask: InitMask,
    /// The alignment of the allocation to detect unaligned reads.
    /// (`Align` guarantees that this is a power of two.)
    pub align: Align,
    /// `true` if the allocation is mutable.
    /// Also used by codegen to determine if a static should be put into mutable memory,
    /// which happens for `static mut` and `static` with interior mutability.
    pub mutability: Mutability,
    /// Extra state for the machine.
    pub extra: Extra,
}

/// Interned types generally have an `Outer` type and an `Inner` type, where
/// `Outer` is a newtype around `Interned<Inner>`, and all the operations are
/// done on `Outer`, because all occurrences are interned. E.g. `Ty` is an
/// outer type and `TyS` is its inner type.
///
/// Here things are different because only const allocations are interned. This
/// means that both the inner type (`Allocation`) and the outer type
/// (`ConstAllocation`) are used quite a bit.
#[derive(Copy, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, HashStable)]
#[rustc_pass_by_value]
pub struct ConstAllocation<'tcx, Tag = AllocId, Extra = ()>(
    pub Interned<'tcx, Allocation<Tag, Extra>>,
);

impl<'tcx> fmt::Debug for ConstAllocation<'tcx> {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        // This matches how `Allocation` is printed. We print it like this to
        // avoid having to update expected output in a lot of tests.
        write!(f, "{:?}", self.inner())
    }
}

impl<'tcx, Tag, Extra> ConstAllocation<'tcx, Tag, Extra> {
    pub fn inner(self) -> &'tcx Allocation<Tag, Extra> {
        self.0.0
    }
}

/// We have our own error type that does not know about the `AllocId`; that information
/// is added when converting to `InterpError`.
#[derive(Debug)]
pub enum AllocError {
    /// A scalar had the wrong size.
    ScalarSizeMismatch(ScalarSizeMismatch),
    /// Encountered a pointer where we needed raw bytes.
    ReadPointerAsBytes,
    /// Partially overwriting a pointer.
    PartialPointerOverwrite(Size),
    /// Using uninitialized data where it is not allowed.
    InvalidUninitBytes(Option<UninitBytesAccess>),
}

pub type AllocResult<T = ()> = Result<T, AllocError>;

impl From<ScalarSizeMismatch> for AllocError {
    fn from(s: ScalarSizeMismatch) -> Self {
        AllocError::ScalarSizeMismatch(s)
    }
}

impl AllocError {
    pub fn to_interp_error<'tcx>(self, alloc_id: AllocId) -> InterpError<'tcx> {
        use AllocError::*;
        match self {
            ScalarSizeMismatch(s) => {
                InterpError::UndefinedBehavior(UndefinedBehaviorInfo::ScalarSizeMismatch(s))
            }
            ReadPointerAsBytes => InterpError::Unsupported(UnsupportedOpInfo::ReadPointerAsBytes),
            PartialPointerOverwrite(offset) => InterpError::Unsupported(
                UnsupportedOpInfo::PartialPointerOverwrite(Pointer::new(alloc_id, offset)),
            ),
            InvalidUninitBytes(info) => InterpError::UndefinedBehavior(
                UndefinedBehaviorInfo::InvalidUninitBytes(info.map(|b| (alloc_id, b))),
            ),
        }
    }
}

/// The information that makes up a memory access: offset and size.
#[derive(Copy, Clone, Debug)]
pub struct AllocRange {
    pub start: Size,
    pub size: Size,
}

/// Free-starting constructor for less syntactic overhead.
#[inline(always)]
pub fn alloc_range(start: Size, size: Size) -> AllocRange {
    AllocRange { start, size }
}

impl AllocRange {
    #[inline(always)]
    pub fn end(self) -> Size {
        self.start + self.size // This does overflow checking.
    }

    /// Returns the `subrange` within this range; panics if it is not a subrange.
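    ///
    /// For example, `alloc_range(Size::from_bytes(8), Size::from_bytes(16))` subranged by
    /// `alloc_range(Size::from_bytes(4), Size::from_bytes(8))` yields
    /// `alloc_range(Size::from_bytes(12), Size::from_bytes(8))`, which ends at 20 and thus
    /// stays within the outer end of 24.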
    #[inline]
    pub fn subrange(self, subrange: AllocRange) -> AllocRange {
        let sub_start = self.start + subrange.start;
        let range = alloc_range(sub_start, subrange.size);
        assert!(range.end() <= self.end(), "access outside the bounds for given AllocRange");
        range
    }
}

// The constructors are all without extra; the extra gets added by a machine hook later.
impl<Tag> Allocation<Tag> {
    /// Creates an allocation initialized by the given bytes.
    pub fn from_bytes<'a>(
        slice: impl Into<Cow<'a, [u8]>>,
        align: Align,
        mutability: Mutability,
    ) -> Self {
        let bytes = Box::<[u8]>::from(slice.into());
        let size = Size::from_bytes(bytes.len());
        Self {
            bytes,
            relocations: Relocations::new(),
            init_mask: InitMask::new(size, true),
            align,
            mutability,
            extra: (),
        }
    }

    pub fn from_bytes_byte_aligned_immutable<'a>(slice: impl Into<Cow<'a, [u8]>>) -> Self {
        Allocation::from_bytes(slice, Align::ONE, Mutability::Not)
    }

    /// Try to create an Allocation of `size` bytes, failing if there is not enough memory
    /// available to the compiler to do so.
    pub fn uninit(size: Size, align: Align, panic_on_fail: bool) -> InterpResult<'static, Self> {
        let bytes = Box::<[u8]>::try_new_zeroed_slice(size.bytes_usize()).map_err(|_| {
            // This results in an error that can happen non-deterministically, since the memory
            // available to the compiler can change between runs. Normally queries are always
            // deterministic. However, we can be non-deterministic here because all uses of const
            // evaluation (including ConstProp!) will make compilation fail (via hard error
            // or ICE) upon encountering a `MemoryExhausted` error.
            if panic_on_fail {
                panic!("Allocation::uninit called with panic_on_fail had allocation failure")
            }
            ty::tls::with(|tcx| {
                tcx.sess.delay_span_bug(DUMMY_SP, "exhausted memory during interpretation")
            });
            InterpError::ResourceExhaustion(ResourceExhaustionInfo::MemoryExhausted)
        })?;
        // SAFETY: the box was zero-allocated, which is a valid initial value for Box<[u8]>
        let bytes = unsafe { bytes.assume_init() };
        Ok(Allocation {
            bytes,
            relocations: Relocations::new(),
            init_mask: InitMask::new(size, false),
            align,
            mutability: Mutability::Mut,
            extra: (),
        })
    }
}

impl Allocation {
    /// Converts the pointer `Tag`s and adds the `Extra` state.
    pub fn convert_tag_add_extra<Tag, Extra>(
        self,
        cx: &impl HasDataLayout,
        extra: Extra,
        mut tagger: impl FnMut(Pointer<AllocId>) -> Pointer<Tag>,
    ) -> Allocation<Tag, Extra> {
        // Compute new pointer tags, which also adjusts the bytes.
        let mut bytes = self.bytes;
        let mut new_relocations = Vec::with_capacity(self.relocations.0.len());
        let ptr_size = cx.data_layout().pointer_size.bytes_usize();
        let endian = cx.data_layout().endian;
        for &(offset, alloc_id) in self.relocations.iter() {
            let idx = offset.bytes_usize();
            let ptr_bytes = &mut bytes[idx..idx + ptr_size];
            let bits = read_target_uint(endian, ptr_bytes).unwrap();
            let (ptr_tag, ptr_offset) =
                tagger(Pointer::new(alloc_id, Size::from_bytes(bits))).into_parts();
            write_target_uint(endian, ptr_bytes, ptr_offset.bytes().into()).unwrap();
            new_relocations.push((offset, ptr_tag));
        }
        // Create allocation.
        Allocation {
            bytes,
            relocations: Relocations::from_presorted(new_relocations),
            init_mask: self.init_mask,
            align: self.align,
            mutability: self.mutability,
            extra,
        }
    }
}

/// Raw accessors. Provide access to otherwise private bytes.
impl<Tag, Extra> Allocation<Tag, Extra> {
    pub fn len(&self) -> usize {
        self.bytes.len()
    }

    pub fn size(&self) -> Size {
        Size::from_bytes(self.len())
    }

    /// Looks at a slice which may describe uninitialized bytes or describe a relocation. This differs
    /// from `get_bytes_with_uninit_and_ptr` in that it does no relocation checks (even on the
    /// edges) at all.
    /// This must not be used for reads affecting the interpreter execution.
    pub fn inspect_with_uninit_and_ptr_outside_interpreter(&self, range: Range<usize>) -> &[u8] {
        &self.bytes[range]
    }

    /// Returns the mask indicating which bytes are initialized.
    pub fn init_mask(&self) -> &InitMask {
        &self.init_mask
    }

    /// Returns the relocation list.
    pub fn relocations(&self) -> &Relocations<Tag> {
        &self.relocations
    }
}

/// Byte accessors.
impl<Tag: Provenance, Extra> Allocation<Tag, Extra> {
    /// The last argument controls whether we error out when there are uninitialized
    /// or pointer bytes. You should never call this directly; call `get_bytes` or
    /// `get_bytes_with_uninit_and_ptr` instead.
    ///
    /// This function also guarantees that the resulting pointer will remain stable
    /// even when new allocations are pushed to the `HashMap`. `mem_copy_repeatedly` relies
    /// on that.
    ///
    /// It is the caller's responsibility to check bounds and alignment beforehand.
    fn get_bytes_internal(
        &self,
        cx: &impl HasDataLayout,
        range: AllocRange,
        check_init_and_ptr: bool,
    ) -> AllocResult<&[u8]> {
        if check_init_and_ptr {
            self.check_init(range)?;
            self.check_relocations(cx, range)?;
        } else {
            // We still don't want relocations on the *edges*.
            self.check_relocation_edges(cx, range)?;
        }

        Ok(&self.bytes[range.start.bytes_usize()..range.end().bytes_usize()])
    }

    /// Checks that these bytes are initialized and not pointer bytes, and then returns them
    /// as a slice.
    ///
    /// It is the caller's responsibility to check bounds and alignment beforehand.
    /// Most likely, you want to use the `PlaceTy` and `OperandTy`-based methods
    /// on `InterpCx` instead.
    #[inline]
    pub fn get_bytes(&self, cx: &impl HasDataLayout, range: AllocRange) -> AllocResult<&[u8]> {
        self.get_bytes_internal(cx, range, true)
    }

    /// It is the caller's responsibility to handle uninitialized and pointer bytes.
    /// However, this still checks that there are no relocations on the *edges*.
    ///
    /// It is the caller's responsibility to check bounds and alignment beforehand.
    #[inline]
    pub fn get_bytes_with_uninit_and_ptr(
        &self,
        cx: &impl HasDataLayout,
        range: AllocRange,
    ) -> AllocResult<&[u8]> {
        self.get_bytes_internal(cx, range, false)
    }

    /// Just calling this already marks everything as initialized and removes relocations,
    /// so be sure to actually put data there!
    ///
    /// It is the caller's responsibility to check bounds and alignment beforehand.
    /// Most likely, you want to use the `PlaceTy` and `OperandTy`-based methods
    /// on `InterpCx` instead.
    pub fn get_bytes_mut(
        &mut self,
        cx: &impl HasDataLayout,
        range: AllocRange,
    ) -> AllocResult<&mut [u8]> {
        self.mark_init(range, true);
        self.clear_relocations(cx, range)?;

        Ok(&mut self.bytes[range.start.bytes_usize()..range.end().bytes_usize()])
    }

    /// A raw pointer variant of `get_bytes_mut` that avoids invalidating existing aliases into this memory.
    pub fn get_bytes_mut_ptr(
        &mut self,
        cx: &impl HasDataLayout,
        range: AllocRange,
    ) -> AllocResult<*mut [u8]> {
        self.mark_init(range, true);
        self.clear_relocations(cx, range)?;

        assert!(range.end().bytes_usize() <= self.bytes.len()); // need to do our own bounds-check
        let begin_ptr = self.bytes.as_mut_ptr().wrapping_add(range.start.bytes_usize());
        let len = range.end().bytes_usize() - range.start.bytes_usize();
        Ok(ptr::slice_from_raw_parts_mut(begin_ptr, len))
    }
}

/// Reading and writing.
impl<Tag: Provenance, Extra> Allocation<Tag, Extra> {
    /// Validates that `ptr.offset` and `ptr.offset + size` do not point to the middle of a
    /// relocation. If `allow_uninit_and_ptr` is `false`, also enforces that the memory in the
    /// given range contains neither relocations nor uninitialized bytes.
    pub fn check_bytes(
        &self,
        cx: &impl HasDataLayout,
        range: AllocRange,
        allow_uninit_and_ptr: bool,
    ) -> AllocResult {
        // Check bounds and relocations on the edges.
        self.get_bytes_with_uninit_and_ptr(cx, range)?;
        // Check uninit and ptr.
        if !allow_uninit_and_ptr {
            self.check_init(range)?;
            self.check_relocations(cx, range)?;
        }
        Ok(())
    }

    /// Reads a *non-ZST* scalar.
    ///
    /// ZSTs can't be read because in order to obtain a `Pointer`, we need to check
    /// for ZSTness anyway due to integer pointers being valid for ZSTs.
    ///
    /// It is the caller's responsibility to check bounds and alignment beforehand.
    /// Most likely, you want to call `InterpCx::read_scalar` instead of this method.
    pub fn read_scalar(
        &self,
        cx: &impl HasDataLayout,
        range: AllocRange,
    ) -> AllocResult<ScalarMaybeUninit<Tag>> {
        // `get_bytes_with_uninit_and_ptr` tests relocation edges.
        // We deliberately error when loading data that partially has provenance, or partially
        // initialized data (that's the check below), into a scalar. The LLVM semantics of this are
        // unclear so we are conservative. See <https://github.com/rust-lang/rust/issues/69488> for
        // further discussion.
        let bytes = self.get_bytes_with_uninit_and_ptr(cx, range)?;
        // Uninit check happens *after* we established that the alignment is correct.
        // We must not return `Ok()` for unaligned pointers!
        if self.is_init(range).is_err() {
            // This inflates uninitialized bytes to the entire scalar, even if only a few
            // bytes are uninitialized.
            return Ok(ScalarMaybeUninit::Uninit);
        }
        // Now we do the actual reading.
        let bits = read_target_uint(cx.data_layout().endian, bytes).unwrap();
        // See if we got a pointer.
        if range.size != cx.data_layout().pointer_size {
            // Not a pointer.
            // *Now*, we better make sure that the inside is free of relocations too.
            self.check_relocations(cx, range)?;
        } else {
            // Maybe a pointer.
            if let Some(&prov) = self.relocations.get(&range.start) {
                let ptr = Pointer::new(prov, Size::from_bytes(bits));
                return Ok(ScalarMaybeUninit::from_pointer(ptr, cx));
            }
        }
        // We don't. Just return the bits.
        Ok(ScalarMaybeUninit::Scalar(Scalar::from_uint(bits, range.size)))
    }

    /// Writes a *non-ZST* scalar.
    ///
    /// ZSTs can't be written because in order to obtain a `Pointer`, we need to check
    /// for ZSTness anyway due to integer pointers being valid for ZSTs.
    ///
    /// It is the caller's responsibility to check bounds and alignment beforehand.
    /// Most likely, you want to call `InterpCx::write_scalar` instead of this method.
    pub fn write_scalar(
        &mut self,
        cx: &impl HasDataLayout,
        range: AllocRange,
        val: ScalarMaybeUninit<Tag>,
    ) -> AllocResult {
        assert!(self.mutability == Mutability::Mut);

        let val = match val {
            ScalarMaybeUninit::Scalar(scalar) => scalar,
            ScalarMaybeUninit::Uninit => {
                return self.write_uninit(cx, range);
            }
        };

        // `to_bits_or_ptr_internal` is the right method because we just want to store this data
        // as-is into memory.
        let (bytes, provenance) = match val.to_bits_or_ptr_internal(range.size)? {
            Err(val) => {
                let (provenance, offset) = val.into_parts();
                (u128::from(offset.bytes()), Some(provenance))
            }
            Ok(data) => (data, None),
        };

        let endian = cx.data_layout().endian;
        let dst = self.get_bytes_mut(cx, range)?;
        write_target_uint(endian, dst, bytes).unwrap();

        // See if we have to also write a relocation.
        if let Some(provenance) = provenance {
            self.relocations.0.insert(range.start, provenance);
        }

        Ok(())
    }

    /// Write "uninit" to the given memory range.
    pub fn write_uninit(&mut self, cx: &impl HasDataLayout, range: AllocRange) -> AllocResult {
        self.mark_init(range, false);
        self.clear_relocations(cx, range)?;
        return Ok(());
    }
}

/// Relocations.
impl<Tag: Copy, Extra> Allocation<Tag, Extra> {
    /// Returns all relocations overlapping with the given memory range.
    pub fn get_relocations(&self, cx: &impl HasDataLayout, range: AllocRange) -> &[(Size, Tag)] {
        // We have to go back `pointer_size - 1` bytes, as that one would still overlap with
        // the beginning of this range.
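        // For example, with 8-byte pointers, a relocation at offset 16 covers bytes 16..24,
        // so a read starting at offset 20 must query from 20 - 7 = 13 to still see it.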
        let start = range.start.bytes().saturating_sub(cx.data_layout().pointer_size.bytes() - 1);
        self.relocations.range(Size::from_bytes(start)..range.end())
    }

    /// Checks that there are no relocations overlapping with the given range.
    #[inline(always)]
    fn check_relocations(&self, cx: &impl HasDataLayout, range: AllocRange) -> AllocResult {
        if self.get_relocations(cx, range).is_empty() {
            Ok(())
        } else {
            Err(AllocError::ReadPointerAsBytes)
        }
    }

    /// Removes all relocations inside the given range.
    /// If there are relocations overlapping with the edges, they
    /// are removed as well *and* the bytes they cover are marked as
    /// uninitialized. This is a somewhat odd "spooky action at a distance",
    /// but it allows strictly more code to run than if we would just error
    /// immediately in that case.
    fn clear_relocations(&mut self, cx: &impl HasDataLayout, range: AllocRange) -> AllocResult
    where
        Tag: Provenance,
    {
        // Find the start and end of the given range and its outermost relocations.
        let (first, last) = {
            // Find all relocations overlapping the given range.
            let relocations = self.get_relocations(cx, range);
            if relocations.is_empty() {
                return Ok(());
            }

            (
                relocations.first().unwrap().0,
                relocations.last().unwrap().0 + cx.data_layout().pointer_size,
            )
        };
        let start = range.start;
        let end = range.end();

        // We need to handle clearing the relocations from parts of a pointer. See
        // <https://github.com/rust-lang/rust/issues/87184> for details.
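        // For example, with an 8-byte pointer stored at offset 0, clearing the range 2..6
        // removes that relocation and, when the machine permits partial pointer overwrites,
        // marks bytes 0..2 and 6..8 as uninitialized.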
        if first < start {
            if Tag::ERR_ON_PARTIAL_PTR_OVERWRITE {
                return Err(AllocError::PartialPointerOverwrite(first));
            }
            self.init_mask.set_range(first, start, false);
        }
        if last > end {
            if Tag::ERR_ON_PARTIAL_PTR_OVERWRITE {
                return Err(AllocError::PartialPointerOverwrite(
                    last - cx.data_layout().pointer_size,
                ));
            }
            self.init_mask.set_range(end, last, false);
        }

        // Forget all the relocations.
        self.relocations.0.remove_range(first..last);

        Ok(())
    }

    /// Errors if there are relocations overlapping with the edges of the
    /// given memory range.
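    ///
    /// This is done by querying two zero-sized ranges, one at `range.start` and one at
    /// `range.end()`; because `get_relocations` also searches backwards by `pointer_size - 1`
    /// bytes, such a query still reports a pointer that straddles that position.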
    #[inline]
    fn check_relocation_edges(&self, cx: &impl HasDataLayout, range: AllocRange) -> AllocResult {
        self.check_relocations(cx, alloc_range(range.start, Size::ZERO))?;
        self.check_relocations(cx, alloc_range(range.end(), Size::ZERO))?;
        Ok(())
    }
}

/// "Relocations" stores the provenance information of pointers stored in memory.
#[derive(Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Debug, TyEncodable, TyDecodable)]
pub struct Relocations<Tag = AllocId>(SortedMap<Size, Tag>);

impl<Tag> Relocations<Tag> {
    pub fn new() -> Self {
        Relocations(SortedMap::new())
    }

    // The caller must guarantee that the given relocations are already sorted
    // by address and contain no duplicates.
    pub fn from_presorted(r: Vec<(Size, Tag)>) -> Self {
        Relocations(SortedMap::from_presorted_elements(r))
    }
}

impl<Tag> Deref for Relocations<Tag> {
    type Target = SortedMap<Size, Tag>;

    fn deref(&self) -> &Self::Target {
        &self.0
    }
}

/// A partial, owned list of relocations to transfer into another allocation.
pub struct AllocationRelocations<Tag> {
    relative_relocations: Vec<(Size, Tag)>,
}

impl<Tag: Copy, Extra> Allocation<Tag, Extra> {
    pub fn prepare_relocation_copy(
        &self,
        cx: &impl HasDataLayout,
        src: AllocRange,
        dest: Size,
        count: u64,
    ) -> AllocationRelocations<Tag> {
        let relocations = self.get_relocations(cx, src);
        if relocations.is_empty() {
            return AllocationRelocations { relative_relocations: Vec::new() };
        }

        let size = src.size;
        let mut new_relocations = Vec::with_capacity(relocations.len() * (count as usize));

        for i in 0..count {
            new_relocations.extend(relocations.iter().map(|&(offset, reloc)| {
                // Compute the offset for the current repetition.
                let dest_offset = dest + size * i; // `Size` operations
                (
                    // Shift offsets from the source allocation to the destination allocation.
                    (offset + dest_offset) - src.start, // `Size` operations
                    reloc,
                )
            }));
        }

        AllocationRelocations { relative_relocations: new_relocations }
    }

    /// Applies a relocation copy.
    /// The affected range, as defined in the parameters to `prepare_relocation_copy`, is expected
    /// to be clear of relocations.
    ///
    /// This is dangerous to use as it can violate internal `Allocation` invariants!
    /// It only exists to support an efficient implementation of `mem_copy_repeatedly`.
    pub fn mark_relocation_range(&mut self, relocations: AllocationRelocations<Tag>) {
        self.relocations.0.insert_presorted(relocations.relative_relocations);
    }
}

////////////////////////////////////////////////////////////////////////////////
// Uninitialized byte tracking
////////////////////////////////////////////////////////////////////////////////

type Block = u64;

/// A bitmask where each bit refers to the byte with the same index. If the bit is `true`, the byte
/// is initialized. If it is `false` the byte is uninitialized.
#[derive(Clone, Debug, Eq, PartialEq, PartialOrd, Ord, Hash, TyEncodable, TyDecodable)]
#[derive(HashStable)]
pub struct InitMask {
    blocks: Vec<Block>,
    len: Size,
}

impl InitMask {
    pub const BLOCK_SIZE: u64 = 64;

    #[inline]
    fn bit_index(bits: Size) -> (usize, usize) {
        // BLOCK_SIZE is the number of bits that can fit in a `Block`.
        // Each bit in a `Block` represents the initialization state of one byte of an allocation,
        // so we use `.bytes()` here.
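        // For example, an offset of 200 bytes maps to block 3, bit 8, since 200 == 3 * 64 + 8;
        // `size_from_bit_index(3, 8)` below maps it back.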
        let bits = bits.bytes();
        let a = bits / InitMask::BLOCK_SIZE;
        let b = bits % InitMask::BLOCK_SIZE;
        (usize::try_from(a).unwrap(), usize::try_from(b).unwrap())
    }

    #[inline]
    fn size_from_bit_index(block: impl TryInto<u64>, bit: impl TryInto<u64>) -> Size {
        let block = block.try_into().ok().unwrap();
        let bit = bit.try_into().ok().unwrap();
        Size::from_bytes(block * InitMask::BLOCK_SIZE + bit)
    }

    pub fn new(size: Size, state: bool) -> Self {
        let mut m = InitMask { blocks: vec![], len: Size::ZERO };
        m.grow(size, state);
        m
    }

    pub fn set_range(&mut self, start: Size, end: Size, new_state: bool) {
        let len = self.len;
        if end > len {
            self.grow(end - len, new_state);
        }
        self.set_range_inbounds(start, end, new_state);
    }

    pub fn set_range_inbounds(&mut self, start: Size, end: Size, new_state: bool) {
        let (blocka, bita) = Self::bit_index(start);
        let (blockb, bitb) = Self::bit_index(end);
        if blocka == blockb {
            // First set all bits except the first `bita`,
            // then unset the last `64 - bitb` bits.
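            // For example, with `bita = 2` and `bitb = 5`, the mask is
            // `(u64::MAX << 2) & (u64::MAX >> 59)`, i.e. exactly bits 2, 3, and 4
            // (the end-exclusive range `2..5`).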
            let range = if bitb == 0 {
                u64::MAX << bita
            } else {
                (u64::MAX << bita) & (u64::MAX >> (64 - bitb))
            };
            if new_state {
                self.blocks[blocka] |= range;
            } else {
                self.blocks[blocka] &= !range;
            }
            return;
        }
        // across block boundaries
        if new_state {
            // Set `bita..64` to `1`.
            self.blocks[blocka] |= u64::MAX << bita;
            // Set `0..bitb` to `1`.
            if bitb != 0 {
                self.blocks[blockb] |= u64::MAX >> (64 - bitb);
            }
            // Fill in all the other blocks (much faster than one bit at a time).
            for block in (blocka + 1)..blockb {
                self.blocks[block] = u64::MAX;
            }
        } else {
            // Set `bita..64` to `0`.
            self.blocks[blocka] &= !(u64::MAX << bita);
            // Set `0..bitb` to `0`.
            if bitb != 0 {
                self.blocks[blockb] &= !(u64::MAX >> (64 - bitb));
            }
            // Fill in all the other blocks (much faster than one bit at a time).
            for block in (blocka + 1)..blockb {
                self.blocks[block] = 0;
            }
        }
    }

    #[inline]
    pub fn get(&self, i: Size) -> bool {
        let (block, bit) = Self::bit_index(i);
        (self.blocks[block] & (1 << bit)) != 0
    }

    #[inline]
    pub fn set(&mut self, i: Size, new_state: bool) {
        let (block, bit) = Self::bit_index(i);
        self.set_bit(block, bit, new_state);
    }

    #[inline]
    fn set_bit(&mut self, block: usize, bit: usize, new_state: bool) {
        if new_state {
            self.blocks[block] |= 1 << bit;
        } else {
            self.blocks[block] &= !(1 << bit);
        }
    }

    pub fn grow(&mut self, amount: Size, new_state: bool) {
        if amount.bytes() == 0 {
            return;
        }
        let unused_trailing_bits =
            u64::try_from(self.blocks.len()).unwrap() * Self::BLOCK_SIZE - self.len.bytes();
        if amount.bytes() > unused_trailing_bits {
            let additional_blocks = amount.bytes() / Self::BLOCK_SIZE + 1;
            self.blocks.extend(
                // FIXME(oli-obk): optimize this by repeating `new_state as Block`.
                iter::repeat(0).take(usize::try_from(additional_blocks).unwrap()),
            );
        }
        let start = self.len;
        self.len += amount;
        self.set_range_inbounds(start, start + amount, new_state); // `Size` operation
    }

    /// Returns the index of the first bit in `start..end` (end-exclusive) that is equal to `is_init`.
    fn find_bit(&self, start: Size, end: Size, is_init: bool) -> Option<Size> {
        /// A fast implementation of `find_bit`,
        /// which skips over an entire block at a time if it's all 0s (resp. 1s),
        /// and finds the first 1 (resp. 0) bit inside a block using `trailing_zeros` instead of a loop.
        ///
        /// Note that all examples below are written with 8 (instead of 64) bit blocks for simplicity,
        /// and with the least significant bit (and lowest block) first:
        ///
        ///        00000000|00000000
        ///        ^      ^ ^      ^
        /// index: 0      7 8      15
        ///
        /// Also, if not stated, assume that `is_init = true`, that is, we are searching for the first 1 bit.
        fn find_bit_fast(
            init_mask: &InitMask,
            start: Size,
            end: Size,
            is_init: bool,
        ) -> Option<Size> {
            /// Search one block, returning the index of the first bit equal to `is_init`.
            fn search_block(
                bits: Block,
                block: usize,
                start_bit: usize,
                is_init: bool,
            ) -> Option<Size> {
                // For the following examples, assume this function was called with:
                //   bits = 0b00111011
                //   start_bit = 3
                //   is_init = false
                // Note that, for the examples in this function, the most significant bit is written first,
                // which is backwards compared to the comments in `find_bit`/`find_bit_fast`.

                // Invert bits so we're always looking for the first set bit.
                //        ! 0b00111011
                //   bits = 0b11000100
                let bits = if is_init { bits } else { !bits };
                // Mask off unused start bits.
                //          0b11000100
                //        & 0b11111000
                //   bits = 0b11000000
                let bits = bits & (!0 << start_bit);
                // Find set bit, if any.
                //   bit = trailing_zeros(0b11000000)
                //   bit = 6
                if bits == 0 {
                    None
                } else {
                    let bit = bits.trailing_zeros();
                    Some(InitMask::size_from_bit_index(block, bit))
                }
            }

            if start >= end {
                return None;
            }

            // Convert `start` and `end` to block indexes and bit indexes within each block.
            // We must convert `end` to an inclusive bound to handle block boundaries correctly.
            //
            // For example:
            //
            //   (a) 00000000|00000000    (b) 00000000|
            //       ^~~~~~~~~~~^             ^~~~~~~~~^
            //       start       end          start    end
            //
            // In both cases, the block index of `end` is 1.
            // But we do want to search block 1 in (a), and we don't in (b).
            //
            // We subtract 1 from both end positions to make them inclusive:
            //
            //   (a) 00000000|00000000    (b) 00000000|
            //       ^~~~~~~~~~^              ^~~~~~~^
            //       start      end_inclusive start   end_inclusive
            //
            // For (a), the block index of `end_inclusive` is 1, and for (b), it's 0.
            // This provides the desired behavior of searching blocks 0 and 1 for (a),
            // and searching only block 0 for (b).
            // There is no concern of overflows since we checked for `start >= end` above.
            let (start_block, start_bit) = InitMask::bit_index(start);
            let end_inclusive = Size::from_bytes(end.bytes() - 1);
            let (end_block_inclusive, _) = InitMask::bit_index(end_inclusive);

            // Handle first block: need to skip `start_bit` bits.
            //
            // We need to handle the first block separately,
            // because there may be bits earlier in the block that should be ignored,
            // such as the bit marked (1) in this example:
            //
            //        (1)
            //       -|------
            //   (c) 01000000|00000000|00000001
            //       ^~~~~~~~~~~~~~~~~~^
            //       start              end
            if let Some(i) =
                search_block(init_mask.blocks[start_block], start_block, start_bit, is_init)
            {
                // If the range is less than a block, we may find a matching bit after `end`.
                //
                // For example, we shouldn't successfully find bit (2), because it's after `end`:
                //
                //              (2)
                //       -------|
                //   (d) 00000001|00000000|00000001
                //       ^~~~~^
                //       start end
                //
                // An alternative would be to mask off end bits in the same way as we do for start bits,
                // but performing this check afterwards is faster and simpler to implement.
                if i < end {
                    return Some(i);
                } else {
                    return None;
                }
            }

            // Handle remaining blocks.
            //
            // We can skip over an entire block at once if it's all 0s (resp. 1s).
            // The block marked (3) in this example is the first block that will be handled by this loop,
            // and it will be skipped for that reason:
            //
            //                   (3)
            //                --------
            //   (e) 01000000|00000000|00000001
            //       ^~~~~~~~~~~~~~~~~~^
            //       start              end
            if start_block < end_block_inclusive {
                // This loop is written in a specific way for performance.
                // Notably: `..end_block_inclusive + 1` is used for an inclusive range instead of `..=end_block_inclusive`,
                // and `.zip(start_block + 1..)` is used to track the index instead of `.enumerate().skip().take()`,
                // because both alternatives result in significantly worse codegen.
                // `end_block_inclusive + 1` is guaranteed not to wrap, because `end_block_inclusive <= end / BLOCK_SIZE`,
                // and `BLOCK_SIZE` (the number of bits per block) will always be at least 8 (1 byte).
                for (&bits, block) in init_mask.blocks[start_block + 1..end_block_inclusive + 1]
                    .iter()
                    .zip(start_block + 1..)
                {
                    if let Some(i) = search_block(bits, block, 0, is_init) {
                        // If this is the last block, we may find a matching bit after `end`.
                        //
                        // For example, we shouldn't successfully find bit (4), because it's after `end`:
                        //
                        //                               (4)
                        //                        -------|
                        //   (f) 00000001|00000000|00000001
                        //       ^~~~~~~~~~~~~~~~~~^
                        //       start              end
                        //
                        // As above with example (d), we could handle the end block separately and mask off end bits,
                        // but unconditionally searching an entire block at once and performing this check afterwards
                        // is faster and much simpler to implement.
                        if i < end {
                            return Some(i);
                        } else {
                            return None;
                        }
                    }
                }
            }

            None
        }

        #[cfg_attr(not(debug_assertions), allow(dead_code))]
        fn find_bit_slow(
            init_mask: &InitMask,
            start: Size,
            end: Size,
            is_init: bool,
        ) -> Option<Size> {
            (start..end).find(|&i| init_mask.get(i) == is_init)
        }

        let result = find_bit_fast(self, start, end, is_init);

        debug_assert_eq!(
            result,
            find_bit_slow(self, start, end, is_init),
            "optimized implementation of find_bit is wrong for start={:?} end={:?} is_init={} init_mask={:#?}",
            start,
            end,
            is_init,
            self
        );

        result
    }
}

/// A contiguous chunk of initialized or uninitialized memory.
pub enum InitChunk {
    Init(Range<Size>),
    Uninit(Range<Size>),
}

impl InitChunk {
    #[inline]
    pub fn is_init(&self) -> bool {
        match self {
            Self::Init(_) => true,
            Self::Uninit(_) => false,
        }
    }

    #[inline]
    pub fn range(&self) -> Range<Size> {
        match self {
            Self::Init(r) => r.clone(),
            Self::Uninit(r) => r.clone(),
        }
    }
}

impl InitMask {
    /// Checks whether the range `start..end` (end-exclusive) is entirely initialized.
    ///
    /// Returns `Ok(())` if it's initialized. Otherwise returns a range of byte
    /// indexes for the first contiguous span of the uninitialized access.
    #[inline]
    pub fn is_range_initialized(&self, start: Size, end: Size) -> Result<(), Range<Size>> {
        if end > self.len {
            return Err(self.len..end);
        }

        let uninit_start = self.find_bit(start, end, false);

        match uninit_start {
            Some(uninit_start) => {
                let uninit_end = self.find_bit(uninit_start, end, true).unwrap_or(end);
                Err(uninit_start..uninit_end)
            }
            None => Ok(()),
        }
    }

    /// Returns an iterator, yielding a range of byte indexes for each contiguous region
    /// of initialized or uninitialized bytes inside the range `start..end` (end-exclusive).
    ///
    /// The iterator guarantees the following:
    /// - Chunks are nonempty.
    /// - Chunks are adjacent (each range's start is equal to the previous range's end).
    /// - Chunks span exactly `start..end` (the first starts at `start`, the last ends at `end`).
    /// - Chunks alternate between [`InitChunk::Init`] and [`InitChunk::Uninit`].
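    ///
    /// For example, for a mask whose bytes `0..3` are initialized and whose bytes `3..8` are not,
    /// iterating over `0..8` yields `Init(0..3)` followed by `Uninit(3..8)`.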
    #[inline]
    pub fn range_as_init_chunks(&self, start: Size, end: Size) -> InitChunkIter<'_> {
        assert!(end <= self.len);

        let is_init = if start < end {
            self.get(start)
        } else {
            // `start..end` is empty: there are no chunks, so use some arbitrary value
            false
        };

        InitChunkIter { init_mask: self, is_init, start, end }
    }
}

/// Yields [`InitChunk`]s. See [`InitMask::range_as_init_chunks`].
#[derive(Clone)]
pub struct InitChunkIter<'a> {
    init_mask: &'a InitMask,
    /// Whether the next chunk we will return is initialized.
    /// If there are no more chunks, contains some arbitrary value.
    is_init: bool,
    /// The current byte index into `init_mask`.
    start: Size,
    /// The end byte index into `init_mask`.
    end: Size,
}

impl<'a> Iterator for InitChunkIter<'a> {
    type Item = InitChunk;

    #[inline]
    fn next(&mut self) -> Option<Self::Item> {
        if self.start >= self.end {
            return None;
        }

        let end_of_chunk =
            self.init_mask.find_bit(self.start, self.end, !self.is_init).unwrap_or(self.end);
        let range = self.start..end_of_chunk;

        let ret =
            Some(if self.is_init { InitChunk::Init(range) } else { InitChunk::Uninit(range) });

        self.is_init = !self.is_init;
        self.start = end_of_chunk;

        ret
    }
}
|
|
|
|
|
|
2021-08-14 14:13:06 -04:00
|
|
|
/// Uninitialized bytes.
|
|
|
|
|
impl<Tag: Copy, Extra> Allocation<Tag, Extra> {
|
|
|
|
|
/// Checks whether the given range is entirely initialized.
|
2021-08-14 13:54:35 -04:00
|
|
|
///
|
2021-08-14 14:13:06 -04:00
|
|
|
/// Returns `Ok(())` if it's initialized. Otherwise returns the range of byte
|
|
|
|
|
/// indexes of the first contiguous uninitialized access.
|
|
|
|
|
fn is_init(&self, range: AllocRange) -> Result<(), Range<Size>> {
|
|
|
|
|
self.init_mask.is_range_initialized(range.start, range.end()) // `Size` addition
|
|
|
|
|
}
|
2021-08-10 19:29:18 -04:00
|
|
|
|
2021-08-14 14:13:06 -04:00
|
|
|
/// Checks that a range of bytes is initialized. If not, returns the `InvalidUninitBytes`
|
|
|
|
|
/// error which will report the first range of bytes which is uninitialized.
|
|
|
|
|
fn check_init(&self, range: AllocRange) -> AllocResult {
|
2021-10-16 10:18:17 +02:00
|
|
|
self.is_init(range).map_err(|idx_range| {
|
|
|
|
|
AllocError::InvalidUninitBytes(Some(UninitBytesAccess {
|
2021-08-14 14:13:06 -04:00
|
|
|
access_offset: range.start,
|
|
|
|
|
access_size: range.size,
|
|
|
|
|
uninit_offset: idx_range.start,
|
|
|
|
|
uninit_size: idx_range.end - idx_range.start, // `Size` subtraction
|
2021-10-16 10:18:17 +02:00
|
|
|
}))
|
2021-08-14 14:13:06 -04:00
|
|
|
})
|
|
|
|
|
}
|
2021-08-10 19:29:18 -04:00
|
|
|
|
2022-04-17 19:16:54 -04:00
|
|
|
fn mark_init(&mut self, range: AllocRange, is_init: bool) {
|
2021-08-14 14:13:06 -04:00
|
|
|
if range.size.bytes() == 0 {
|
|
|
|
|
return;
|
2021-08-10 19:29:18 -04:00
|
|
|
}
|
2021-08-14 14:13:06 -04:00
|
|
|
assert!(self.mutability == Mutability::Mut);
|
|
|
|
|
self.init_mask.set_range(range.start, range.end(), is_init);
|
|
|
|
|
}
|
|
|
|
|
}
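
// A sketch of the error path, again for the hypothetical mask above: calling `check_init`
// on a 4-byte range starting at offset 0 would produce an `InvalidUninitBytes` error whose
// `UninitBytesAccess` records the attempted access (`access_offset` 0, `access_size` 4) and
// the first uninitialized span (`uninit_offset` 2, `uninit_size` 2).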

/// Run-length encoding of the uninit mask.
/// Used to copy parts of a mask multiple times to another allocation.
pub struct InitMaskCompressed {
    /// Whether the first range is initialized.
    initial: bool,
    /// The lengths of the run-length encoded ranges.
    /// The initialization state of the ranges alternates, starting with `initial`.
    ranges: smallvec::SmallVec<[u64; 1]>,
}

impl InitMaskCompressed {
    pub fn no_bytes_init(&self) -> bool {
        // The `ranges` are run-length encoded and of alternating initialization state.
        // So if `ranges.len() > 1` then the second block is an initialized range.
        !self.initial && self.ranges.len() == 1
    }
}
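
// A worked example for this encoding (hypothetical values): a 5-byte mask whose bytes are
// init, init, init, uninit, uninit compresses to `initial = true, ranges = [3, 2]`, and
// `no_bytes_init()` is `false`. A fully uninitialized 5-byte mask compresses to
// `initial = false, ranges = [5]`, for which `no_bytes_init()` returns `true`.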

/// Transferring the initialization mask to other allocations.
impl<Tag, Extra> Allocation<Tag, Extra> {
    /// Creates a run-length encoding of the initialization mask; panics if range is empty.
    ///
    /// This is essentially a more space-efficient version of
    /// `InitMask::range_as_init_chunks(...).collect::<Vec<_>>()`.
    pub fn compress_uninit_range(&self, range: AllocRange) -> InitMaskCompressed {
        // Since we are copying `size` bytes from `src` to `dest + i * size` (`for i in 0..repeat`),
        // a naive initialization mask copying algorithm would repeatedly have to read the initialization mask from
        // the source and write it to the destination. Even if we optimized the memory accesses,
        // we'd be doing all of this `repeat` times.
        // Therefore we precompute a compressed version of the initialization mask of the source value and
        // then write it back `repeat` times without computing any more information from the source.

        // A precomputed cache for ranges of initialized / uninitialized bits:
        // 0000010010001110 will become
        // `[5, 1, 2, 1, 3, 3, 1]`,
        // where each element toggles the state.
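        // (If `0` denotes an uninitialized bit here, the first chunk of that example is
        // uninitialized, so `initial` below would be `false`.)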

        let mut ranges = smallvec::SmallVec::<[u64; 1]>::new();

        let mut chunks = self.init_mask.range_as_init_chunks(range.start, range.end()).peekable();

        let initial = chunks.peek().expect("range should be nonempty").is_init();

        // Here we rely on `range_as_init_chunks` to yield alternating init/uninit chunks.
        for chunk in chunks {
            let len = chunk.range().end.bytes() - chunk.range().start.bytes();
            ranges.push(len);
        }

        InitMaskCompressed { ranges, initial }
    }

    /// Applies multiple instances of the run-length encoding to the initialization mask.
    ///
    /// This is dangerous to use as it can violate internal `Allocation` invariants!
    /// It only exists to support an efficient implementation of `mem_copy_repeatedly`.
    pub fn mark_compressed_init_range(
        &mut self,
        defined: &InitMaskCompressed,
        range: AllocRange,
        repeat: u64,
    ) {
        // An optimization where we can just overwrite an entire range of initialization
        // bits if they are going to be uniformly `1` or `0`.
        if defined.ranges.len() <= 1 {
            self.init_mask.set_range_inbounds(
                range.start,
                range.start + range.size * repeat, // `Size` operations
                defined.initial,
            );
            return;
        }
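
        // General case: replay the alternating run lengths once per repetition. A worked
        // example with hypothetical values: `initial = true`, `ranges = [2, 3]`, a 5-byte
        // `range` starting at offset 0, and `repeat = 2` marks bytes 0..2 and 5..7 as
        // initialized and bytes 2..5 and 7..10 as uninitialized.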
        for mut j in 0..repeat {
            j *= range.size.bytes();
            j += range.start.bytes();
            let mut cur = defined.initial;
            for range in &defined.ranges {
                let old_j = j;
                j += range;
                self.init_mask.set_range_inbounds(
                    Size::from_bytes(old_j),
                    Size::from_bytes(j),
                    cur,
                );
                cur = !cur;
            }
        }
    }
}
|