summaryrefslogtreecommitdiffstats
path: root/third_party/rust/gpu-alloc/src/block.rs
diff options
context:
space:
mode:
Diffstat (limited to 'third_party/rust/gpu-alloc/src/block.rs')
-rw-r--r--third_party/rust/gpu-alloc/src/block.rs351
1 files changed, 351 insertions, 0 deletions
diff --git a/third_party/rust/gpu-alloc/src/block.rs b/third_party/rust/gpu-alloc/src/block.rs
new file mode 100644
index 0000000000..b1093fd83c
--- /dev/null
+++ b/third_party/rust/gpu-alloc/src/block.rs
@@ -0,0 +1,351 @@
+use {
+ crate::{align_down, align_up, error::MapError},
+ core::{
+ convert::TryFrom as _,
+ ptr::{copy_nonoverlapping, NonNull},
+ sync::atomic::{AtomicU8, Ordering::*},
+ },
+ gpu_alloc_types::{MappedMemoryRange, MemoryDevice, MemoryPropertyFlags},
+};
+
+#[derive(Debug)]
+struct Relevant;
+
+impl Drop for Relevant {
+ #[cfg(feature = "tracing")]
+ fn drop(&mut self) {
+ tracing::error!("Memory block wasn't deallocated");
+ }
+
+ #[cfg(all(not(feature = "tracing"), feature = "std"))]
+ fn drop(&mut self) {
+ eprintln!("Memory block wasn't deallocated")
+ }
+
+ #[cfg(all(not(feature = "tracing"), not(feature = "std")))]
+ fn drop(&mut self) {
+ panic!("Memory block wasn't deallocated")
+ }
+}
+
+const MAPPING_STATE_UNMAPPED: u8 = 0;
+const MAPPING_STATE_MAPPED: u8 = 1;
+const MAPPING_STATE_UNMAPPING: u8 = 2;
+
+/// Memory block allocated by `GpuAllocator`.
+#[derive(Debug)]
+pub struct MemoryBlock<M> {
+ memory: M,
+ memory_type: u32,
+ props: MemoryPropertyFlags,
+ offset: u64,
+ size: u64,
+ atom_mask: u64,
+ mapped: AtomicU8,
+ flavor: MemoryBlockFlavor,
+ relevant: Relevant,
+}
+
+impl<M> MemoryBlock<M> {
+ pub(crate) fn new(
+ memory: M,
+ memory_type: u32,
+ props: MemoryPropertyFlags,
+ offset: u64,
+ size: u64,
+ atom_mask: u64,
+ flavor: MemoryBlockFlavor,
+ ) -> Self {
+ MemoryBlock {
+ memory,
+ memory_type,
+ props,
+ offset,
+ size,
+ atom_mask,
+ flavor,
+ mapped: AtomicU8::new(MAPPING_STATE_UNMAPPED),
+ relevant: Relevant,
+ }
+ }
+
+ pub(crate) fn deallocate(self) -> (M, MemoryBlockFlavor) {
+ core::mem::forget(self.relevant);
+ (self.memory, self.flavor)
+ }
+}
+
+unsafe impl<M> Sync for MemoryBlock<M> where M: Sync {}
+unsafe impl<M> Send for MemoryBlock<M> where M: Send {}
+
+#[derive(Debug)]
+pub(crate) enum MemoryBlockFlavor {
+ Dedicated,
+ Linear {
+ chunk: u64,
+ ptr: Option<NonNull<u8>>,
+ },
+ Buddy {
+ chunk: usize,
+ index: usize,
+ ptr: Option<NonNull<u8>>,
+ },
+}
+
+impl<M> MemoryBlock<M> {
+ /// Returns reference to parent memory object.
+ #[inline(always)]
+ pub fn memory(&self) -> &M {
+ &self.memory
+ }
+
+ /// Returns offset in bytes from start of memory object to start of this block.
+ #[inline(always)]
+ pub fn offset(&self) -> u64 {
+ self.offset
+ }
+
+ /// Returns size of this memory block.
+ #[inline(always)]
+ pub fn size(&self) -> u64 {
+ self.size
+ }
+
+ /// Returns memory property flags for parent memory object.
+ #[inline(always)]
+ pub fn props(&self) -> MemoryPropertyFlags {
+ self.props
+ }
+
+ /// Returns index of type of parent memory object.
+ #[inline(always)]
+ pub fn memory_type(&self) -> u32 {
+ self.memory_type
+ }
+
+ /// Returns pointer to mapped memory range of this block.
+ /// This blocks becomes mapped.
+ ///
+ /// The user of returned pointer must guarantee that any previously submitted command that writes to this range has completed
+ /// before the host reads from or writes to that range,
+ /// and that any previously submitted command that reads from that range has completed
+ /// before the host writes to that region.
+ /// If the device memory was allocated without the `HOST_COHERENT` property flag set,
+ /// these guarantees must be made for an extended range:
+ /// the user must round down the start of the range to the nearest multiple of `non_coherent_atom_size`,
+ /// and round the end of the range up to the nearest multiple of `non_coherent_atom_size`.
+ ///
+ /// # Panics
+ ///
+ /// This function panics if block is currently mapped.
+ ///
+ /// # Safety
+ ///
+ /// `block` must have been allocated from specified `device`.
+ #[inline(always)]
+ pub unsafe fn map(
+ &self,
+ device: &impl MemoryDevice<M>,
+ offset: u64,
+ size: usize,
+ ) -> Result<NonNull<u8>, MapError> {
+ let size_u64 = u64::try_from(size).expect("`size` doesn't fit device address space");
+ let size = align_up(size_u64, self.atom_mask)
+ .expect("aligned `size` doesn't fit device address space");
+
+ let aligned_offset = align_down(offset, self.atom_mask);
+
+ assert!(offset < self.size, "`offset` is out of memory block bounds");
+ assert!(
+ size_u64 <= self.size - offset,
+ "`offset + size` is out of memory block bounds"
+ );
+
+ let ptr = match self.flavor {
+ MemoryBlockFlavor::Dedicated => {
+ let offset_align_shift = offset - aligned_offset;
+ let offset_align_shift = isize::try_from(offset_align_shift)
+ .expect("`non_coherent_atom_size` is too large");
+
+ if !self.acquire_mapping() {
+ return Err(MapError::AlreadyMapped);
+ }
+ let aligned_size = offset + size - aligned_offset;
+ let result =
+ device.map_memory(&self.memory, self.offset + aligned_offset, aligned_size);
+
+ match result {
+ Ok(ptr) => ptr.as_ptr().offset(offset_align_shift),
+ Err(err) => {
+ self.mapping_failed();
+ return Err(err.into());
+ }
+ }
+ }
+ MemoryBlockFlavor::Linear { ptr: Some(ptr), .. }
+ | MemoryBlockFlavor::Buddy { ptr: Some(ptr), .. } => {
+ if !self.acquire_mapping() {
+ return Err(MapError::AlreadyMapped);
+ }
+
+ let offset_isize = isize::try_from(offset)
+ .expect("Buddy and linear block should fit host address space");
+ ptr.as_ptr().offset(offset_isize)
+ }
+ _ => return Err(MapError::NonHostVisible),
+ };
+
+ Ok(NonNull::new_unchecked(ptr))
+ }
+
+ /// Unmaps memory range of this block that was previously mapped with `Block::map`.
+ /// This block becomes unmapped.
+ ///
+ /// # Panics
+ ///
+ /// This function panics if this block is not currently mapped.
+ ///
+ /// # Safety
+ ///
+ /// `block` must have been allocated from specified `device`.
+ #[inline(always)]
+ pub unsafe fn unmap(&self, device: &impl MemoryDevice<M>) -> bool {
+ if !self.start_unmapping() {
+ return false;
+ }
+ match self.flavor {
+ MemoryBlockFlavor::Dedicated => {
+ device.unmap_memory(&self.memory);
+ }
+ MemoryBlockFlavor::Linear { .. } => {}
+ MemoryBlockFlavor::Buddy { .. } => {}
+ }
+ self.end_unmapping();
+ true
+ }
+
+ /// Transiently maps block memory range and copies specified data
+ /// to the mapped memory range.
+ ///
+ /// # Panics
+ ///
+ /// This function panics if block is currently mapped.
+ ///
+ /// # Safety
+ ///
+ /// `block` must have been allocated from specified `device`.
+ /// The caller must guarantee that any previously submitted command that reads or writes to this range has completed.
+ #[inline(always)]
+ pub unsafe fn write_bytes(
+ &self,
+ device: &impl MemoryDevice<M>,
+ offset: u64,
+ data: &[u8],
+ ) -> Result<(), MapError> {
+ let size = data.len();
+ let ptr = self.map(device, offset, size)?;
+
+ copy_nonoverlapping(data.as_ptr(), ptr.as_ptr(), size);
+ let result = if !self.coherent() {
+ let aligned_offset = align_down(offset, self.atom_mask);
+ let size = align_up(data.len() as u64, self.atom_mask).unwrap();
+
+ device.flush_memory_ranges(&[MappedMemoryRange {
+ memory: &self.memory,
+ offset: aligned_offset,
+ size,
+ }])
+ } else {
+ Ok(())
+ };
+
+ self.unmap(device);
+ result.map_err(Into::into)
+ }
+
+ /// Transiently maps block memory range and copies specified data
+ /// from the mapped memory range.
+ ///
+ /// # Panics
+ ///
+ /// This function panics if block is currently mapped.
+ ///
+ /// # Safety
+ ///
+ /// `block` must have been allocated from specified `device`.
+ /// The caller must guarantee that any previously submitted command that reads to this range has completed.
+ #[inline(always)]
+ pub unsafe fn read_bytes(
+ &self,
+ device: &impl MemoryDevice<M>,
+ offset: u64,
+ data: &mut [u8],
+ ) -> Result<(), MapError> {
+ #[cfg(feature = "tracing")]
+ {
+ if !self.cached() {
+ tracing::warn!("Reading from non-cached memory may be slow. Consider allocating HOST_CACHED memory block for host reads.")
+ }
+ }
+
+ let size = data.len();
+ let ptr = self.map(device, offset, size)?;
+ let result = if !self.coherent() {
+ let aligned_offset = align_down(offset, self.atom_mask);
+ let size = align_up(data.len() as u64, self.atom_mask).unwrap();
+
+ device.invalidate_memory_ranges(&[MappedMemoryRange {
+ memory: &self.memory,
+ offset: aligned_offset,
+ size,
+ }])
+ } else {
+ Ok(())
+ };
+ if result.is_ok() {
+ copy_nonoverlapping(ptr.as_ptr(), data.as_mut_ptr(), size);
+ }
+
+ self.unmap(device);
+ result.map_err(Into::into)
+ }
+
+ fn acquire_mapping(&self) -> bool {
+ self.mapped
+ .compare_exchange(
+ MAPPING_STATE_UNMAPPED,
+ MAPPING_STATE_MAPPED,
+ Acquire,
+ Relaxed,
+ )
+ .is_ok()
+ }
+
+ fn mapping_failed(&self) {
+ self.mapped.store(MAPPING_STATE_UNMAPPED, Relaxed);
+ }
+
+ fn start_unmapping(&self) -> bool {
+ self.mapped
+ .compare_exchange(
+ MAPPING_STATE_MAPPED,
+ MAPPING_STATE_UNMAPPING,
+ Release,
+ Relaxed,
+ )
+ .is_ok()
+ }
+
+ fn end_unmapping(&self) {
+ self.mapped.store(MAPPING_STATE_UNMAPPED, Relaxed);
+ }
+
+ fn coherent(&self) -> bool {
+ self.props.contains(MemoryPropertyFlags::HOST_COHERENT)
+ }
+
+ #[cfg(feature = "tracing")]
+ fn cached(&self) -> bool {
+ self.props.contains(MemoryPropertyFlags::HOST_CACHED)
+ }
+}