Access buffer data through mapping

This patch includes a number of changes to encourage reading and writing
buffers through mapping rather than copying data as before.

This includes a new `BufWrite` abstraction which is designed for filling
buffers. It behaves much like a Vec<u8>, but with fixed capacity.
This commit is contained in:
Raph Levien 2021-11-25 13:12:25 -08:00
parent 5af8aa5e52
commit 9fb2ae91eb
14 changed files with 499 additions and 158 deletions

View file

@ -16,7 +16,7 @@
//! The generic trait for backends to implement.
use crate::{BindType, BufferUsage, Error, GpuInfo, ImageLayout, SamplerParams};
use crate::{BindType, BufferUsage, Error, GpuInfo, ImageLayout, MapMode, SamplerParams};
pub trait Device: Sized {
type Buffer: 'static;
@ -114,36 +114,33 @@ pub trait Device: Sized {
fence: Option<&mut Self::Fence>,
) -> Result<(), Error>;
/// Copy data from the buffer to memory.
///
/// Discussion question: add offset?
/// Map the buffer into addressable memory.
///
/// # Safety
///
/// The buffer must be valid to access. The destination memory must be valid to
/// write to. The ranges must not overlap. The offset + size must be within
/// the buffer's allocation, and size within the destination.
unsafe fn read_buffer(
/// The buffer must be valid to access. The offset + size much be within the
/// buffer's allocation. The buffer must not already be mapped. Of course,
/// the usual safety rules apply to the returned pointer.
unsafe fn map_buffer(
&self,
buffer: &Self::Buffer,
dst: *mut u8,
offset: u64,
size: u64,
) -> Result<(), Error>;
mode: MapMode,
) -> Result<*mut u8, Error>;
/// Copy data from memory to the buffer.
/// Map the buffer into addressable memory.
///
/// # Safety
///
/// The buffer must be valid to access. The source memory must be valid to
/// read from. The ranges must not overlap. The offset + size must be within
/// the buffer's allocation, and size within the source.
unsafe fn write_buffer(
/// The buffer must be mapped. The parameters must be the same as the map
/// call.
unsafe fn unmap_buffer(
&self,
buffer: &Self::Buffer,
contents: *const u8,
offset: u64,
size: u64,
mode: MapMode,
) -> Result<(), Error>;
unsafe fn create_semaphore(&self) -> Result<Self::Semaphore, Error>;

View file

@ -0,0 +1,117 @@
// Copyright © 2021 piet-gpu developers.
//
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
// option. This file may not be copied, modified, or distributed
// except according to those
//! An abstraction for writing to GPU buffers.
use bytemuck::Pod;
/// A GPU buffer to be filled.
pub struct BufWrite {
ptr: *mut u8,
len: usize,
capacity: usize,
}
impl BufWrite {
pub(crate) fn new(ptr: *mut u8, len: usize, capacity: usize) -> BufWrite {
BufWrite { ptr, len, capacity }
}
/// Append a plain data object to the buffer.
///
/// Panics if capacity is inadequate.
#[inline]
pub fn push(&mut self, item: &impl Pod) {
self.push_bytes(bytemuck::bytes_of(item));
}
/// Extend with a slice of plain data objects.
///
/// Panics if capacity is inadequate.
#[inline]
pub fn extend_slice(&mut self, slice: &[impl Pod]) {
self.push_bytes(bytemuck::cast_slice(slice));
}
/// Extend with a byte slice.
///
/// Panics if capacity is inadequate.
#[inline]
pub fn push_bytes(&mut self, bytes: &[u8]) {
let len = bytes.len();
assert!(self.capacity - self.len >= len);
unsafe {
std::ptr::copy_nonoverlapping(bytes.as_ptr(), self.ptr.add(self.len), len);
}
self.len += len;
}
/// Extend with zeros.
///
/// Panics if capacity is inadequate.
#[inline]
pub fn fill_zero(&mut self, len: usize) {
assert!(self.capacity - self.len >= len);
unsafe {
let slice = std::slice::from_raw_parts_mut(self.ptr.add(self.len), len);
slice.fill(0);
}
self.len += len;
}
/// The total capacity of the buffer, in bytes.
#[inline]
pub fn capacity(&self) -> usize {
self.capacity
}
/// Extend with an iterator over plain data objects.
///
/// Currently, this doesn't panic, just truncates. That may change.
pub fn extend<'a, I, T: Pod + 'a>(&mut self, iter: I)
where
I: IntoIterator<Item = &'a T>,
{
let item_size = std::mem::size_of::<T>();
if item_size == 0 {
return;
}
let mut iter = iter.into_iter();
let n_remaining = (self.capacity - self.len) / item_size;
unsafe {
let mut dst = self.ptr.add(self.len);
for _ in 0..n_remaining {
if let Some(item) = iter.next() {
std::ptr::copy_nonoverlapping(
bytemuck::bytes_of(item).as_ptr(),
dst,
item_size,
);
self.len += item_size;
dst = dst.add(item_size);
} else {
break;
}
}
}
// TODO: should we test the iter and panic on overflow?
}
}
impl std::ops::Deref for BufWrite {
type Target = [u8];
fn deref(&self) -> &[u8] {
unsafe { std::slice::from_raw_parts(self.ptr, self.len) }
}
}
impl std::ops::DerefMut for BufWrite {
fn deref_mut(&mut self) -> &mut [u8] {
unsafe { std::slice::from_raw_parts_mut(self.ptr, self.len) }
}
}

View file

@ -21,7 +21,7 @@ use raw_window_handle::{HasRawWindowHandle, RawWindowHandle};
use smallvec::SmallVec;
use crate::{BindType, BufferUsage, Error, GpuInfo, ImageLayout, WorkgroupLimits};
use crate::{BindType, BufferUsage, Error, GpuInfo, ImageLayout, MapMode, WorkgroupLimits};
use self::{
descriptor::{CpuHeapRefOwned, DescriptorPool, GpuHeapRefOwned},
@ -381,12 +381,10 @@ impl crate::backend::Device for Dx12Device {
unsafe fn fetch_query_pool(&self, pool: &Self::QueryPool) -> Result<Vec<f64>, Error> {
let mut buf = vec![0u64; pool.n_queries as usize];
self.read_buffer(
&pool.buf,
buf.as_mut_ptr() as *mut u8,
0,
mem::size_of_val(buf.as_slice()) as u64,
)?;
let size = mem::size_of_val(buf.as_slice());
let mapped = self.map_buffer(&pool.buf, 0, size as u64, MapMode::Read)?;
std::ptr::copy_nonoverlapping(mapped, buf.as_mut_ptr() as *mut u8, size);
self.unmap_buffer(&pool.buf, 0, size as u64, MapMode::Read)?;
let ts0 = buf[0];
let tsp = (self.ts_freq as f64).recip();
let result = buf[1..]
@ -418,29 +416,25 @@ impl crate::backend::Device for Dx12Device {
Ok(())
}
unsafe fn read_buffer(
unsafe fn map_buffer(
&self,
buffer: &Self::Buffer,
dst: *mut u8,
offset: u64,
size: u64,
) -> Result<(), Error> {
buffer
.resource
.read_resource(dst, offset as usize, size as usize)?;
Ok(())
mode: MapMode,
) -> Result<*mut u8, Error> {
let mapped = buffer.resource.map_buffer(offset, size, mode)?;
Ok(mapped)
}
unsafe fn write_buffer(
unsafe fn unmap_buffer(
&self,
buffer: &Self::Buffer,
contents: *const u8,
offset: u64,
size: u64,
mode: MapMode,
) -> Result<(), Error> {
buffer
.resource
.write_resource(contents, offset as usize, size as usize)?;
buffer.resource.unmap_buffer(offset, size, mode)?;
Ok(())
}

View file

@ -7,6 +7,7 @@
// except according to those terms.
use crate::dx12::error::{self, error_if_failed_else_unit, explain_error, Error};
use crate::MapMode;
use smallvec::SmallVec;
use std::convert::{TryFrom, TryInto};
use std::sync::atomic::{AtomicPtr, Ordering};
@ -105,46 +106,38 @@ impl Resource {
self.ptr.store(ptr::null_mut(), Ordering::Relaxed);
}
pub unsafe fn write_resource(
pub unsafe fn map_buffer(
&self,
data: *const u8,
offset: usize,
size: usize,
) -> Result<(), Error> {
offset: u64,
size: u64,
mode: MapMode,
) -> Result<*mut u8, Error> {
let mut mapped_memory: *mut u8 = ptr::null_mut();
let zero_range = d3d12::D3D12_RANGE { ..mem::zeroed() };
let range = d3d12::D3D12_RANGE {
Begin: offset,
End: offset + size,
let (begin, end) = match mode {
MapMode::Read => (offset as usize, (offset + size) as usize),
MapMode::Write => (0, 0),
};
explain_error(
(*self.get()).Map(0, &zero_range, &mut mapped_memory as *mut _ as *mut _),
"could not map GPU mem to CPU mem",
)?;
ptr::copy_nonoverlapping(data, mapped_memory.add(offset), size);
(*self.get()).Unmap(0, &range);
Ok(())
}
pub unsafe fn read_resource(
&self,
dst: *mut u8,
offset: usize,
size: usize,
) -> Result<(), Error> {
let mut mapped_memory: *mut u8 = ptr::null_mut();
let range = d3d12::D3D12_RANGE {
Begin: offset,
End: offset + size,
Begin: begin,
End: end,
};
let zero_range = d3d12::D3D12_RANGE { ..mem::zeroed() };
explain_error(
(*self.get()).Map(0, &range, &mut mapped_memory as *mut _ as *mut _),
"could not map GPU mem to CPU mem",
)?;
ptr::copy_nonoverlapping(mapped_memory.add(offset), dst, size);
(*self.get()).Unmap(0, &zero_range);
Ok(mapped_memory.add(offset as usize))
}
pub unsafe fn unmap_buffer(&self, offset: u64, size: u64, mode: MapMode) -> Result<(), Error> {
let (begin, end) = match mode {
MapMode::Read => (0, 0),
MapMode::Write => (offset as usize, (offset + size) as usize),
};
let range = d3d12::D3D12_RANGE {
Begin: begin,
End: end,
};
(*self.get()).Unmap(0, &range);
Ok(())
}
}

View file

@ -7,12 +7,13 @@
//! even more in time.
use std::convert::TryInto;
use std::ops::{Bound, RangeBounds};
use std::sync::{Arc, Mutex, Weak};
use bytemuck::Pod;
use smallvec::SmallVec;
use crate::{mux, BackendType};
use crate::{mux, BackendType, BufWrite, MapMode};
use crate::{BindType, BufferUsage, Error, GpuInfo, ImageLayout, SamplerParams};
@ -112,6 +113,28 @@ pub enum RetainResource {
Image(Image),
}
/// A buffer mapped for writing.
///
/// When this structure is dropped, the buffer will be unmapped.
pub struct BufWriteGuard<'a> {
buf_write: BufWrite,
session: Arc<SessionInner>,
buffer: &'a mux::Buffer,
offset: u64,
size: u64,
}
/// A buffer mapped for reading.
///
/// When this structure is dropped, the buffer will be unmapped.
pub struct BufReadGuard<'a> {
bytes: &'a [u8],
session: Arc<SessionInner>,
buffer: &'a mux::Buffer,
offset: u64,
size: u64,
}
impl Session {
/// Create a new session, choosing the best backend.
pub fn new(device: mux::Device) -> Session {
@ -232,20 +255,24 @@ impl Session {
contents: &[impl Pod],
usage: BufferUsage,
) -> Result<Buffer, Error> {
unsafe {
let size = std::mem::size_of_val(contents);
let bytes = bytemuck::cast_slice(contents);
self.create_buffer_init_raw(bytes.as_ptr(), bytes.len().try_into()?, usage)
}
self.create_buffer_with(size as u64, |b| b.push_bytes(bytes), usage)
}
/// Create a buffer with initialized data, from a raw pointer memory region.
pub unsafe fn create_buffer_init_raw(
/// Create a buffer with initialized data.
///
/// The buffer is filled by the provided function. The same details about
/// staging buffers apply as [`create_buffer_init`].
pub fn create_buffer_with(
&self,
contents: *const u8,
size: u64,
f: impl Fn(&mut BufWrite),
usage: BufferUsage,
) -> Result<Buffer, Error> {
let use_staging_buffer = !usage.intersects(BufferUsage::MAP_READ | BufferUsage::MAP_WRITE)
unsafe {
let use_staging_buffer = !usage
.intersects(BufferUsage::MAP_READ | BufferUsage::MAP_WRITE)
&& self.gpu_info().use_staging_buffers;
let create_usage = if use_staging_buffer {
BufferUsage::MAP_WRITE | BufferUsage::COPY_SRC
@ -253,9 +280,15 @@ impl Session {
usage | BufferUsage::MAP_WRITE
};
let create_buf = self.create_buffer(size, create_usage)?;
let mapped =
self.0
.device
.write_buffer(&create_buf.mux_buffer(), contents, 0, size)?;
.map_buffer(&create_buf.mux_buffer(), 0, size, MapMode::Write)?;
let mut buf_write = BufWrite::new(mapped, 0, size as usize);
f(&mut buf_write);
self.0
.device
.unmap_buffer(&create_buf.mux_buffer(), 0, size, MapMode::Write)?;
if use_staging_buffer {
let buf = self.create_buffer(size, usage | BufferUsage::COPY_DST)?;
let mut staging_cmd_buf = self.0.staging_cmd_buf.lock().unwrap();
@ -273,6 +306,7 @@ impl Session {
Ok(create_buf)
}
}
}
/// Create an image.
///
@ -669,12 +703,22 @@ impl Buffer {
pub unsafe fn write(&mut self, contents: &[impl Pod]) -> Result<(), Error> {
let bytes = bytemuck::cast_slice(contents);
if let Some(session) = Weak::upgrade(&self.0.session) {
session.device.write_buffer(
&self.0.buffer,
bytes.as_ptr(),
0,
bytes.len().try_into()?,
)?;
let size = bytes.len().try_into()?;
let buf_size = self.0.buffer.size();
if size > buf_size {
return Err(format!(
"Trying to write {} bytes into buffer of size {}",
size, buf_size
)
.into());
}
let mapped = session
.device
.map_buffer(&self.0.buffer, 0, size, MapMode::Write)?;
std::ptr::copy_nonoverlapping(bytes.as_ptr(), mapped, bytes.len());
session
.device
.unmap_buffer(&self.0.buffer, 0, size, MapMode::Write)?;
}
// else session lost error?
Ok(())
@ -694,15 +738,115 @@ impl Buffer {
result.reserve(len - result.len());
}
if let Some(session) = Weak::upgrade(&self.0.session) {
let mapped = session
.device
.map_buffer(&self.0.buffer, 0, size, MapMode::Read)?;
std::ptr::copy_nonoverlapping(mapped, result.as_mut_ptr() as *mut u8, size as usize);
session
.device
.read_buffer(&self.0.buffer, result.as_mut_ptr() as *mut u8, 0, size)?;
.unmap_buffer(&self.0.buffer, 0, size, MapMode::Read)?;
result.set_len(len);
}
// else session lost error?
Ok(())
}
/// Map a buffer for writing.
///
/// The mapped buffer is represented by a "guard" structure, which will unmap
/// the buffer when it's dropped. That also has a number of methods for pushing
/// bytes and [`bytemuck::Pod`] objects.
///
/// The buffer must have been created with `MAP_WRITE` usage.
pub unsafe fn map_write<'a>(
&'a mut self,
range: impl RangeBounds<usize>,
) -> Result<BufWriteGuard<'a>, Error> {
let offset = match range.start_bound() {
Bound::Unbounded => 0,
Bound::Included(&s) => s.try_into()?,
Bound::Excluded(_) => unreachable!(),
};
let end = match range.end_bound() {
Bound::Unbounded => self.size(),
Bound::Included(&s) => s.try_into()?,
Bound::Excluded(&s) => s.checked_add(1).unwrap().try_into()?,
};
self.map_write_impl(offset, end - offset)
}
unsafe fn map_write_impl<'a>(
&'a self,
offset: u64,
size: u64,
) -> Result<BufWriteGuard<'a>, Error> {
if let Some(session) = Weak::upgrade(&self.0.session) {
let ptr = session
.device
.map_buffer(&self.0.buffer, offset, size, MapMode::Write)?;
let buf_write = BufWrite::new(ptr, 0, size as usize);
let guard = BufWriteGuard {
buf_write,
session,
buffer: &self.0.buffer,
offset,
size,
};
Ok(guard)
} else {
Err("session lost".into())
}
}
/// Map a buffer for reading.
///
/// The mapped buffer is represented by a "guard" structure, which will unmap
/// the buffer when it's dropped, and derefs to a plain byte slice.
///
/// The buffer must have been created with `MAP_READ` usage. The caller
/// is also responsible for ensuring that this does not read uninitialized
/// memory.
pub unsafe fn map_read<'a>(
// Discussion: should be &mut? Buffer is Clone, but maybe that should change.
&'a self,
range: impl RangeBounds<usize>,
) -> Result<BufReadGuard<'a>, Error> {
let offset = match range.start_bound() {
Bound::Unbounded => 0,
Bound::Excluded(&s) => s.try_into()?,
Bound::Included(_) => unreachable!(),
};
let end = match range.end_bound() {
Bound::Unbounded => self.size(),
Bound::Excluded(&s) => s.try_into()?,
Bound::Included(&s) => s.checked_add(1).unwrap().try_into()?,
};
self.map_read_impl(offset, end - offset)
}
unsafe fn map_read_impl<'a>(
&'a self,
offset: u64,
size: u64,
) -> Result<BufReadGuard<'a>, Error> {
if let Some(session) = Weak::upgrade(&self.0.session) {
let ptr = session
.device
.map_buffer(&self.0.buffer, offset, size, MapMode::Read)?;
let bytes = std::slice::from_raw_parts(ptr, size as usize);
let guard = BufReadGuard {
bytes,
session,
buffer: &self.0.buffer,
offset,
size,
};
Ok(guard)
} else {
Err("session lost".into())
}
}
/// The size of the buffer.
///
/// This is at least as large as the value provided on creation.
@ -801,3 +945,58 @@ impl<'a, T: Clone + Into<RetainResource>> From<&'a T> for RetainResource {
resource.clone().into()
}
}
impl<'a> Drop for BufWriteGuard<'a> {
fn drop(&mut self) {
unsafe {
let _ = self.session.device.unmap_buffer(
self.buffer,
self.offset,
self.size,
MapMode::Write,
);
}
}
}
impl<'a> std::ops::Deref for BufWriteGuard<'a> {
type Target = BufWrite;
fn deref(&self) -> &Self::Target {
&self.buf_write
}
}
impl<'a> std::ops::DerefMut for BufWriteGuard<'a> {
fn deref_mut(&mut self) -> &mut Self::Target {
&mut self.buf_write
}
}
impl<'a> Drop for BufReadGuard<'a> {
fn drop(&mut self) {
unsafe {
let _ = self.session.device.unmap_buffer(
self.buffer,
self.offset,
self.size,
MapMode::Read,
);
}
}
}
impl<'a> std::ops::Deref for BufReadGuard<'a> {
type Target = [u8];
fn deref(&self) -> &Self::Target {
self.bytes
}
}
impl<'a> BufReadGuard<'a> {
/// Interpret the buffer as a slice of a plain data type.
pub fn cast_slice<T: Pod>(&self) -> &[T] {
bytemuck::cast_slice(self.bytes)
}
}

View file

@ -7,6 +7,7 @@ use bitflags::bitflags;
mod backend;
mod bestfit;
mod bufwrite;
mod hub;
#[macro_use]
@ -18,8 +19,10 @@ pub use crate::mux::{
DescriptorSet, Fence, Instance, Pipeline, QueryPool, Sampler, Semaphore, ShaderCode, Surface,
Swapchain,
};
pub use bufwrite::BufWrite;
pub use hub::{
Buffer, CmdBuf, DescriptorSetBuilder, Image, RetainResource, Session, SubmittedCmdBuf,
BufReadGuard, BufWriteGuard, Buffer, CmdBuf, DescriptorSetBuilder, Image, RetainResource,
Session, SubmittedCmdBuf,
};
// TODO: because these are conditionally included, "cargo fmt" does not
@ -128,6 +131,14 @@ pub enum BindType {
// TODO: Uniform, Sampler, maybe others
}
/// Whether to map a buffer in read or write mode.
pub enum MapMode {
/// Map for reading.
Read,
/// Map for writing.
Write,
}
#[derive(Clone, Debug)]
/// Information about the GPU.
pub struct GpuInfo {

View file

@ -377,6 +377,30 @@ impl crate::backend::Device for MtlDevice {
Ok(())
}
unsafe fn map_buffer(
&self,
buffer: &Self::Buffer,
offset: u64,
size: u64,
mode: MapMode,
) -> Result<*mut u8, Error> {
let contents_ptr = buffer.buffer.contents();
if contents_ptr.is_null() {
return Err("probably trying to map private buffer".into());
}
Ok((contents_ptr as *mut u8).add(offset as usize))
}
unsafe fn unmap_buffer(
&self,
buffer: &Self::Buffer,
_offset: u64,
_size: u64,
_mode: MapMode,
) -> Result<(), Error> {
Ok(())
}
unsafe fn create_semaphore(&self) -> Result<Self::Semaphore, Error> {
Ok(Semaphore)
}

View file

@ -35,6 +35,7 @@ use crate::backend::DescriptorSetBuilder as DescriptorSetBuilderTrait;
use crate::backend::Device as DeviceTrait;
use crate::BackendType;
use crate::BindType;
use crate::MapMode;
use crate::{BufferUsage, Error, GpuInfo, ImageLayout, InstanceFlags};
mux_enum! {
@ -445,31 +446,31 @@ impl Device {
}
}
pub unsafe fn read_buffer(
pub unsafe fn map_buffer(
&self,
buffer: &Buffer,
dst: *mut u8,
offset: u64,
size: u64,
) -> Result<(), Error> {
mode: MapMode,
) -> Result<*mut u8, Error> {
mux_match! { self;
Device::Vk(d) => d.read_buffer(buffer.vk(), dst, offset, size),
Device::Dx12(d) => d.read_buffer(buffer.dx12(), dst, offset, size),
Device::Mtl(d) => d.read_buffer(buffer.mtl(), dst, offset, size),
Device::Vk(d) => d.map_buffer(buffer.vk(), offset, size, mode),
Device::Dx12(d) => d.map_buffer(buffer.dx12(), offset, size, mode),
Device::Mtl(d) => d.map_buffer(buffer.mtl(), offset, size, mode),
}
}
pub unsafe fn write_buffer(
pub unsafe fn unmap_buffer(
&self,
buffer: &Buffer,
contents: *const u8,
offset: u64,
size: u64,
mode: MapMode,
) -> Result<(), Error> {
mux_match! { self;
Device::Vk(d) => d.write_buffer(buffer.vk(), contents, offset, size),
Device::Dx12(d) => d.write_buffer(buffer.dx12(), contents, offset, size),
Device::Mtl(d) => d.write_buffer(buffer.mtl(), contents, offset, size),
Device::Vk(d) => d.unmap_buffer(buffer.vk(), offset, size, mode),
Device::Dx12(d) => d.unmap_buffer(buffer.dx12(), offset, size, mode),
Device::Mtl(d) => d.unmap_buffer(buffer.mtl(), offset, size, mode),
}
}

View file

@ -13,7 +13,7 @@ use smallvec::SmallVec;
use crate::backend::Device as DeviceTrait;
use crate::{
BindType, BufferUsage, Error, GpuInfo, ImageLayout, SamplerParams, SubgroupSize,
BindType, BufferUsage, Error, GpuInfo, ImageLayout, MapMode, SamplerParams, SubgroupSize,
WorkgroupLimits,
};
@ -821,14 +821,13 @@ impl crate::backend::Device for VkDevice {
Ok(())
}
unsafe fn read_buffer(
unsafe fn map_buffer(
&self,
buffer: &Self::Buffer,
dst: *mut u8,
offset: u64,
size: u64,
) -> Result<(), Error> {
let copy_size = size.try_into()?;
_mode: MapMode,
) -> Result<*mut u8, Error> {
let device = &self.device.device;
let buf = device.map_memory(
buffer.buffer_memory,
@ -836,28 +835,17 @@ impl crate::backend::Device for VkDevice {
size,
vk::MemoryMapFlags::empty(),
)?;
std::ptr::copy_nonoverlapping(buf as *const u8, dst, copy_size);
device.unmap_memory(buffer.buffer_memory);
Ok(())
Ok(buf as *mut u8)
}
unsafe fn write_buffer(
unsafe fn unmap_buffer(
&self,
buffer: &Buffer,
contents: *const u8,
offset: u64,
size: u64,
buffer: &Self::Buffer,
_offset: u64,
_size: u64,
_mode: MapMode,
) -> Result<(), Error> {
let copy_size = size.try_into()?;
let device = &self.device.device;
let buf = device.map_memory(
buffer.buffer_memory,
offset,
size,
vk::MemoryMapFlags::empty(),
)?;
std::ptr::copy_nonoverlapping(contents, buf as *mut u8, copy_size);
device.unmap_memory(buffer.buffer_memory);
self.device.device.unmap_memory(buffer.buffer_memory);
Ok(())
}

View file

@ -61,9 +61,8 @@ pub unsafe fn run_clear_test(runner: &mut Runner, config: &Config) -> TestResult
}
total_elapsed += runner.submit(commands);
if i == 0 {
let mut dst: Vec<u32> = Default::default();
out_buf.read(&mut dst);
if let Some(failure) = verify(&dst) {
let dst = out_buf.map_read(..);
if let Some(failure) = verify(dst.cast_slice()) {
result.fail(format!("failure at {}", failure));
}
}

View file

@ -54,9 +54,8 @@ pub unsafe fn run_linkedlist_test(runner: &mut Runner, config: &Config) -> TestR
}
total_elapsed += runner.submit(commands);
if i == 0 {
let mut dst: Vec<u32> = Default::default();
mem_buf.read(&mut dst);
if !verify(&dst) {
let dst = mem_buf.map_read(..);
if !verify(dst.cast_slice()) {
result.fail("incorrect data");
}
}

View file

@ -69,10 +69,17 @@ pub unsafe fn run_prefix_test(
}
*/
let n_elements: u64 = config.size.choose(1 << 12, 1 << 24, 1 << 25);
let data: Vec<u32> = (0..n_elements as u32).collect();
let data_buf = runner
.session
.create_buffer_init(&data, BufferUsage::STORAGE)
.create_buffer_with(
n_elements * 4,
|b| {
for i in 0..n_elements as u32 {
b.push(&i);
}
},
BufferUsage::STORAGE,
)
.unwrap();
let out_buf = runner.buf_down(data_buf.size(), BufferUsage::empty());
let code = PrefixCode::new(runner, variant);
@ -91,9 +98,8 @@ pub unsafe fn run_prefix_test(
}
total_elapsed += runner.submit(commands);
if i == 0 {
let mut dst: Vec<u32> = Default::default();
out_buf.read(&mut dst);
if let Some(failure) = verify(&dst) {
let dst = out_buf.map_read(..);
if let Some(failure) = verify(dst.cast_slice()) {
result.fail(format!("failure at {}", failure));
}
}

View file

@ -47,10 +47,17 @@ pub unsafe fn run_prefix_test(runner: &mut Runner, config: &Config) -> TestResul
// prone to reading and writing past the end of buffers if this is
// not a power of the number of elements processed in a workgroup.
let n_elements: u64 = config.size.choose(1 << 12, 1 << 24, 1 << 24);
let data: Vec<u32> = (0..n_elements as u32).collect();
let data_buf = runner
.session
.create_buffer_init(&data, BufferUsage::STORAGE)
.create_buffer_with(
n_elements * 4,
|b| {
for i in 0..n_elements as u32 {
b.push(&i);
}
},
BufferUsage::STORAGE,
)
.unwrap();
let out_buf = runner.buf_down(data_buf.size(), BufferUsage::empty());
let code = PrefixTreeCode::new(runner);
@ -72,9 +79,8 @@ pub unsafe fn run_prefix_test(runner: &mut Runner, config: &Config) -> TestResul
}
total_elapsed += runner.submit(commands);
if i == 0 {
let mut dst: Vec<u32> = Default::default();
out_buf.read(&mut dst);
if let Some(failure) = verify(&dst) {
let dst = out_buf.map_read(..);
if let Some(failure) = verify(dst.cast_slice()) {
result.fail(format!("failure at {}", failure));
}
}

View file

@ -16,9 +16,12 @@
//! Test runner intended to make it easy to write tests.
use std::ops::RangeBounds;
use bytemuck::Pod;
use piet_gpu_hal::{
BackendType, Buffer, BufferUsage, CmdBuf, Instance, InstanceFlags, QueryPool, Session,
BackendType, BufReadGuard, Buffer, BufferUsage, CmdBuf, Instance, InstanceFlags, QueryPool,
Session,
};
pub struct Runner {
@ -140,4 +143,8 @@ impl BufDown {
pub unsafe fn read(&self, dst: &mut Vec<impl Pod>) {
self.stage_buf.read(dst).unwrap()
}
pub unsafe fn map_read<'a>(&'a self, range: impl RangeBounds<usize>) -> BufReadGuard<'a> {
self.stage_buf.map_read(range).unwrap()
}
}