mirror of
https://github.com/italicsjenga/vello.git
synced 2025-01-25 18:56:35 +11:00
429 lines
13 KiB
Rust
429 lines
13 KiB
Rust
|
//! Vulkan implemenation of HAL trait.
|
||
|
|
||
|
use std::ffi::CString;
|
||
|
use std::sync::Arc;
|
||
|
|
||
|
use ash::version::{DeviceV1_0, EntryV1_0, InstanceV1_0};
|
||
|
use ash::{vk, Device, Entry, Instance};
|
||
|
|
||
|
use crate::Error;
|
||
|
|
||
|
/// A base for allocating resources and dispatching work.
|
||
|
///
|
||
|
/// This is quite similar to "device" in most GPU API's, but I didn't want to overload
|
||
|
/// that term further.
|
||
|
pub struct Base {
|
||
|
/// Retain the dynamic lib.
|
||
|
#[allow(unused)]
|
||
|
entry: Entry,
|
||
|
|
||
|
#[allow(unused)]
|
||
|
instance: Instance,
|
||
|
|
||
|
device: Arc<RawDevice>,
|
||
|
device_mem_props: vk::PhysicalDeviceMemoryProperties,
|
||
|
queue: vk::Queue,
|
||
|
qfi: u32,
|
||
|
}
|
||
|
|
||
|
struct RawDevice {
|
||
|
device: Device,
|
||
|
}
|
||
|
|
||
|
/// A handle to a buffer.
|
||
|
///
|
||
|
/// There is no lifetime tracking at this level; the caller is responsible
|
||
|
/// for destroying the buffer at the appropriate time.
|
||
|
pub struct Buffer {
|
||
|
buffer: vk::Buffer,
|
||
|
buffer_memory: vk::DeviceMemory,
|
||
|
size: u64,
|
||
|
}
|
||
|
|
||
|
pub struct Pipeline {
|
||
|
pipeline: vk::Pipeline,
|
||
|
descriptor_set_layout: vk::DescriptorSetLayout,
|
||
|
pipeline_layout: vk::PipelineLayout,
|
||
|
}
|
||
|
|
||
|
pub struct DescriptorSet {
|
||
|
descriptor_set: vk::DescriptorSet,
|
||
|
}
|
||
|
|
||
|
pub struct CmdBuf {
|
||
|
cmd_buf: vk::CommandBuffer,
|
||
|
device: Arc<RawDevice>,
|
||
|
}
|
||
|
|
||
|
impl Base {
|
||
|
/// Create a new instance.
|
||
|
///
|
||
|
/// There's more to be done to make this suitable for integration with other
|
||
|
/// systems, but for now the goal is to make things simple.
|
||
|
pub fn new() -> Result<Base, Error> {
|
||
|
unsafe {
|
||
|
let app_name = CString::new("VkToy").unwrap();
|
||
|
let entry = Entry::new()?;
|
||
|
let instance = entry.create_instance(
|
||
|
&vk::InstanceCreateInfo::builder().application_info(
|
||
|
&vk::ApplicationInfo::builder()
|
||
|
.application_name(&app_name)
|
||
|
.application_version(0)
|
||
|
.engine_name(&app_name)
|
||
|
.api_version(vk::make_version(1, 0, 0)),
|
||
|
),
|
||
|
None,
|
||
|
)?;
|
||
|
|
||
|
let devices = instance.enumerate_physical_devices()?;
|
||
|
let (pdevice, qfi) =
|
||
|
choose_compute_device(&instance, &devices).ok_or("no suitable device")?;
|
||
|
|
||
|
let device = instance.create_device(
|
||
|
pdevice,
|
||
|
&vk::DeviceCreateInfo::builder().queue_create_infos(&[
|
||
|
vk::DeviceQueueCreateInfo::builder()
|
||
|
.queue_family_index(qfi)
|
||
|
.queue_priorities(&[1.0])
|
||
|
.build(),
|
||
|
]),
|
||
|
None,
|
||
|
)?;
|
||
|
|
||
|
let device_mem_props = instance.get_physical_device_memory_properties(pdevice);
|
||
|
|
||
|
let queue_index = 0;
|
||
|
let queue = device.get_device_queue(qfi, queue_index);
|
||
|
|
||
|
let device = Arc::new(RawDevice { device });
|
||
|
|
||
|
Ok(Base {
|
||
|
entry,
|
||
|
instance,
|
||
|
device,
|
||
|
device_mem_props,
|
||
|
qfi,
|
||
|
queue,
|
||
|
})
|
||
|
}
|
||
|
}
|
||
|
|
||
|
pub fn create_buffer(
|
||
|
&self,
|
||
|
size: u64,
|
||
|
mem_flags: vk::MemoryPropertyFlags,
|
||
|
) -> Result<Buffer, Error> {
|
||
|
unsafe {
|
||
|
let device = &self.device.device;
|
||
|
let buffer = device.create_buffer(
|
||
|
&vk::BufferCreateInfo::builder()
|
||
|
.size(size)
|
||
|
.usage(vk::BufferUsageFlags::STORAGE_BUFFER)
|
||
|
.sharing_mode(vk::SharingMode::EXCLUSIVE),
|
||
|
None,
|
||
|
)?;
|
||
|
let mem_requirements = device.get_buffer_memory_requirements(buffer);
|
||
|
let mem_type = find_memory_type(
|
||
|
mem_requirements.memory_type_bits,
|
||
|
mem_flags,
|
||
|
&self.device_mem_props,
|
||
|
)
|
||
|
.unwrap(); // TODO: proper error
|
||
|
let buffer_memory = device.allocate_memory(
|
||
|
&vk::MemoryAllocateInfo::builder()
|
||
|
.allocation_size(mem_requirements.size)
|
||
|
.memory_type_index(mem_type),
|
||
|
None,
|
||
|
)?;
|
||
|
device.bind_buffer_memory(buffer, buffer_memory, 0)?;
|
||
|
Ok(Buffer {
|
||
|
buffer,
|
||
|
buffer_memory,
|
||
|
size,
|
||
|
})
|
||
|
}
|
||
|
}
|
||
|
|
||
|
/// This creates a pipeline that runs over the buffer.
|
||
|
///
|
||
|
/// The code is included from "../comp.spv", and the descriptor set layout is just some
|
||
|
/// number of buffers.
|
||
|
pub unsafe fn create_simple_compute_pipeline(
|
||
|
&self,
|
||
|
code: &[u8],
|
||
|
n_buffers: u32,
|
||
|
) -> Result<Pipeline, Error> {
|
||
|
let device = &self.device.device;
|
||
|
let descriptor_set_layout = device.create_descriptor_set_layout(
|
||
|
&vk::DescriptorSetLayoutCreateInfo::builder().bindings(&[
|
||
|
vk::DescriptorSetLayoutBinding::builder()
|
||
|
.binding(0)
|
||
|
.descriptor_type(vk::DescriptorType::STORAGE_BUFFER)
|
||
|
.descriptor_count(n_buffers)
|
||
|
.stage_flags(vk::ShaderStageFlags::COMPUTE)
|
||
|
.build(),
|
||
|
]),
|
||
|
None,
|
||
|
)?;
|
||
|
|
||
|
let descriptor_set_layouts = [descriptor_set_layout];
|
||
|
|
||
|
// Create compute pipeline.
|
||
|
let code_u32 = convert_u32_vec(code);
|
||
|
let compute_shader_module = device
|
||
|
.create_shader_module(&vk::ShaderModuleCreateInfo::builder().code(&code_u32), None)?;
|
||
|
let entry_name = CString::new("main").unwrap();
|
||
|
let pipeline_layout = device.create_pipeline_layout(
|
||
|
&vk::PipelineLayoutCreateInfo::builder().set_layouts(&descriptor_set_layouts),
|
||
|
None,
|
||
|
)?;
|
||
|
|
||
|
let pipeline = device.create_compute_pipelines(
|
||
|
vk::PipelineCache::null(),
|
||
|
&[vk::ComputePipelineCreateInfo::builder()
|
||
|
.stage(
|
||
|
vk::PipelineShaderStageCreateInfo::builder()
|
||
|
.stage(vk::ShaderStageFlags::COMPUTE)
|
||
|
.module(compute_shader_module)
|
||
|
.name(&entry_name)
|
||
|
.build(),
|
||
|
)
|
||
|
.layout(pipeline_layout)
|
||
|
.build()],
|
||
|
None,
|
||
|
).map_err(|(_pipeline, err)| err)?[0];
|
||
|
Ok(Pipeline {
|
||
|
pipeline,
|
||
|
pipeline_layout,
|
||
|
descriptor_set_layout,
|
||
|
})
|
||
|
}
|
||
|
|
||
|
pub unsafe fn create_descriptor_set(
|
||
|
&self,
|
||
|
pipeline: &Pipeline,
|
||
|
bufs: &[&Buffer],
|
||
|
) -> Result<DescriptorSet, Error> {
|
||
|
let device = &self.device.device;
|
||
|
let descriptor_pool_sizes = [vk::DescriptorPoolSize::builder()
|
||
|
.ty(vk::DescriptorType::STORAGE_BUFFER)
|
||
|
.descriptor_count(bufs.len() as u32)
|
||
|
.build()];
|
||
|
let descriptor_pool = device.create_descriptor_pool(
|
||
|
&vk::DescriptorPoolCreateInfo::builder()
|
||
|
.pool_sizes(&descriptor_pool_sizes)
|
||
|
.max_sets(1),
|
||
|
None,
|
||
|
)?;
|
||
|
let descriptor_set_layouts = [pipeline.descriptor_set_layout];
|
||
|
let descriptor_sets = device
|
||
|
.allocate_descriptor_sets(
|
||
|
&vk::DescriptorSetAllocateInfo::builder()
|
||
|
.descriptor_pool(descriptor_pool)
|
||
|
.set_layouts(&descriptor_set_layouts),
|
||
|
)
|
||
|
.unwrap();
|
||
|
let buf_infos = bufs
|
||
|
.iter()
|
||
|
.map(|buf| {
|
||
|
vk::DescriptorBufferInfo::builder()
|
||
|
.buffer(buf.buffer)
|
||
|
.offset(0)
|
||
|
.range(vk::WHOLE_SIZE)
|
||
|
.build()
|
||
|
})
|
||
|
.collect::<Vec<_>>();
|
||
|
device.update_descriptor_sets(
|
||
|
&[vk::WriteDescriptorSet::builder()
|
||
|
.dst_set(descriptor_sets[0])
|
||
|
.dst_binding(0)
|
||
|
.descriptor_type(vk::DescriptorType::STORAGE_BUFFER)
|
||
|
.buffer_info(&buf_infos)
|
||
|
.build()],
|
||
|
&[],
|
||
|
);
|
||
|
Ok(DescriptorSet {
|
||
|
descriptor_set: descriptor_sets[0],
|
||
|
})
|
||
|
}
|
||
|
|
||
|
pub fn create_cmd_buf(&self) -> Result<CmdBuf, Error> {
|
||
|
unsafe {
|
||
|
let device = &self.device.device;
|
||
|
let command_pool = device.create_command_pool(
|
||
|
&vk::CommandPoolCreateInfo::builder()
|
||
|
.flags(vk::CommandPoolCreateFlags::empty())
|
||
|
.queue_family_index(self.qfi),
|
||
|
None,
|
||
|
)?;
|
||
|
let cmd_buf = device.allocate_command_buffers(
|
||
|
&vk::CommandBufferAllocateInfo::builder()
|
||
|
.command_pool(command_pool)
|
||
|
.level(vk::CommandBufferLevel::PRIMARY)
|
||
|
.command_buffer_count(1),
|
||
|
)?[0];
|
||
|
Ok(CmdBuf {
|
||
|
cmd_buf,
|
||
|
device: self.device.clone(),
|
||
|
})
|
||
|
}
|
||
|
}
|
||
|
|
||
|
/// Run the command buffer.
|
||
|
///
|
||
|
/// This version simply blocks until it's complete.
|
||
|
pub unsafe fn run_cmd_buf(&self, cmd_buf: &CmdBuf) -> Result<(), Error> {
|
||
|
let device = &self.device.device;
|
||
|
|
||
|
// Run the command buffer.
|
||
|
let fence = device.create_fence(
|
||
|
&vk::FenceCreateInfo::builder().flags(vk::FenceCreateFlags::empty()),
|
||
|
None,
|
||
|
)?;
|
||
|
device.queue_submit(
|
||
|
self.queue,
|
||
|
&[vk::SubmitInfo::builder()
|
||
|
.command_buffers(&[cmd_buf.cmd_buf])
|
||
|
.build()],
|
||
|
fence,
|
||
|
)?;
|
||
|
device.wait_for_fences(&[fence], true, 1_000_000)?;
|
||
|
device.destroy_fence(fence, None);
|
||
|
Ok(())
|
||
|
}
|
||
|
|
||
|
pub unsafe fn read_buffer<T: Sized>(
|
||
|
&self,
|
||
|
buffer: &Buffer,
|
||
|
result: &mut Vec<T>,
|
||
|
) -> Result<(), Error> {
|
||
|
let device = &self.device.device;
|
||
|
let size = buffer.size as usize;
|
||
|
let buf = device.map_memory(
|
||
|
buffer.buffer_memory,
|
||
|
0,
|
||
|
size as u64,
|
||
|
vk::MemoryMapFlags::empty(),
|
||
|
)?;
|
||
|
if size > result.len() {
|
||
|
result.reserve(size - result.len());
|
||
|
}
|
||
|
std::ptr::copy_nonoverlapping(buf as *const T, result.as_mut_ptr(), size);
|
||
|
result.set_len(size);
|
||
|
device.unmap_memory(buffer.buffer_memory);
|
||
|
Ok(())
|
||
|
}
|
||
|
|
||
|
pub unsafe fn write_buffer<T: Sized>(
|
||
|
&self,
|
||
|
buffer: &Buffer,
|
||
|
contents: &[T],
|
||
|
) -> Result<(), Error> {
|
||
|
let device = &self.device.device;
|
||
|
let buf = device.map_memory(
|
||
|
buffer.buffer_memory,
|
||
|
0,
|
||
|
std::mem::size_of_val(contents) as u64,
|
||
|
vk::MemoryMapFlags::empty(),
|
||
|
)?;
|
||
|
std::ptr::copy_nonoverlapping(contents.as_ptr(), buf as *mut T, contents.len());
|
||
|
device.unmap_memory(buffer.buffer_memory);
|
||
|
Ok(())
|
||
|
}
|
||
|
}
|
||
|
|
||
|
impl CmdBuf {
|
||
|
pub unsafe fn begin(&mut self) {
|
||
|
self.device
|
||
|
.device
|
||
|
.begin_command_buffer(
|
||
|
self.cmd_buf,
|
||
|
&vk::CommandBufferBeginInfo::builder()
|
||
|
.flags(vk::CommandBufferUsageFlags::ONE_TIME_SUBMIT),
|
||
|
)
|
||
|
.unwrap();
|
||
|
}
|
||
|
|
||
|
pub unsafe fn finish(&mut self) {
|
||
|
self.device.device.end_command_buffer(self.cmd_buf).unwrap();
|
||
|
}
|
||
|
|
||
|
pub unsafe fn dispatch(&mut self, pipeline: &Pipeline, descriptor_set: &DescriptorSet) {
|
||
|
let device = &self.device.device;
|
||
|
device.cmd_bind_pipeline(
|
||
|
self.cmd_buf,
|
||
|
vk::PipelineBindPoint::COMPUTE,
|
||
|
pipeline.pipeline,
|
||
|
);
|
||
|
device.cmd_bind_descriptor_sets(
|
||
|
self.cmd_buf,
|
||
|
vk::PipelineBindPoint::COMPUTE,
|
||
|
pipeline.pipeline_layout,
|
||
|
0,
|
||
|
&[descriptor_set.descriptor_set],
|
||
|
&[],
|
||
|
);
|
||
|
device.cmd_dispatch(self.cmd_buf, 256, 1, 1);
|
||
|
}
|
||
|
|
||
|
/// Insert a pipeline barrier for all memory accesses.
|
||
|
#[allow(unused)]
|
||
|
pub unsafe fn memory_barrier(&mut self) {
|
||
|
let device = &self.device.device;
|
||
|
device.cmd_pipeline_barrier(
|
||
|
self.cmd_buf,
|
||
|
vk::PipelineStageFlags::ALL_COMMANDS,
|
||
|
vk::PipelineStageFlags::ALL_COMMANDS,
|
||
|
vk::DependencyFlags::empty(),
|
||
|
&[vk::MemoryBarrier::builder()
|
||
|
.src_access_mask(vk::AccessFlags::MEMORY_WRITE)
|
||
|
.dst_access_mask(vk::AccessFlags::MEMORY_READ)
|
||
|
.build()],
|
||
|
&[],
|
||
|
&[],
|
||
|
);
|
||
|
}
|
||
|
}
|
||
|
|
||
|
unsafe fn choose_compute_device(
|
||
|
instance: &Instance,
|
||
|
devices: &[vk::PhysicalDevice],
|
||
|
) -> Option<(vk::PhysicalDevice, u32)> {
|
||
|
for pdevice in devices {
|
||
|
let props = instance.get_physical_device_queue_family_properties(*pdevice);
|
||
|
for (ix, info) in props.iter().enumerate() {
|
||
|
if info.queue_flags.contains(vk::QueueFlags::COMPUTE) {
|
||
|
return Some((*pdevice, ix as u32));
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
None
|
||
|
}
|
||
|
|
||
|
fn find_memory_type(
|
||
|
memory_type_bits: u32,
|
||
|
property_flags: vk::MemoryPropertyFlags,
|
||
|
props: &vk::PhysicalDeviceMemoryProperties,
|
||
|
) -> Option<u32> {
|
||
|
for i in 0..props.memory_type_count {
|
||
|
if (memory_type_bits & (1 << i)) != 0
|
||
|
&& props.memory_types[i as usize]
|
||
|
.property_flags
|
||
|
.contains(property_flags)
|
||
|
{
|
||
|
return Some(i);
|
||
|
}
|
||
|
}
|
||
|
None
|
||
|
}
|
||
|
|
||
|
fn convert_u32_vec(src: &[u8]) -> Vec<u32> {
|
||
|
src.chunks(4)
|
||
|
.map(|chunk| {
|
||
|
let mut buf = [0; 4];
|
||
|
buf.copy_from_slice(chunk);
|
||
|
u32::from_le_bytes(buf)
|
||
|
})
|
||
|
.collect()
|
||
|
}
|