mirror of
https://github.com/italicsjenga/vello.git
synced 2025-01-10 12:41:30 +11:00
commit
125f6f9d63
11
Cargo.lock
generated
11
Cargo.lock
generated
|
@ -851,6 +851,8 @@ dependencies = [
|
||||||
"ash-window",
|
"ash-window",
|
||||||
"bitflags",
|
"bitflags",
|
||||||
"raw-window-handle",
|
"raw-window-handle",
|
||||||
|
"winapi 0.3.9",
|
||||||
|
"wio",
|
||||||
]
|
]
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
|
@ -1364,6 +1366,15 @@ dependencies = [
|
||||||
"x11-dl",
|
"x11-dl",
|
||||||
]
|
]
|
||||||
|
|
||||||
|
[[package]]
|
||||||
|
name = "wio"
|
||||||
|
version = "0.2.2"
|
||||||
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||||
|
checksum = "5d129932f4644ac2396cb456385cbf9e63b5b30c6e8dc4820bdca4eb082037a5"
|
||||||
|
dependencies = [
|
||||||
|
"winapi 0.3.9",
|
||||||
|
]
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "ws2_32-sys"
|
name = "ws2_32-sys"
|
||||||
version = "0.2.1"
|
version = "0.2.1"
|
||||||
|
|
|
@ -40,6 +40,8 @@ The piet-gpu project is dual-licensed under both [Apache 2.0](LICENSE-APACHE) an
|
||||||
|
|
||||||
In addition, the shaders are provided under the terms of the [Unlicense]. The intent is for this research to be used in as broad a context as possible.
|
In addition, the shaders are provided under the terms of the [Unlicense]. The intent is for this research to be used in as broad a context as possible.
|
||||||
|
|
||||||
|
The dx12 backend was adapted from piet-dx12 by Brian Merchant.
|
||||||
|
|
||||||
Contributions are welcome by pull request. The [Rust code of conduct] applies.
|
Contributions are welcome by pull request. The [Rust code of conduct] applies.
|
||||||
|
|
||||||
[piet-metal]: https://github.com/linebender/piet-metal
|
[piet-metal]: https://github.com/linebender/piet-metal
|
||||||
|
|
|
@ -11,3 +11,11 @@ ash = "0.31"
|
||||||
ash-window = "0.5"
|
ash-window = "0.5"
|
||||||
raw-window-handle = "0.3"
|
raw-window-handle = "0.3"
|
||||||
bitflags = "1.2.1"
|
bitflags = "1.2.1"
|
||||||
|
|
||||||
|
winapi = { version = "0.3.9", features = [
|
||||||
|
'd3d12', 'd3d12sdklayers', 'd3dcommon', 'd3dcompiler', 'dxgi',
|
||||||
|
'dxgi1_2', 'dxgi1_3', 'dxgi1_4', 'dxgidebug', 'dxgiformat', 'dxgitype',
|
||||||
|
'libloaderapi', 'shellscalingapi', 'synchapi', 'winbase', 'windef',
|
||||||
|
'winerror', 'winuser'
|
||||||
|
] }
|
||||||
|
wio = "0.2.2"
|
||||||
|
|
101
piet-gpu-hal/examples/dx12_toy.rs
Normal file
101
piet-gpu-hal/examples/dx12_toy.rs
Normal file
|
@ -0,0 +1,101 @@
|
||||||
|
//! An example to exercise the dx12 backend, while it's being developed.
|
||||||
|
//! This will probably go away when it's fully implemented and we can
|
||||||
|
//! just use the hub.
|
||||||
|
|
||||||
|
use piet_gpu_hal::{dx12, BufferUsage, CmdBuf, Device, Error};
|
||||||
|
|
||||||
|
const SHADER_CODE: &str = r#"RWByteAddressBuffer _53 : register(u0, space0);
|
||||||
|
|
||||||
|
RWTexture2D<float4> textureOut : register(u1);
|
||||||
|
|
||||||
|
static uint3 gl_GlobalInvocationID;
|
||||||
|
struct SPIRV_Cross_Input
|
||||||
|
{
|
||||||
|
uint3 gl_GlobalInvocationID : SV_DispatchThreadID;
|
||||||
|
};
|
||||||
|
|
||||||
|
uint collatz_iterations(inout uint n)
|
||||||
|
{
|
||||||
|
uint i = 0u;
|
||||||
|
while (n != 1u)
|
||||||
|
{
|
||||||
|
if ((n & 1u) == 0u)
|
||||||
|
{
|
||||||
|
n /= 2u;
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
n = (3u * n) + 1u;
|
||||||
|
}
|
||||||
|
i++;
|
||||||
|
}
|
||||||
|
return i;
|
||||||
|
}
|
||||||
|
|
||||||
|
void comp_main()
|
||||||
|
{
|
||||||
|
uint index = gl_GlobalInvocationID.x;
|
||||||
|
uint param = _53.Load(index * 4 + 0);
|
||||||
|
uint _61 = collatz_iterations(param);
|
||||||
|
_53.Store(index * 4 + 0, _61);
|
||||||
|
textureOut[uint2(index, 0)] = float4(1.0, 0.0, 0.0, 1.0);
|
||||||
|
}
|
||||||
|
|
||||||
|
[numthreads(256, 1, 1)]
|
||||||
|
void main(SPIRV_Cross_Input stage_input)
|
||||||
|
{
|
||||||
|
gl_GlobalInvocationID = stage_input.gl_GlobalInvocationID;
|
||||||
|
comp_main();
|
||||||
|
}
|
||||||
|
"#;
|
||||||
|
|
||||||
|
fn toy() -> Result<(), Error> {
|
||||||
|
let instance = dx12::Dx12Instance::new()?;
|
||||||
|
let device = instance.device()?;
|
||||||
|
let buf = device.create_buffer(
|
||||||
|
1024,
|
||||||
|
BufferUsage::MAP_READ
|
||||||
|
| BufferUsage::MAP_WRITE
|
||||||
|
| BufferUsage::COPY_SRC
|
||||||
|
| BufferUsage::COPY_DST,
|
||||||
|
)?;
|
||||||
|
let dev_buf = device.create_buffer(
|
||||||
|
1024,
|
||||||
|
BufferUsage::STORAGE | BufferUsage::COPY_SRC | BufferUsage::COPY_DST,
|
||||||
|
)?;
|
||||||
|
let img_readback_buf =
|
||||||
|
device.create_buffer(1024, BufferUsage::MAP_READ | BufferUsage::COPY_DST)?;
|
||||||
|
let data: Vec<u32> = (1..257).collect();
|
||||||
|
let query_pool = device.create_query_pool(2)?;
|
||||||
|
unsafe {
|
||||||
|
let img = device.create_image2d(256, 1)?;
|
||||||
|
device.write_buffer(&buf, data.as_ptr() as *const u8, 0, 1024)?;
|
||||||
|
let pipeline = device.create_simple_compute_pipeline(SHADER_CODE, 1, 1)?;
|
||||||
|
let ds = device.create_descriptor_set(&pipeline, &[&dev_buf], &[&img])?;
|
||||||
|
let mut cmd_buf = device.create_cmd_buf()?;
|
||||||
|
let fence = device.create_fence(false)?;
|
||||||
|
cmd_buf.begin();
|
||||||
|
cmd_buf.copy_buffer(&buf, &dev_buf);
|
||||||
|
cmd_buf.memory_barrier();
|
||||||
|
cmd_buf.write_timestamp(&query_pool, 0);
|
||||||
|
cmd_buf.dispatch(&pipeline, &ds, (1, 1, 1));
|
||||||
|
cmd_buf.write_timestamp(&query_pool, 1);
|
||||||
|
cmd_buf.memory_barrier();
|
||||||
|
cmd_buf.copy_buffer(&dev_buf, &buf);
|
||||||
|
cmd_buf.copy_image_to_buffer(&img, &img_readback_buf);
|
||||||
|
cmd_buf.finish_timestamps(&query_pool);
|
||||||
|
cmd_buf.host_barrier();
|
||||||
|
cmd_buf.finish();
|
||||||
|
device.run_cmd_bufs(&[&cmd_buf], &[], &[], Some(&fence))?;
|
||||||
|
device.wait_and_reset(&[fence])?;
|
||||||
|
let mut readback: Vec<u32> = vec![0u32; 256];
|
||||||
|
device.read_buffer(&buf, readback.as_mut_ptr() as *mut u8, 0, 1024)?;
|
||||||
|
println!("{:?}", readback);
|
||||||
|
println!("{:?}", device.fetch_query_pool(&query_pool));
|
||||||
|
}
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
fn main() {
|
||||||
|
toy().unwrap();
|
||||||
|
}
|
632
piet-gpu-hal/src/dx12.rs
Normal file
632
piet-gpu-hal/src/dx12.rs
Normal file
|
@ -0,0 +1,632 @@
|
||||||
|
//! DX12 implemenation of HAL trait.
|
||||||
|
|
||||||
|
mod error;
|
||||||
|
mod wrappers;
|
||||||
|
|
||||||
|
use std::{cell::Cell, convert::TryInto, mem, ptr};
|
||||||
|
|
||||||
|
use winapi::shared::dxgi1_3;
|
||||||
|
use winapi::shared::minwindef::TRUE;
|
||||||
|
use winapi::um::d3d12;
|
||||||
|
|
||||||
|
use crate::{BufferUsage, Error, ImageLayout};
|
||||||
|
|
||||||
|
use self::wrappers::{
|
||||||
|
CommandAllocator, CommandQueue, Device, Factory4, GraphicsCommandList, Resource, ShaderByteCode,
|
||||||
|
};
|
||||||
|
|
||||||
|
pub struct Dx12Instance {
|
||||||
|
factory: Factory4,
|
||||||
|
}
|
||||||
|
|
||||||
|
pub struct Dx12Device {
|
||||||
|
device: Device,
|
||||||
|
command_allocator: CommandAllocator,
|
||||||
|
command_queue: CommandQueue,
|
||||||
|
ts_freq: u64,
|
||||||
|
memory_arch: MemoryArchitecture,
|
||||||
|
}
|
||||||
|
|
||||||
|
#[derive(Clone)]
|
||||||
|
pub struct Buffer {
|
||||||
|
resource: Resource,
|
||||||
|
size: u64,
|
||||||
|
}
|
||||||
|
|
||||||
|
#[derive(Clone)]
|
||||||
|
pub struct Image {
|
||||||
|
resource: Resource,
|
||||||
|
size: (u32, u32),
|
||||||
|
}
|
||||||
|
|
||||||
|
pub struct CmdBuf(GraphicsCommandList);
|
||||||
|
|
||||||
|
pub struct Pipeline {
|
||||||
|
pipeline_state: wrappers::PipelineState,
|
||||||
|
root_signature: wrappers::RootSignature,
|
||||||
|
}
|
||||||
|
|
||||||
|
// Right now, each descriptor set gets its own heap, but we'll move
|
||||||
|
// to a more sophisticated allocation scheme, probably using the
|
||||||
|
// gpu-descriptor crate.
|
||||||
|
pub struct DescriptorSet(wrappers::DescriptorHeap);
|
||||||
|
|
||||||
|
pub struct QueryPool {
|
||||||
|
heap: wrappers::QueryHeap,
|
||||||
|
buf: Buffer,
|
||||||
|
n_queries: u32,
|
||||||
|
}
|
||||||
|
|
||||||
|
pub struct Fence {
|
||||||
|
fence: wrappers::Fence,
|
||||||
|
event: wrappers::Event,
|
||||||
|
// This could as well be an atomic, if we needed to cross threads.
|
||||||
|
val: Cell<u64>,
|
||||||
|
}
|
||||||
|
|
||||||
|
pub struct Semaphore;
|
||||||
|
|
||||||
|
#[derive(Default)]
|
||||||
|
pub struct PipelineBuilder {
|
||||||
|
ranges: Vec<d3d12::D3D12_DESCRIPTOR_RANGE>,
|
||||||
|
n_uav: u32,
|
||||||
|
// TODO: add counters for other resource types
|
||||||
|
}
|
||||||
|
|
||||||
|
// TODO
|
||||||
|
#[derive(Default)]
|
||||||
|
pub struct DescriptorSetBuilder {
|
||||||
|
buffers: Vec<Buffer>,
|
||||||
|
images: Vec<Image>,
|
||||||
|
}
|
||||||
|
|
||||||
|
#[derive(PartialEq, Eq)]
|
||||||
|
enum MemoryArchitecture {
|
||||||
|
/// Integrated graphics
|
||||||
|
CacheCoherentUMA,
|
||||||
|
/// Unified memory with no cache coherence (does this happen?)
|
||||||
|
UMA,
|
||||||
|
/// Discrete graphics
|
||||||
|
NUMA,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl Dx12Instance {
|
||||||
|
/// Create a new instance.
|
||||||
|
///
|
||||||
|
/// TODO: take a raw window handle.
|
||||||
|
/// TODO: can probably be a trait.
|
||||||
|
pub fn new() -> Result<Dx12Instance, Error> {
|
||||||
|
unsafe {
|
||||||
|
#[cfg(debug_assertions)]
|
||||||
|
if let Err(e) = wrappers::enable_debug_layer() {
|
||||||
|
// Maybe a better logging solution?
|
||||||
|
println!("{}", e);
|
||||||
|
}
|
||||||
|
|
||||||
|
#[cfg(debug_assertions)]
|
||||||
|
let factory_flags = dxgi1_3::DXGI_CREATE_FACTORY_DEBUG;
|
||||||
|
|
||||||
|
#[cfg(not(debug_assertions))]
|
||||||
|
let factory_flags: u32 = 0;
|
||||||
|
|
||||||
|
let factory = Factory4::create(factory_flags)?;
|
||||||
|
Ok(Dx12Instance { factory })
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Get a device suitable for compute workloads.
|
||||||
|
///
|
||||||
|
/// TODO: handle window.
|
||||||
|
/// TODO: probably can also be trait'ified.
|
||||||
|
pub fn device(&self) -> Result<Dx12Device, Error> {
|
||||||
|
unsafe {
|
||||||
|
let device = Device::create_device(&self.factory)?;
|
||||||
|
let list_type = d3d12::D3D12_COMMAND_LIST_TYPE_DIRECT;
|
||||||
|
let command_queue = device.create_command_queue(
|
||||||
|
list_type,
|
||||||
|
0,
|
||||||
|
d3d12::D3D12_COMMAND_QUEUE_FLAG_NONE,
|
||||||
|
0,
|
||||||
|
)?;
|
||||||
|
let command_allocator = device.create_command_allocator(list_type)?;
|
||||||
|
let ts_freq = command_queue.get_timestamp_frequency()?;
|
||||||
|
let features_architecture = device.get_features_architecture()?;
|
||||||
|
let uma = features_architecture.UMA == TRUE;
|
||||||
|
let cc_uma = features_architecture.CacheCoherentUMA == TRUE;
|
||||||
|
let memory_arch = match (uma, cc_uma) {
|
||||||
|
(true, true) => MemoryArchitecture::CacheCoherentUMA,
|
||||||
|
(true, false) => MemoryArchitecture::UMA,
|
||||||
|
_ => MemoryArchitecture::NUMA,
|
||||||
|
};
|
||||||
|
Ok(Dx12Device {
|
||||||
|
device,
|
||||||
|
command_queue,
|
||||||
|
command_allocator,
|
||||||
|
ts_freq,
|
||||||
|
memory_arch,
|
||||||
|
})
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl crate::Device for Dx12Device {
|
||||||
|
type Buffer = Buffer;
|
||||||
|
|
||||||
|
type Image = Image;
|
||||||
|
|
||||||
|
type Pipeline = Pipeline;
|
||||||
|
|
||||||
|
type DescriptorSet = DescriptorSet;
|
||||||
|
|
||||||
|
type QueryPool = QueryPool;
|
||||||
|
|
||||||
|
type CmdBuf = CmdBuf;
|
||||||
|
|
||||||
|
type Fence = Fence;
|
||||||
|
|
||||||
|
type Semaphore = Semaphore;
|
||||||
|
|
||||||
|
type PipelineBuilder = PipelineBuilder;
|
||||||
|
|
||||||
|
type DescriptorSetBuilder = DescriptorSetBuilder;
|
||||||
|
|
||||||
|
type Sampler = ();
|
||||||
|
|
||||||
|
// Currently this is HLSL source, but we'll probably change it to IR.
|
||||||
|
type ShaderSource = str;
|
||||||
|
|
||||||
|
fn create_buffer(&self, size: u64, usage: BufferUsage) -> Result<Self::Buffer, Error> {
|
||||||
|
// TODO: consider supporting BufferUsage::QUERY_RESOLVE here rather than
|
||||||
|
// having a separate function.
|
||||||
|
unsafe {
|
||||||
|
let page_property = self.memory_arch.page_property(usage);
|
||||||
|
let memory_pool = self.memory_arch.memory_pool(usage);
|
||||||
|
//TODO: consider flag D3D12_HEAP_FLAG_ALLOW_SHADER_ATOMICS?
|
||||||
|
let flags = d3d12::D3D12_RESOURCE_FLAG_ALLOW_UNORDERED_ACCESS;
|
||||||
|
let resource = self.device.create_buffer(
|
||||||
|
size.try_into()?,
|
||||||
|
d3d12::D3D12_HEAP_TYPE_CUSTOM,
|
||||||
|
page_property,
|
||||||
|
memory_pool,
|
||||||
|
d3d12::D3D12_RESOURCE_STATE_COMMON,
|
||||||
|
flags,
|
||||||
|
)?;
|
||||||
|
Ok(Buffer { resource, size })
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn destroy_buffer(&self, buffer: &Self::Buffer) -> Result<(), Error> {
|
||||||
|
buffer.resource.destroy();
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn create_image2d(&self, width: u32, height: u32) -> Result<Self::Image, Error> {
|
||||||
|
let format = winapi::shared::dxgiformat::DXGI_FORMAT_R8G8B8A8_UNORM;
|
||||||
|
let resource = self
|
||||||
|
.device
|
||||||
|
.create_texture2d_buffer(width.into(), height, format, true)?;
|
||||||
|
let size = (width, height);
|
||||||
|
Ok(Image { resource, size })
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn destroy_image(&self, image: &Self::Image) -> Result<(), Error> {
|
||||||
|
image.resource.destroy();
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
fn create_cmd_buf(&self) -> Result<Self::CmdBuf, Error> {
|
||||||
|
let list_type = d3d12::D3D12_COMMAND_LIST_TYPE_DIRECT;
|
||||||
|
let node_mask = 0;
|
||||||
|
unsafe {
|
||||||
|
let cmd_buf = self.device.create_graphics_command_list(
|
||||||
|
list_type,
|
||||||
|
&self.command_allocator,
|
||||||
|
None,
|
||||||
|
node_mask,
|
||||||
|
)?;
|
||||||
|
Ok(CmdBuf(cmd_buf))
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
fn create_query_pool(&self, n_queries: u32) -> Result<Self::QueryPool, Error> {
|
||||||
|
unsafe {
|
||||||
|
let heap = self
|
||||||
|
.device
|
||||||
|
.create_query_heap(d3d12::D3D12_QUERY_HEAP_TYPE_TIMESTAMP, n_queries)?;
|
||||||
|
let buf = self.create_readback_buffer((n_queries * 8) as u64)?;
|
||||||
|
Ok(QueryPool {
|
||||||
|
heap,
|
||||||
|
buf,
|
||||||
|
n_queries,
|
||||||
|
})
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn fetch_query_pool(&self, pool: &Self::QueryPool) -> Result<Vec<f64>, Error> {
|
||||||
|
let mut buf = vec![0u64; pool.n_queries as usize];
|
||||||
|
self.read_buffer(
|
||||||
|
&pool.buf,
|
||||||
|
buf.as_mut_ptr() as *mut u8,
|
||||||
|
0,
|
||||||
|
mem::size_of_val(buf.as_slice()) as u64,
|
||||||
|
)?;
|
||||||
|
let ts0 = buf[0];
|
||||||
|
let tsp = (self.ts_freq as f64).recip();
|
||||||
|
let result = buf[1..]
|
||||||
|
.iter()
|
||||||
|
.map(|ts| ts.wrapping_sub(ts0) as f64 * tsp)
|
||||||
|
.collect();
|
||||||
|
Ok(result)
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn run_cmd_bufs(
|
||||||
|
&self,
|
||||||
|
cmd_bufs: &[&Self::CmdBuf],
|
||||||
|
wait_semaphores: &[Self::Semaphore],
|
||||||
|
signal_semaphores: &[Self::Semaphore],
|
||||||
|
fence: Option<&Self::Fence>,
|
||||||
|
) -> Result<(), Error> {
|
||||||
|
// TODO: handle semaphores
|
||||||
|
// SmallVec?
|
||||||
|
let lists = cmd_bufs
|
||||||
|
.iter()
|
||||||
|
.map(|c| c.0.as_raw_command_list())
|
||||||
|
.collect::<Vec<_>>();
|
||||||
|
self.command_queue.execute_command_lists(&lists);
|
||||||
|
if let Some(fence) = fence {
|
||||||
|
let val = fence.val.get() + 1;
|
||||||
|
fence.val.set(val);
|
||||||
|
self.command_queue.signal(&fence.fence, val)?;
|
||||||
|
fence.fence.set_event_on_completion(&fence.event, val)?;
|
||||||
|
}
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn read_buffer(
|
||||||
|
&self,
|
||||||
|
buffer: &Self::Buffer,
|
||||||
|
dst: *mut u8,
|
||||||
|
offset: u64,
|
||||||
|
size: u64,
|
||||||
|
) -> Result<(), Error> {
|
||||||
|
buffer
|
||||||
|
.resource
|
||||||
|
.read_resource(dst, offset as usize, size as usize)?;
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn write_buffer(
|
||||||
|
&self,
|
||||||
|
buffer: &Self::Buffer,
|
||||||
|
contents: *const u8,
|
||||||
|
offset: u64,
|
||||||
|
size: u64,
|
||||||
|
) -> Result<(), Error> {
|
||||||
|
buffer
|
||||||
|
.resource
|
||||||
|
.write_resource(contents, offset as usize, size as usize)?;
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn create_semaphore(&self) -> Result<Self::Semaphore, Error> {
|
||||||
|
todo!()
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn create_fence(&self, signaled: bool) -> Result<Self::Fence, Error> {
|
||||||
|
let fence = self.device.create_fence(0)?;
|
||||||
|
let event = wrappers::Event::create(false, signaled)?;
|
||||||
|
let val = Cell::new(0);
|
||||||
|
Ok(Fence { fence, event, val })
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn wait_and_reset(&self, fences: &[Self::Fence]) -> Result<(), Error> {
|
||||||
|
for fence in fences {
|
||||||
|
// TODO: probably handle errors here.
|
||||||
|
let _status = fence.event.wait(winapi::um::winbase::INFINITE);
|
||||||
|
}
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn get_fence_status(&self, fence: Self::Fence) -> Result<bool, Error> {
|
||||||
|
let fence_val = fence.fence.get_value();
|
||||||
|
Ok(fence_val == fence.val.get())
|
||||||
|
}
|
||||||
|
|
||||||
|
fn query_gpu_info(&self) -> crate::GpuInfo {
|
||||||
|
todo!()
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn pipeline_builder(&self) -> Self::PipelineBuilder {
|
||||||
|
PipelineBuilder::default()
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn descriptor_set_builder(&self) -> Self::DescriptorSetBuilder {
|
||||||
|
DescriptorSetBuilder::default()
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn create_sampler(&self, params: crate::SamplerParams) -> Result<Self::Sampler, Error> {
|
||||||
|
todo!()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl Dx12Device {
|
||||||
|
fn create_readback_buffer(&self, size: u64) -> Result<Buffer, Error> {
|
||||||
|
unsafe {
|
||||||
|
let resource = self.device.create_buffer(
|
||||||
|
size.try_into()?,
|
||||||
|
d3d12::D3D12_HEAP_TYPE_READBACK,
|
||||||
|
d3d12::D3D12_CPU_PAGE_PROPERTY_UNKNOWN,
|
||||||
|
d3d12::D3D12_MEMORY_POOL_UNKNOWN,
|
||||||
|
d3d12::D3D12_RESOURCE_STATE_COPY_DEST,
|
||||||
|
d3d12::D3D12_RESOURCE_FLAG_NONE,
|
||||||
|
)?;
|
||||||
|
Ok(Buffer { resource, size })
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl crate::CmdBuf<Dx12Device> for CmdBuf {
|
||||||
|
unsafe fn begin(&mut self) {}
|
||||||
|
|
||||||
|
unsafe fn finish(&mut self) {
|
||||||
|
let _ = self.0.close();
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn dispatch(
|
||||||
|
&mut self,
|
||||||
|
pipeline: &Pipeline,
|
||||||
|
descriptor_set: &DescriptorSet,
|
||||||
|
size: (u32, u32, u32),
|
||||||
|
) {
|
||||||
|
self.0.set_pipeline_state(&pipeline.pipeline_state);
|
||||||
|
self.0
|
||||||
|
.set_compute_pipeline_root_signature(&pipeline.root_signature);
|
||||||
|
self.0.set_descriptor_heaps(&[&descriptor_set.0]);
|
||||||
|
self.0.set_compute_root_descriptor_table(
|
||||||
|
0,
|
||||||
|
descriptor_set.0.get_gpu_descriptor_handle_at_offset(0),
|
||||||
|
);
|
||||||
|
self.0.dispatch(size.0, size.1, size.2);
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn memory_barrier(&mut self) {
|
||||||
|
// See comments in CommandBuffer::pipeline_barrier in gfx-hal dx12 backend.
|
||||||
|
// The "proper" way to do this would be to name the actual buffers participating
|
||||||
|
// in the barrier. But it seems like this is a reasonable way to create a
|
||||||
|
// global barrier.
|
||||||
|
let bar = wrappers::create_uav_resource_barrier(ptr::null_mut());
|
||||||
|
self.0.resource_barrier(&[bar]);
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn host_barrier(&mut self) {
|
||||||
|
// My understanding is that a host barrier is not needed, but am still hunting
|
||||||
|
// down an authoritative source for that. Among other things, the docs for
|
||||||
|
// Map suggest that it does the needed visibility operation.
|
||||||
|
//
|
||||||
|
// https://docs.microsoft.com/en-us/windows/win32/api/d3d12/nf-d3d12-id3d12resource-map
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn image_barrier(
|
||||||
|
&mut self,
|
||||||
|
image: &Image,
|
||||||
|
src_layout: crate::ImageLayout,
|
||||||
|
dst_layout: crate::ImageLayout,
|
||||||
|
) {
|
||||||
|
let src_state = resource_state_for_image_layout(src_layout);
|
||||||
|
let dst_state = resource_state_for_image_layout(dst_layout);
|
||||||
|
if src_state != dst_state {
|
||||||
|
let bar = wrappers::create_transition_resource_barrier(
|
||||||
|
image.resource.get_mut(),
|
||||||
|
src_state,
|
||||||
|
dst_state,
|
||||||
|
);
|
||||||
|
self.0.resource_barrier(&[bar]);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn clear_buffer(&self, buffer: &Buffer, size: Option<u64>) {
|
||||||
|
// Open question: do we call ClearUnorderedAccessViewUint or dispatch a
|
||||||
|
// compute shader? Either way we will need descriptors here.
|
||||||
|
todo!()
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn copy_buffer(&self, src: &Buffer, dst: &Buffer) {
|
||||||
|
// TODO: consider using copy_resource here (if sizes match)
|
||||||
|
let size = src.size.min(dst.size);
|
||||||
|
self.0.copy_buffer(&dst.resource, 0, &src.resource, 0, size);
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn copy_image_to_buffer(&self, src: &Image, dst: &Buffer) {
|
||||||
|
self.0
|
||||||
|
.copy_texture_to_buffer(&src.resource, &dst.resource, src.size.0, src.size.1);
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn copy_buffer_to_image(&self, src: &Buffer, dst: &Image) {
|
||||||
|
self.0
|
||||||
|
.copy_buffer_to_texture(&src.resource, &dst.resource, dst.size.0, dst.size.1);
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn blit_image(&self, src: &Image, dst: &Image) {
|
||||||
|
self.0.copy_resource(&src.resource, &dst.resource);
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn reset_query_pool(&mut self, pool: &QueryPool) {
|
||||||
|
todo!()
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn write_timestamp(&mut self, pool: &QueryPool, query: u32) {
|
||||||
|
self.0.end_timing_query(&pool.heap, query);
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn finish_timestamps(&mut self, pool: &QueryPool) {
|
||||||
|
self.0
|
||||||
|
.resolve_timing_query_data(&pool.heap, 0, pool.n_queries, &pool.buf.resource, 0);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl crate::PipelineBuilder<Dx12Device> for PipelineBuilder {
|
||||||
|
fn add_buffers(&mut self, n_buffers: u32) {
|
||||||
|
if n_buffers != 0 {
|
||||||
|
self.ranges.push(d3d12::D3D12_DESCRIPTOR_RANGE {
|
||||||
|
RangeType: d3d12::D3D12_DESCRIPTOR_RANGE_TYPE_UAV,
|
||||||
|
NumDescriptors: n_buffers,
|
||||||
|
BaseShaderRegister: self.n_uav,
|
||||||
|
RegisterSpace: 0,
|
||||||
|
OffsetInDescriptorsFromTableStart: d3d12::D3D12_DESCRIPTOR_RANGE_OFFSET_APPEND,
|
||||||
|
});
|
||||||
|
self.n_uav += n_buffers;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
fn add_images(&mut self, n_images: u32) {
|
||||||
|
// These are UAV images, so the descriptor type is the same as buffers.
|
||||||
|
self.add_buffers(n_images)
|
||||||
|
}
|
||||||
|
|
||||||
|
fn add_textures(&mut self, max_textures: u32) {
|
||||||
|
todo!()
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn create_compute_pipeline(
|
||||||
|
self,
|
||||||
|
device: &Dx12Device,
|
||||||
|
code: &str,
|
||||||
|
) -> Result<Pipeline, Error> {
|
||||||
|
#[cfg(debug_assertions)]
|
||||||
|
let flags = winapi::um::d3dcompiler::D3DCOMPILE_DEBUG
|
||||||
|
| winapi::um::d3dcompiler::D3DCOMPILE_SKIP_OPTIMIZATION;
|
||||||
|
#[cfg(not(debug_assertions))]
|
||||||
|
let flags = 0;
|
||||||
|
let shader_blob = ShaderByteCode::compile(code, "cs_5_1", "main", flags)?;
|
||||||
|
let shader = ShaderByteCode::from_blob(shader_blob);
|
||||||
|
let mut root_parameter = d3d12::D3D12_ROOT_PARAMETER {
|
||||||
|
ParameterType: d3d12::D3D12_ROOT_PARAMETER_TYPE_DESCRIPTOR_TABLE,
|
||||||
|
ShaderVisibility: d3d12::D3D12_SHADER_VISIBILITY_ALL,
|
||||||
|
..mem::zeroed()
|
||||||
|
};
|
||||||
|
*root_parameter.u.DescriptorTable_mut() = d3d12::D3D12_ROOT_DESCRIPTOR_TABLE {
|
||||||
|
NumDescriptorRanges: self.ranges.len().try_into()?,
|
||||||
|
pDescriptorRanges: self.ranges.as_ptr(),
|
||||||
|
};
|
||||||
|
let root_signature_desc = d3d12::D3D12_ROOT_SIGNATURE_DESC {
|
||||||
|
NumParameters: 1,
|
||||||
|
pParameters: &root_parameter,
|
||||||
|
NumStaticSamplers: 0,
|
||||||
|
pStaticSamplers: ptr::null(),
|
||||||
|
Flags: d3d12::D3D12_ROOT_SIGNATURE_FLAG_NONE,
|
||||||
|
};
|
||||||
|
let root_signature_blob = wrappers::RootSignature::serialize_description(
|
||||||
|
&root_signature_desc,
|
||||||
|
d3d12::D3D_ROOT_SIGNATURE_VERSION_1,
|
||||||
|
)?;
|
||||||
|
let root_signature = device
|
||||||
|
.device
|
||||||
|
.create_root_signature(0, root_signature_blob)?;
|
||||||
|
let desc = d3d12::D3D12_COMPUTE_PIPELINE_STATE_DESC {
|
||||||
|
pRootSignature: root_signature.0.as_raw(),
|
||||||
|
CS: shader.bytecode,
|
||||||
|
NodeMask: 0,
|
||||||
|
CachedPSO: d3d12::D3D12_CACHED_PIPELINE_STATE {
|
||||||
|
pCachedBlob: ptr::null(),
|
||||||
|
CachedBlobSizeInBytes: 0,
|
||||||
|
},
|
||||||
|
Flags: d3d12::D3D12_PIPELINE_STATE_FLAG_NONE,
|
||||||
|
};
|
||||||
|
let pipeline_state = device.device.create_compute_pipeline_state(&desc)?;
|
||||||
|
Ok(Pipeline {
|
||||||
|
pipeline_state,
|
||||||
|
root_signature,
|
||||||
|
})
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl crate::DescriptorSetBuilder<Dx12Device> for DescriptorSetBuilder {
|
||||||
|
fn add_buffers(&mut self, buffers: &[&Buffer]) {
|
||||||
|
// Note: we could get rid of the clone here (which is an AddRef)
|
||||||
|
// and store a raw pointer, as it's a safety precondition that
|
||||||
|
// the resources are kept alive til build.
|
||||||
|
self.buffers.extend(buffers.iter().copied().cloned());
|
||||||
|
}
|
||||||
|
|
||||||
|
fn add_images(&mut self, images: &[&Image]) {
|
||||||
|
self.images.extend(images.iter().copied().cloned());
|
||||||
|
}
|
||||||
|
|
||||||
|
fn add_textures(&mut self, images: &[&Image]) {
|
||||||
|
todo!()
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn build(
|
||||||
|
self,
|
||||||
|
device: &Dx12Device,
|
||||||
|
_pipeline: &Pipeline,
|
||||||
|
) -> Result<DescriptorSet, Error> {
|
||||||
|
let n_descriptors = self.buffers.len() + self.images.len();
|
||||||
|
let heap_desc = d3d12::D3D12_DESCRIPTOR_HEAP_DESC {
|
||||||
|
Type: d3d12::D3D12_DESCRIPTOR_HEAP_TYPE_CBV_SRV_UAV,
|
||||||
|
NumDescriptors: n_descriptors.try_into()?,
|
||||||
|
Flags: d3d12::D3D12_DESCRIPTOR_HEAP_FLAG_SHADER_VISIBLE,
|
||||||
|
NodeMask: 0,
|
||||||
|
};
|
||||||
|
let heap = device.device.create_descriptor_heap(&heap_desc)?;
|
||||||
|
let mut ix = 0;
|
||||||
|
for buffer in self.buffers {
|
||||||
|
device
|
||||||
|
.device
|
||||||
|
.create_byte_addressed_buffer_unordered_access_view(
|
||||||
|
&buffer.resource,
|
||||||
|
heap.get_cpu_descriptor_handle_at_offset(ix),
|
||||||
|
0,
|
||||||
|
(buffer.size / 4).try_into()?,
|
||||||
|
);
|
||||||
|
ix += 1;
|
||||||
|
}
|
||||||
|
for image in self.images {
|
||||||
|
device.device.create_unordered_access_view(
|
||||||
|
&image.resource,
|
||||||
|
heap.get_cpu_descriptor_handle_at_offset(ix),
|
||||||
|
);
|
||||||
|
ix += 1;
|
||||||
|
}
|
||||||
|
Ok(DescriptorSet(heap))
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl MemoryArchitecture {
|
||||||
|
// See https://msdn.microsoft.com/de-de/library/windows/desktop/dn788678(v=vs.85).aspx
|
||||||
|
|
||||||
|
fn page_property(&self, usage: BufferUsage) -> d3d12::D3D12_CPU_PAGE_PROPERTY {
|
||||||
|
if usage.contains(BufferUsage::MAP_READ) {
|
||||||
|
d3d12::D3D12_CPU_PAGE_PROPERTY_WRITE_BACK
|
||||||
|
} else if usage.contains(BufferUsage::MAP_WRITE) {
|
||||||
|
if *self == MemoryArchitecture::CacheCoherentUMA {
|
||||||
|
d3d12::D3D12_CPU_PAGE_PROPERTY_WRITE_BACK
|
||||||
|
} else {
|
||||||
|
d3d12::D3D12_CPU_PAGE_PROPERTY_WRITE_COMBINE
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
d3d12::D3D12_CPU_PAGE_PROPERTY_NOT_AVAILABLE
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
fn memory_pool(&self, usage: BufferUsage) -> d3d12::D3D12_MEMORY_POOL {
|
||||||
|
if *self == MemoryArchitecture::NUMA
|
||||||
|
&& !usage.intersects(BufferUsage::MAP_READ | BufferUsage::MAP_WRITE)
|
||||||
|
{
|
||||||
|
d3d12::D3D12_MEMORY_POOL_L1
|
||||||
|
} else {
|
||||||
|
d3d12::D3D12_MEMORY_POOL_L0
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
fn resource_state_for_image_layout(layout: ImageLayout) -> d3d12::D3D12_RESOURCE_STATES {
|
||||||
|
match layout {
|
||||||
|
ImageLayout::Undefined => d3d12::D3D12_RESOURCE_STATE_COMMON,
|
||||||
|
ImageLayout::Present => d3d12::D3D12_RESOURCE_STATE_PRESENT,
|
||||||
|
ImageLayout::BlitSrc => d3d12::D3D12_RESOURCE_STATE_COPY_SOURCE,
|
||||||
|
ImageLayout::BlitDst => d3d12::D3D12_RESOURCE_STATE_COPY_DEST,
|
||||||
|
ImageLayout::General => d3d12::D3D12_RESOURCE_STATE_COMMON,
|
||||||
|
ImageLayout::ShaderRead => d3d12::D3D12_RESOURCE_STATE_PIXEL_SHADER_RESOURCE,
|
||||||
|
}
|
||||||
|
}
|
84
piet-gpu-hal/src/dx12/error.rs
Normal file
84
piet-gpu-hal/src/dx12/error.rs
Normal file
|
@ -0,0 +1,84 @@
|
||||||
|
// Copyright © 2019 piet-gpu developers.
|
||||||
|
//
|
||||||
|
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
|
||||||
|
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
|
||||||
|
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
|
||||||
|
// option. This file may not be copied, modified, or distributed
|
||||||
|
// except according to those terms.
|
||||||
|
|
||||||
|
//! This is a Windows-specific error mechanism (adapted from piet-dx12),
|
||||||
|
//! but we should adapt it to be more general.
|
||||||
|
|
||||||
|
use winapi::shared::winerror;
|
||||||
|
|
||||||
|
pub enum Error {
|
||||||
|
Hresult(winerror::HRESULT),
|
||||||
|
ExplainedHr(&'static str, winerror::HRESULT),
|
||||||
|
}
|
||||||
|
|
||||||
|
impl std::fmt::Debug for Error {
|
||||||
|
fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
|
||||||
|
match self {
|
||||||
|
Error::Hresult(hr) => write!(f, "hresult {:x}", hr),
|
||||||
|
Error::ExplainedHr(exp, hr) => {
|
||||||
|
write!(f, "{}: ", exp)?;
|
||||||
|
write_hr(f, *hr)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl std::fmt::Display for Error {
|
||||||
|
fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
|
||||||
|
std::fmt::Debug::fmt(self, f)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl std::error::Error for Error {}
|
||||||
|
|
||||||
|
/// Strings for errors we're likely to see.
|
||||||
|
///
|
||||||
|
/// See https://docs.microsoft.com/en-us/windows/win32/direct3ddxgi/dxgi-error
|
||||||
|
fn err_str_for_hr(hr: winerror::HRESULT) -> Option<&'static str> {
|
||||||
|
Some(match hr as u32 {
|
||||||
|
0x80070057 => "E_INVALIDARG",
|
||||||
|
0x887a0001 => "DXGI_ERROR_INVALID_CALL",
|
||||||
|
0x887a0002 => "DXGI_ERROR_NOT_FOUND",
|
||||||
|
0x887a0004 => "DXGI_ERROR_UNSUPPORTED",
|
||||||
|
0x887a0005 => "DXGI_ERROR_DEVICE_REMOVED",
|
||||||
|
0x887a0006 => "DXGI_ERROR_DEVICE_HUNG",
|
||||||
|
_ => return None,
|
||||||
|
})
|
||||||
|
}
|
||||||
|
|
||||||
|
fn write_hr(f: &mut std::fmt::Formatter, hr: winerror::HRESULT) -> std::fmt::Result {
|
||||||
|
if let Some(err_str) = err_str_for_hr(hr) {
|
||||||
|
write!(f, "{:x} ({})", hr, err_str)
|
||||||
|
} else {
|
||||||
|
write!(f, "{:x}", hr)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pub type D3DResult<T> = (T, winerror::HRESULT);
|
||||||
|
|
||||||
|
pub fn error_if_failed_else_value<T>(result: D3DResult<T>) -> Result<T, Error> {
|
||||||
|
let (result_value, hresult) = result;
|
||||||
|
|
||||||
|
if winerror::SUCCEEDED(hresult) {
|
||||||
|
Ok(result_value)
|
||||||
|
} else {
|
||||||
|
Err(Error::Hresult(hresult))
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn error_if_failed_else_unit(hresult: winerror::HRESULT) -> Result<(), Error> {
|
||||||
|
error_if_failed_else_value(((), hresult))
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn explain_error(hresult: winerror::HRESULT, explanation: &'static str) -> Result<(), Error> {
|
||||||
|
if winerror::SUCCEEDED(hresult) {
|
||||||
|
Ok(())
|
||||||
|
} else {
|
||||||
|
Err(Error::ExplainedHr(explanation, hresult))
|
||||||
|
}
|
||||||
|
}
|
1574
piet-gpu-hal/src/dx12/wrappers.rs
Normal file
1574
piet-gpu-hal/src/dx12/wrappers.rs
Normal file
File diff suppressed because it is too large
Load diff
|
@ -6,12 +6,14 @@ use bitflags::bitflags;
|
||||||
|
|
||||||
pub mod hub;
|
pub mod hub;
|
||||||
|
|
||||||
|
#[cfg(target_os = "windows")]
|
||||||
|
pub mod dx12;
|
||||||
pub mod vulkan;
|
pub mod vulkan;
|
||||||
|
|
||||||
/// This isn't great but is expedient.
|
/// This isn't great but is expedient.
|
||||||
pub type Error = Box<dyn std::error::Error>;
|
pub type Error = Box<dyn std::error::Error>;
|
||||||
|
|
||||||
#[derive(Copy, Clone, Debug)]
|
#[derive(Copy, Clone, Debug, PartialEq, Eq)]
|
||||||
pub enum ImageLayout {
|
pub enum ImageLayout {
|
||||||
Undefined,
|
Undefined,
|
||||||
Present,
|
Present,
|
||||||
|
@ -87,6 +89,7 @@ pub trait Device: Sized {
|
||||||
type PipelineBuilder: PipelineBuilder<Self>;
|
type PipelineBuilder: PipelineBuilder<Self>;
|
||||||
type DescriptorSetBuilder: DescriptorSetBuilder<Self>;
|
type DescriptorSetBuilder: DescriptorSetBuilder<Self>;
|
||||||
type Sampler;
|
type Sampler;
|
||||||
|
type ShaderSource: ?Sized;
|
||||||
|
|
||||||
/// Query the GPU info.
|
/// Query the GPU info.
|
||||||
///
|
///
|
||||||
|
@ -133,7 +136,7 @@ pub trait Device: Sized {
|
||||||
/// is subsumed by the builder.
|
/// is subsumed by the builder.
|
||||||
unsafe fn create_simple_compute_pipeline(
|
unsafe fn create_simple_compute_pipeline(
|
||||||
&self,
|
&self,
|
||||||
code: &[u8],
|
code: &Self::ShaderSource,
|
||||||
n_buffers: u32,
|
n_buffers: u32,
|
||||||
n_images: u32,
|
n_images: u32,
|
||||||
) -> Result<Self::Pipeline, Error> {
|
) -> Result<Self::Pipeline, Error> {
|
||||||
|
@ -278,6 +281,10 @@ pub trait CmdBuf<D: Device> {
|
||||||
unsafe fn reset_query_pool(&mut self, pool: &D::QueryPool);
|
unsafe fn reset_query_pool(&mut self, pool: &D::QueryPool);
|
||||||
|
|
||||||
unsafe fn write_timestamp(&mut self, pool: &D::QueryPool, query: u32);
|
unsafe fn write_timestamp(&mut self, pool: &D::QueryPool, query: u32);
|
||||||
|
|
||||||
|
/// Prepare the timestamps for reading. This isn't required on Vulkan but
|
||||||
|
/// is required on (at least) DX12.
|
||||||
|
unsafe fn finish_timestamps(&mut self, pool: &D::QueryPool) {}
|
||||||
}
|
}
|
||||||
|
|
||||||
/// A builder for pipelines with more complex layouts.
|
/// A builder for pipelines with more complex layouts.
|
||||||
|
@ -288,7 +295,11 @@ pub trait PipelineBuilder<D: Device> {
|
||||||
fn add_images(&mut self, n_images: u32);
|
fn add_images(&mut self, n_images: u32);
|
||||||
/// Add a binding with a variable-size array of textures.
|
/// Add a binding with a variable-size array of textures.
|
||||||
fn add_textures(&mut self, max_textures: u32);
|
fn add_textures(&mut self, max_textures: u32);
|
||||||
unsafe fn create_compute_pipeline(self, device: &D, code: &[u8]) -> Result<D::Pipeline, Error>;
|
unsafe fn create_compute_pipeline(
|
||||||
|
self,
|
||||||
|
device: &D,
|
||||||
|
code: &D::ShaderSource,
|
||||||
|
) -> Result<D::Pipeline, Error>;
|
||||||
}
|
}
|
||||||
|
|
||||||
/// A builder for descriptor sets with more complex layouts.
|
/// A builder for descriptor sets with more complex layouts.
|
||||||
|
|
|
@ -465,6 +465,7 @@ impl crate::Device for VkDevice {
|
||||||
type PipelineBuilder = PipelineBuilder;
|
type PipelineBuilder = PipelineBuilder;
|
||||||
type DescriptorSetBuilder = DescriptorSetBuilder;
|
type DescriptorSetBuilder = DescriptorSetBuilder;
|
||||||
type Sampler = vk::Sampler;
|
type Sampler = vk::Sampler;
|
||||||
|
type ShaderSource = [u8];
|
||||||
|
|
||||||
fn query_gpu_info(&self) -> GpuInfo {
|
fn query_gpu_info(&self) -> GpuInfo {
|
||||||
self.gpu_info.clone()
|
self.gpu_info.clone()
|
||||||
|
|
Loading…
Reference in a new issue