librashader/librashader-runtime-d3d12/src/util.rs

434 lines
14 KiB
Rust
Raw Normal View History

2023-02-06 08:17:23 +11:00
use crate::error;
use crate::error::assume_d3d12_init;
use librashader_reflect::reflect::semantics::BindingStage;
use std::ffi::CStr;
2023-01-25 17:32:10 +11:00
use std::mem::ManuallyDrop;
use std::u64;
2023-02-05 17:54:56 +11:00
use windows::core::{Interface, PCSTR, PCWSTR};
2023-02-06 08:17:23 +11:00
use windows::Win32::Graphics::Direct3D::Dxc::{
DxcValidatorFlags_Default, DxcValidatorFlags_InPlaceEdit, DxcValidatorFlags_ModuleOnly,
DxcValidatorFlags_ValidMask, IDxcBlob, IDxcBlobUtf8, IDxcCompiler, IDxcLibrary, IDxcUtils,
IDxcValidator, DXC_CP, DXC_CP_UTF8,
};
use windows::Win32::Graphics::Direct3D::Fxc::{
D3DCompile, D3DCOMPILE_DEBUG, D3DCOMPILE_SKIP_OPTIMIZATION,
};
2023-01-25 15:15:43 +11:00
use windows::Win32::Graphics::Direct3D::ID3DBlob;
2023-02-06 08:17:23 +11:00
use windows::Win32::Graphics::Direct3D12::{
ID3D12Device, ID3D12GraphicsCommandList, ID3D12Resource, D3D12_FEATURE_DATA_FORMAT_SUPPORT,
D3D12_FEATURE_FORMAT_SUPPORT, D3D12_MEMCPY_DEST, D3D12_PLACED_SUBRESOURCE_FOOTPRINT,
D3D12_RESOURCE_BARRIER, D3D12_RESOURCE_BARRIER_0, D3D12_RESOURCE_BARRIER_ALL_SUBRESOURCES,
D3D12_RESOURCE_BARRIER_FLAG_NONE, D3D12_RESOURCE_BARRIER_TYPE_TRANSITION,
D3D12_RESOURCE_DIMENSION_BUFFER, D3D12_RESOURCE_STATES, D3D12_RESOURCE_TRANSITION_BARRIER,
D3D12_SUBRESOURCE_DATA, D3D12_TEXTURE_COPY_LOCATION, D3D12_TEXTURE_COPY_LOCATION_0,
D3D12_TEXTURE_COPY_TYPE_PLACED_FOOTPRINT, D3D12_TEXTURE_COPY_TYPE_SUBRESOURCE_INDEX,
};
2023-01-25 15:15:43 +11:00
use windows::Win32::Graphics::Dxgi::Common::*;
/// wtf retroarch?
const DXGI_FORMAT_EX_A4R4G4B4_UNORM: DXGI_FORMAT = DXGI_FORMAT(1000);
const fn d3d12_format_fallback_list(format: DXGI_FORMAT) -> Option<&'static [DXGI_FORMAT]> {
match format {
DXGI_FORMAT_R32G32B32A32_FLOAT => Some(&[
DXGI_FORMAT_R32G32B32A32_FLOAT,
DXGI_FORMAT_R16G16B16A16_FLOAT,
DXGI_FORMAT_R32G32B32_FLOAT,
DXGI_FORMAT_R11G11B10_FLOAT,
DXGI_FORMAT_UNKNOWN,
]),
DXGI_FORMAT_R16G16B16A16_FLOAT => Some(&[
DXGI_FORMAT_R16G16B16A16_FLOAT,
DXGI_FORMAT_R32G32B32A32_FLOAT,
DXGI_FORMAT_R32G32B32_FLOAT,
DXGI_FORMAT_R11G11B10_FLOAT,
DXGI_FORMAT_UNKNOWN,
]),
DXGI_FORMAT_R8G8B8A8_UNORM => Some(&[
DXGI_FORMAT_R8G8B8A8_UNORM,
DXGI_FORMAT_B8G8R8A8_UNORM,
DXGI_FORMAT_B8G8R8X8_UNORM,
DXGI_FORMAT_UNKNOWN,
]),
DXGI_FORMAT_R8G8B8A8_UNORM_SRGB => Some(&[
DXGI_FORMAT_R8G8B8A8_UNORM_SRGB,
DXGI_FORMAT_R8G8B8A8_UNORM,
DXGI_FORMAT_B8G8R8A8_UNORM,
DXGI_FORMAT_B8G8R8X8_UNORM,
DXGI_FORMAT_UNKNOWN,
]),
DXGI_FORMAT_B8G8R8A8_UNORM => Some(&[
DXGI_FORMAT_B8G8R8A8_UNORM,
DXGI_FORMAT_R8G8B8A8_UNORM,
DXGI_FORMAT_UNKNOWN,
]),
DXGI_FORMAT_B8G8R8X8_UNORM => Some(&[
DXGI_FORMAT_B8G8R8X8_UNORM,
DXGI_FORMAT_B8G8R8A8_UNORM,
DXGI_FORMAT_R8G8B8A8_UNORM,
DXGI_FORMAT_UNKNOWN,
]),
DXGI_FORMAT_B5G6R5_UNORM => Some(&[
DXGI_FORMAT_B5G6R5_UNORM,
DXGI_FORMAT_B8G8R8X8_UNORM,
DXGI_FORMAT_B8G8R8A8_UNORM,
DXGI_FORMAT_R8G8B8A8_UNORM,
DXGI_FORMAT_UNKNOWN,
]),
DXGI_FORMAT_EX_A4R4G4B4_UNORM | DXGI_FORMAT_B4G4R4A4_UNORM => Some(&[
DXGI_FORMAT_B4G4R4A4_UNORM,
DXGI_FORMAT_B8G8R8A8_UNORM,
DXGI_FORMAT_R8G8B8A8_UNORM,
DXGI_FORMAT_UNKNOWN,
]),
DXGI_FORMAT_A8_UNORM => Some(&[
DXGI_FORMAT_A8_UNORM,
DXGI_FORMAT_R8_UNORM,
DXGI_FORMAT_R8G8_UNORM,
DXGI_FORMAT_R8G8B8A8_UNORM,
DXGI_FORMAT_B8G8R8A8_UNORM,
DXGI_FORMAT_UNKNOWN,
]),
DXGI_FORMAT_R8_UNORM => Some(&[
DXGI_FORMAT_R8_UNORM,
DXGI_FORMAT_A8_UNORM,
DXGI_FORMAT_R8G8_UNORM,
DXGI_FORMAT_R8G8B8A8_UNORM,
DXGI_FORMAT_B8G8R8A8_UNORM,
DXGI_FORMAT_UNKNOWN,
]),
_ => None,
}
}
pub fn d3d12_get_closest_format(
device: &ID3D12Device,
format: DXGI_FORMAT,
format_support: D3D12_FEATURE_DATA_FORMAT_SUPPORT,
) -> DXGI_FORMAT {
let default_list = [format, DXGI_FORMAT_UNKNOWN];
let format_support_list = d3d12_format_fallback_list(format).unwrap_or(&default_list);
for supported in format_support_list {
unsafe {
let mut support = D3D12_FEATURE_DATA_FORMAT_SUPPORT {
Format: format,
..Default::default()
};
if device
.CheckFeatureSupport(
D3D12_FEATURE_FORMAT_SUPPORT,
&mut support as *mut _ as *mut _,
std::mem::size_of::<D3D12_FEATURE_DATA_FORMAT_SUPPORT>() as u32,
)
.is_ok()
&& (support.Support1 & format_support.Support1) == format_support.Support1
&& (support.Support2 & format_support.Support2) == format_support.Support2
{
return *supported;
}
}
}
DXGI_FORMAT_UNKNOWN
}
pub fn fxc_compile_shader(source: &[u8], entry: &[u8], version: &[u8]) -> error::Result<ID3DBlob> {
2023-01-30 18:02:10 +11:00
// todo: compile with dxc
2023-01-25 15:15:43 +11:00
unsafe {
let mut blob = None;
D3DCompile(
source.as_ptr().cast(),
source.len(),
None,
None,
None,
PCSTR(entry.as_ptr()),
PCSTR(version.as_ptr()),
2023-02-06 08:17:23 +11:00
D3DCOMPILE_DEBUG | D3DCOMPILE_SKIP_OPTIMIZATION,
2023-01-30 18:02:10 +11:00
// if cfg!(feature = "debug-shader") {
// D3DCOMPILE_DEBUG | D3DCOMPILE_SKIP_OPTIMIZATION
// } else {
// D3DCOMPILE_OPTIMIZATION_LEVEL3
// },
2023-01-25 15:15:43 +11:00
0,
&mut blob,
None,
)?;
2023-01-31 17:25:45 +11:00
assume_d3d12_init!(blob, "D3DCompile");
Ok(blob)
2023-01-25 15:15:43 +11:00
}
}
2023-01-25 17:32:10 +11:00
2023-02-06 08:17:23 +11:00
pub fn dxc_compile_shader(
library: &IDxcUtils,
compiler: &IDxcCompiler,
source: &String,
profile: BindingStage,
) -> error::Result<IDxcBlob> {
// todo: compile with dxc
// let mut source = source.to_vec();
2023-02-06 08:17:23 +11:00
let include = unsafe { library.CreateDefaultIncludeHandler()? };
2023-02-05 17:54:56 +11:00
let blob = unsafe {
2023-02-05 17:54:56 +11:00
library.CreateBlobFromPinned(
source.as_ptr().cast(),
2023-02-05 17:54:56 +11:00
source.as_bytes().len() as u32,
2023-02-06 08:17:23 +11:00
DXC_CP_UTF8,
)?
};
2023-02-05 17:54:56 +11:00
let profile = if profile == BindingStage::FRAGMENT {
windows::w!("ps_6_0")
} else {
windows::w!("vs_6_0")
};
unsafe {
2023-02-06 08:17:23 +11:00
let result = compiler.Compile(
&blob,
2023-02-05 17:54:56 +11:00
PCWSTR::null(),
windows::w!("main"),
profile,
None,
&[],
2023-02-06 08:17:23 +11:00
&include,
2023-02-05 17:54:56 +11:00
)?;
if let Ok(buf) = result.GetErrorBuffer() {
unsafe {
let buf: IDxcBlobUtf8 = buf.cast().unwrap();
2023-02-06 08:17:23 +11:00
let buf =
std::slice::from_raw_parts(buf.GetBufferPointer().cast(), buf.GetBufferSize());
2023-02-05 17:54:56 +11:00
let str = std::str::from_utf8_unchecked(buf);
if str.len() != 0 {
eprintln!("{}", str);
}
}
}
let result = result.GetResult()?;
Ok(result)
}
}
2023-02-06 08:17:23 +11:00
pub fn dxc_validate_shader(
library: &IDxcUtils,
validator: &IDxcValidator,
source: &[u8],
) -> error::Result<IDxcBlob> {
2023-02-05 17:54:56 +11:00
// todo: compile with dxc
// let mut source = source.to_vec();
2023-02-06 08:17:23 +11:00
let blob =
unsafe { library.CreateBlob(source.as_ptr().cast(), source.len() as u32, DXC_CP(0))? };
2023-02-05 17:54:56 +11:00
unsafe {
let result = validator
2023-02-06 08:17:23 +11:00
.Validate(&blob, DxcValidatorFlags_InPlaceEdit)
.unwrap();
if let Ok(buf) = result.GetErrorBuffer() {
unsafe {
let buf: IDxcBlobUtf8 = buf.cast().unwrap();
2023-02-06 08:17:23 +11:00
let buf =
std::slice::from_raw_parts(buf.GetBufferPointer().cast(), buf.GetBufferSize());
let str = std::str::from_utf8_unchecked(buf);
if str.len() != 0 {
eprintln!("{}", str);
}
}
}
Ok(IDxcBlob::from(blob))
}
}
2023-01-28 17:38:55 +11:00
#[inline(always)]
2023-02-06 08:17:23 +11:00
pub fn d3d12_resource_transition(
cmd: &ID3D12GraphicsCommandList,
2023-01-25 17:32:10 +11:00
resource: &ID3D12Resource,
before: D3D12_RESOURCE_STATES,
2023-01-28 17:38:55 +11:00
after: D3D12_RESOURCE_STATES,
) {
2023-02-06 08:17:23 +11:00
d3d12_resource_transition_subresource(
cmd,
resource,
before,
after,
D3D12_RESOURCE_BARRIER_ALL_SUBRESOURCES,
);
2023-01-28 17:38:55 +11:00
}
#[inline(always)]
2023-02-06 08:17:23 +11:00
pub fn d3d12_resource_transition_subresource(
cmd: &ID3D12GraphicsCommandList,
resource: &ID3D12Resource,
before: D3D12_RESOURCE_STATES,
after: D3D12_RESOURCE_STATES,
subresource: u32,
2023-01-25 17:32:10 +11:00
) {
let barrier = [D3D12_RESOURCE_BARRIER {
Type: D3D12_RESOURCE_BARRIER_TYPE_TRANSITION,
Flags: D3D12_RESOURCE_BARRIER_FLAG_NONE,
Anonymous: D3D12_RESOURCE_BARRIER_0 {
Transition: ManuallyDrop::new(D3D12_RESOURCE_TRANSITION_BARRIER {
pResource: windows::core::ManuallyDrop::new(resource),
2023-01-28 17:38:55 +11:00
Subresource: subresource,
2023-01-25 17:32:10 +11:00
StateBefore: before,
StateAfter: after,
2023-02-06 08:17:23 +11:00
}),
2023-01-25 17:32:10 +11:00
},
}];
2023-02-06 08:17:23 +11:00
unsafe { cmd.ResourceBarrier(&barrier) }
2023-01-25 17:32:10 +11:00
}
2023-02-06 08:17:23 +11:00
pub fn d3d12_update_subresources(
cmd: &ID3D12GraphicsCommandList,
destination_resource: &ID3D12Resource,
intermediate_resource: &ID3D12Resource,
intermediate_offset: u64,
first_subresouce: u32,
num_subresources: u32,
source: &[D3D12_SUBRESOURCE_DATA],
2023-01-25 17:32:10 +11:00
) -> error::Result<u64> {
// let allocation_size = std::mem::size_of::<D3D12_PLACED_SUBRESOURCE_FOOTPRINT>()
// + std::mem::size_of::<u32>()
// + std::mem::size_of::<u64>() * num_subresources;
unsafe {
let destination_desc = destination_resource.GetDesc();
let mut device: Option<ID3D12Device> = None;
destination_resource.GetDevice(&mut device)?;
assume_d3d12_init!(device, "GetDevice");
2023-02-06 08:17:23 +11:00
let mut layouts =
vec![D3D12_PLACED_SUBRESOURCE_FOOTPRINT::default(); num_subresources as usize];
2023-01-25 17:32:10 +11:00
let mut num_rows = vec![0; num_subresources as usize];
2023-02-06 08:17:23 +11:00
let mut row_sizes_in_bytes = vec![0; num_subresources as usize];
2023-01-25 17:32:10 +11:00
let mut required_size = 0;
// texture upload
unsafe {
device.GetCopyableFootprints(
&destination_desc,
first_subresouce,
num_subresources,
intermediate_offset,
Some(layouts.as_mut_ptr()),
Some(num_rows.as_mut_ptr()),
Some(row_sizes_in_bytes.as_mut_ptr()),
Some(&mut required_size),
);
}
update_subresources(
cmd,
destination_resource,
intermediate_resource,
first_subresouce,
num_subresources,
required_size,
&layouts,
&num_rows,
&row_sizes_in_bytes,
source,
)
}
}
#[allow(clippy::too_many_arguments)]
fn update_subresources(
cmd: &ID3D12GraphicsCommandList,
destination_resource: &ID3D12Resource,
intermediate_resource: &ID3D12Resource,
first_subresouce: u32,
num_subresources: u32,
required_size: u64,
layouts: &[D3D12_PLACED_SUBRESOURCE_FOOTPRINT],
num_rows: &[u32],
row_sizes_in_bytes: &[u64],
source_data: &[D3D12_SUBRESOURCE_DATA],
) -> error::Result<u64> {
// ToDo: implement validation as in the original function
unsafe {
let mut data = std::ptr::null_mut();
intermediate_resource.Map(0, None, Some(&mut data))?;
for i in 0..num_subresources as usize {
let dest_data = D3D12_MEMCPY_DEST {
2023-02-06 08:17:23 +11:00
pData: data.offset(layouts[i].Offset as isize) as *mut std::ffi::c_void,
2023-01-25 17:32:10 +11:00
RowPitch: layouts[i].Footprint.RowPitch as usize,
2023-02-06 08:17:23 +11:00
SlicePitch: ((layouts[i].Footprint.RowPitch) * num_rows[i]) as usize,
2023-01-25 17:32:10 +11:00
};
memcpy_subresource(
&dest_data,
&source_data[i],
row_sizes_in_bytes[i],
num_rows[i],
layouts[i].Footprint.Depth,
);
}
intermediate_resource.Unmap(0, None);
}
unsafe {
let destination_desc = destination_resource.GetDesc();
if destination_desc.Dimension == D3D12_RESOURCE_DIMENSION_BUFFER {
cmd.CopyBufferRegion(
destination_resource,
0,
intermediate_resource,
layouts[0].Offset,
layouts[0].Footprint.Width as u64,
);
} else {
for i in 0..num_subresources as usize {
let dest_location = D3D12_TEXTURE_COPY_LOCATION {
pResource: windows::core::ManuallyDrop::new(destination_resource),
Type: D3D12_TEXTURE_COPY_TYPE_SUBRESOURCE_INDEX,
Anonymous: D3D12_TEXTURE_COPY_LOCATION_0 {
2023-02-06 08:17:23 +11:00
SubresourceIndex: i as u32 + first_subresouce,
2023-01-25 17:32:10 +11:00
},
};
let source_location = D3D12_TEXTURE_COPY_LOCATION {
pResource: windows::core::ManuallyDrop::new(intermediate_resource),
Type: D3D12_TEXTURE_COPY_TYPE_PLACED_FOOTPRINT,
Anonymous: D3D12_TEXTURE_COPY_LOCATION_0 {
2023-02-06 08:17:23 +11:00
PlacedFootprint: layouts[i],
2023-01-25 17:32:10 +11:00
},
};
2023-02-06 08:17:23 +11:00
cmd.CopyTextureRegion(&dest_location, 0, 0, 0, &source_location, None);
2023-01-25 17:32:10 +11:00
}
}
Ok(required_size)
}
}
// this function should not leak to the public API, so
// there is no point in using struct wrappers
unsafe fn memcpy_subresource(
dest: &D3D12_MEMCPY_DEST,
src: &D3D12_SUBRESOURCE_DATA,
row_sizes_in_bytes: u64,
num_rows: u32,
num_slices: u32,
) {
2023-02-06 08:17:23 +11:00
for z in 0..num_slices as usize {
let dest_slice = dest.pData.add(dest.SlicePitch * z);
2023-02-01 09:50:47 +11:00
let src_slice = src.pData.offset(src.SlicePitch * z as isize);
2023-01-25 17:32:10 +11:00
for y in 0..num_rows as usize {
std::ptr::copy_nonoverlapping(
2023-02-01 09:50:47 +11:00
src_slice.offset(src.RowPitch * y as isize),
dest_slice.add(dest.RowPitch * y),
2023-01-25 17:32:10 +11:00
row_sizes_in_bytes as usize,
);
}
}
}