librashader/librashader-runtime-d3d12/src/util.rs

394 lines
13 KiB
Rust
Raw Normal View History

2023-02-06 08:17:23 +11:00
use crate::error;
use crate::error::assume_d3d12_init;
2023-02-06 10:34:30 +11:00
2023-01-25 17:32:10 +11:00
use std::mem::ManuallyDrop;
use std::u64;
use widestring::{u16cstr, U16CStr};
2024-08-02 14:53:13 +10:00
use windows::core::{Interface, PCWSTR};
2023-02-06 08:17:23 +11:00
use windows::Win32::Graphics::Direct3D::Dxc::{
2023-02-06 14:24:58 +11:00
DxcValidatorFlags_InPlaceEdit, IDxcBlob, IDxcCompiler, IDxcUtils, IDxcValidator, DXC_CP,
DXC_CP_UTF8,
};
2023-07-20 15:13:22 +10:00
use crate::filter_chain::FrameResiduals;
2023-02-06 08:17:23 +11:00
use windows::Win32::Graphics::Direct3D12::{
ID3D12Device, ID3D12GraphicsCommandList, ID3D12Resource, D3D12_FEATURE_DATA_FORMAT_SUPPORT,
D3D12_FEATURE_FORMAT_SUPPORT, D3D12_MEMCPY_DEST, D3D12_PLACED_SUBRESOURCE_FOOTPRINT,
D3D12_RESOURCE_BARRIER, D3D12_RESOURCE_BARRIER_0, D3D12_RESOURCE_BARRIER_ALL_SUBRESOURCES,
D3D12_RESOURCE_BARRIER_FLAG_NONE, D3D12_RESOURCE_BARRIER_TYPE_TRANSITION,
D3D12_RESOURCE_DIMENSION_BUFFER, D3D12_RESOURCE_STATES, D3D12_RESOURCE_TRANSITION_BARRIER,
D3D12_SUBRESOURCE_DATA, D3D12_TEXTURE_COPY_LOCATION, D3D12_TEXTURE_COPY_LOCATION_0,
D3D12_TEXTURE_COPY_TYPE_PLACED_FOOTPRINT, D3D12_TEXTURE_COPY_TYPE_SUBRESOURCE_INDEX,
};
2023-01-25 15:15:43 +11:00
use windows::Win32::Graphics::Dxgi::Common::*;
/// Format value `1000`, which is treated as an alias of `DXGI_FORMAT_B4G4R4A4_UNORM`
/// when looking up fallback formats in `d3d12_format_fallback_list`.
///
/// NOTE(review): presumably mirrors an extended, non-DXGI format value that RetroArch
/// passes in — confirm against the frontend.
const DXGI_FORMAT_EX_A4R4G4B4_UNORM: DXGI_FORMAT = DXGI_FORMAT(1000);
const fn d3d12_format_fallback_list(format: DXGI_FORMAT) -> Option<&'static [DXGI_FORMAT]> {
match format {
DXGI_FORMAT_R32G32B32A32_FLOAT => Some(&[
DXGI_FORMAT_R32G32B32A32_FLOAT,
DXGI_FORMAT_R16G16B16A16_FLOAT,
DXGI_FORMAT_R32G32B32_FLOAT,
DXGI_FORMAT_R11G11B10_FLOAT,
DXGI_FORMAT_UNKNOWN,
]),
DXGI_FORMAT_R16G16B16A16_FLOAT => Some(&[
DXGI_FORMAT_R16G16B16A16_FLOAT,
DXGI_FORMAT_R32G32B32A32_FLOAT,
DXGI_FORMAT_R32G32B32_FLOAT,
DXGI_FORMAT_R11G11B10_FLOAT,
DXGI_FORMAT_UNKNOWN,
]),
DXGI_FORMAT_R8G8B8A8_UNORM => Some(&[
DXGI_FORMAT_R8G8B8A8_UNORM,
DXGI_FORMAT_B8G8R8A8_UNORM,
DXGI_FORMAT_B8G8R8X8_UNORM,
DXGI_FORMAT_UNKNOWN,
]),
DXGI_FORMAT_R8G8B8A8_UNORM_SRGB => Some(&[
DXGI_FORMAT_R8G8B8A8_UNORM_SRGB,
DXGI_FORMAT_R8G8B8A8_UNORM,
DXGI_FORMAT_B8G8R8A8_UNORM,
DXGI_FORMAT_B8G8R8X8_UNORM,
DXGI_FORMAT_UNKNOWN,
]),
DXGI_FORMAT_B8G8R8A8_UNORM => Some(&[
DXGI_FORMAT_B8G8R8A8_UNORM,
DXGI_FORMAT_R8G8B8A8_UNORM,
DXGI_FORMAT_UNKNOWN,
]),
DXGI_FORMAT_B8G8R8X8_UNORM => Some(&[
DXGI_FORMAT_B8G8R8X8_UNORM,
DXGI_FORMAT_B8G8R8A8_UNORM,
DXGI_FORMAT_R8G8B8A8_UNORM,
DXGI_FORMAT_UNKNOWN,
]),
DXGI_FORMAT_B5G6R5_UNORM => Some(&[
DXGI_FORMAT_B5G6R5_UNORM,
DXGI_FORMAT_B8G8R8X8_UNORM,
DXGI_FORMAT_B8G8R8A8_UNORM,
DXGI_FORMAT_R8G8B8A8_UNORM,
DXGI_FORMAT_UNKNOWN,
]),
DXGI_FORMAT_EX_A4R4G4B4_UNORM | DXGI_FORMAT_B4G4R4A4_UNORM => Some(&[
DXGI_FORMAT_B4G4R4A4_UNORM,
DXGI_FORMAT_B8G8R8A8_UNORM,
DXGI_FORMAT_R8G8B8A8_UNORM,
DXGI_FORMAT_UNKNOWN,
]),
DXGI_FORMAT_A8_UNORM => Some(&[
DXGI_FORMAT_A8_UNORM,
DXGI_FORMAT_R8_UNORM,
DXGI_FORMAT_R8G8_UNORM,
DXGI_FORMAT_R8G8B8A8_UNORM,
DXGI_FORMAT_B8G8R8A8_UNORM,
DXGI_FORMAT_UNKNOWN,
]),
DXGI_FORMAT_R8_UNORM => Some(&[
DXGI_FORMAT_R8_UNORM,
DXGI_FORMAT_A8_UNORM,
DXGI_FORMAT_R8G8_UNORM,
DXGI_FORMAT_R8G8B8A8_UNORM,
DXGI_FORMAT_B8G8R8A8_UNORM,
DXGI_FORMAT_UNKNOWN,
]),
_ => None,
}
}
pub fn d3d12_get_closest_format(
device: &ID3D12Device,
format_support: D3D12_FEATURE_DATA_FORMAT_SUPPORT,
) -> DXGI_FORMAT {
let format = format_support.Format;
2023-01-25 15:15:43 +11:00
let default_list = [format, DXGI_FORMAT_UNKNOWN];
let format_support_list = d3d12_format_fallback_list(format).unwrap_or(&default_list);
for supported in format_support_list {
unsafe {
let mut support = D3D12_FEATURE_DATA_FORMAT_SUPPORT {
Format: *supported,
2023-01-25 15:15:43 +11:00
..Default::default()
};
if device
.CheckFeatureSupport(
D3D12_FEATURE_FORMAT_SUPPORT,
&mut support as *mut _ as *mut _,
std::mem::size_of::<D3D12_FEATURE_DATA_FORMAT_SUPPORT>() as u32,
)
.is_ok()
&& (support.Support1 & format_support.Support1) == format_support.Support1
&& (support.Support2 & format_support.Support2) == format_support.Support2
{
return *supported;
}
}
}
DXGI_FORMAT_UNKNOWN
}
2023-02-06 08:17:23 +11:00
pub fn dxc_compile_shader(
library: &IDxcUtils,
compiler: &IDxcCompiler,
source: impl AsRef<[u8]>,
profile: &U16CStr,
2023-02-06 08:17:23 +11:00
) -> error::Result<IDxcBlob> {
let include = unsafe { library.CreateDefaultIncludeHandler()? };
let source = source.as_ref();
let blob = unsafe {
library.CreateBlobFromPinned(source.as_ptr().cast(), source.len() as u32, DXC_CP_UTF8)?
};
2023-02-05 17:54:56 +11:00
unsafe {
2023-02-06 08:17:23 +11:00
let result = compiler.Compile(
&blob,
2023-02-05 17:54:56 +11:00
PCWSTR::null(),
2023-02-06 13:49:55 +11:00
PCWSTR(u16cstr!("main").as_ptr()),
PCWSTR(profile.as_ptr()),
Some(&[PCWSTR(u16cstr!("-HV 2016").as_ptr())]),
2023-02-05 17:54:56 +11:00
&[],
2023-02-06 08:17:23 +11:00
&include,
2023-02-05 17:54:56 +11:00
)?;
let result = result.GetResult()?;
{
2024-02-20 04:39:44 +11:00
let blob = std::slice::from_raw_parts_mut(
result.GetBufferPointer() as *mut u8,
result.GetBufferSize(),
);
mach_siegbert_vogt_dxcsa::sign_in_place(blob);
}
2023-02-05 17:54:56 +11:00
Ok(result)
}
}
2023-02-06 08:17:23 +11:00
pub fn dxc_validate_shader(
library: &IDxcUtils,
validator: &IDxcValidator,
source: &[u8],
) -> error::Result<IDxcBlob> {
let blob =
unsafe { library.CreateBlob(source.as_ptr().cast(), source.len() as u32, DXC_CP(0))? };
2023-02-05 17:54:56 +11:00
unsafe {
2023-02-06 12:05:22 +11:00
let _result = validator.Validate(&blob, DxcValidatorFlags_InPlaceEdit)?;
2023-04-23 15:13:31 +10:00
Ok(blob.cast()?)
}
}
#[must_use = "Resource Barrier must be disposed"]
2023-02-07 13:56:24 +11:00
pub fn d3d12_get_resource_transition_subresource(
2023-02-06 08:17:23 +11:00
resource: &ID3D12Resource,
before: D3D12_RESOURCE_STATES,
after: D3D12_RESOURCE_STATES,
subresource: u32,
2023-02-07 13:56:24 +11:00
) -> D3D12_RESOURCE_BARRIER {
2023-02-07 18:19:37 +11:00
D3D12_RESOURCE_BARRIER {
2023-01-25 17:32:10 +11:00
Type: D3D12_RESOURCE_BARRIER_TYPE_TRANSITION,
Flags: D3D12_RESOURCE_BARRIER_FLAG_NONE,
Anonymous: D3D12_RESOURCE_BARRIER_0 {
Transition: ManuallyDrop::new(D3D12_RESOURCE_TRANSITION_BARRIER {
2023-04-23 15:13:31 +10:00
pResource: ManuallyDrop::new(Some(resource.clone())),
2023-01-28 17:38:55 +11:00
Subresource: subresource,
2023-01-25 17:32:10 +11:00
StateBefore: before,
StateAfter: after,
2023-02-06 08:17:23 +11:00
}),
2023-01-25 17:32:10 +11:00
},
2023-02-07 18:19:37 +11:00
}
2023-02-07 13:56:24 +11:00
}
/// Records a transition of every subresource of `resource` from `before` to `after`
/// on `cmd`, and returns the recorded barrier so the caller can dispose of it.
#[must_use = "Resource Barrier must be disposed"]
#[inline(always)]
pub fn d3d12_resource_transition(
    cmd: &ID3D12GraphicsCommandList,
    resource: &ID3D12Resource,
    before: D3D12_RESOURCE_STATES,
    after: D3D12_RESOURCE_STATES,
) -> [D3D12_RESOURCE_BARRIER; 1] {
    let every_subresource = D3D12_RESOURCE_BARRIER_ALL_SUBRESOURCES;
    d3d12_resource_transition_subresource(cmd, resource, before, after, every_subresource)
}
#[must_use = "Resource Barrier must be disposed"]
2023-02-07 13:56:24 +11:00
#[inline(always)]
pub fn d3d12_resource_transition_subresource(
cmd: &ID3D12GraphicsCommandList,
resource: &ID3D12Resource,
before: D3D12_RESOURCE_STATES,
after: D3D12_RESOURCE_STATES,
subresource: u32,
) -> [D3D12_RESOURCE_BARRIER; 1] {
2023-02-07 13:56:24 +11:00
let barrier = [d3d12_get_resource_transition_subresource(
resource,
before,
after,
subresource,
)];
2023-02-06 08:17:23 +11:00
unsafe { cmd.ResourceBarrier(&barrier) }
barrier
2023-01-25 17:32:10 +11:00
}
2023-04-23 15:13:31 +10:00
pub(crate) fn d3d12_update_subresources(
2023-02-06 08:17:23 +11:00
cmd: &ID3D12GraphicsCommandList,
destination_resource: &ID3D12Resource,
intermediate_resource: &ID3D12Resource,
intermediate_offset: u64,
first_subresouce: u32,
num_subresources: u32,
source: &[D3D12_SUBRESOURCE_DATA],
2023-04-23 15:13:31 +10:00
gc: &mut FrameResiduals,
2023-01-25 17:32:10 +11:00
) -> error::Result<u64> {
// let allocation_size = std::mem::size_of::<D3D12_PLACED_SUBRESOURCE_FOOTPRINT>()
// + std::mem::size_of::<u32>()
// + std::mem::size_of::<u64>() * num_subresources;
unsafe {
let destination_desc = destination_resource.GetDesc();
let mut device: Option<ID3D12Device> = None;
destination_resource.GetDevice(&mut device)?;
assume_d3d12_init!(device, "GetDevice");
2023-02-06 08:17:23 +11:00
let mut layouts =
vec![D3D12_PLACED_SUBRESOURCE_FOOTPRINT::default(); num_subresources as usize];
2023-01-25 17:32:10 +11:00
let mut num_rows = vec![0; num_subresources as usize];
2023-02-06 08:17:23 +11:00
let mut row_sizes_in_bytes = vec![0; num_subresources as usize];
2023-01-25 17:32:10 +11:00
let mut required_size = 0;
2023-02-10 13:03:55 +11:00
2023-01-25 17:32:10 +11:00
// texture upload
2023-02-10 13:03:55 +11:00
device.GetCopyableFootprints(
&destination_desc,
first_subresouce,
num_subresources,
intermediate_offset,
Some(layouts.as_mut_ptr()),
Some(num_rows.as_mut_ptr()),
Some(row_sizes_in_bytes.as_mut_ptr()),
Some(&mut required_size),
);
2023-01-25 17:32:10 +11:00
update_subresources(
cmd,
destination_resource,
intermediate_resource,
first_subresouce,
num_subresources,
required_size,
&layouts,
&num_rows,
&row_sizes_in_bytes,
source,
2023-07-20 15:13:22 +10:00
gc,
2023-01-25 17:32:10 +11:00
)
}
}
#[allow(clippy::too_many_arguments)]
fn update_subresources(
cmd: &ID3D12GraphicsCommandList,
destination_resource: &ID3D12Resource,
intermediate_resource: &ID3D12Resource,
first_subresouce: u32,
num_subresources: u32,
required_size: u64,
layouts: &[D3D12_PLACED_SUBRESOURCE_FOOTPRINT],
num_rows: &[u32],
row_sizes_in_bytes: &[u64],
source_data: &[D3D12_SUBRESOURCE_DATA],
2023-04-23 15:13:31 +10:00
gc: &mut FrameResiduals,
2023-01-25 17:32:10 +11:00
) -> error::Result<u64> {
// ToDo: implement validation as in the original function
unsafe {
let mut data = std::ptr::null_mut();
intermediate_resource.Map(0, None, Some(&mut data))?;
for i in 0..num_subresources as usize {
let dest_data = D3D12_MEMCPY_DEST {
2023-02-06 08:17:23 +11:00
pData: data.offset(layouts[i].Offset as isize) as *mut std::ffi::c_void,
2023-01-25 17:32:10 +11:00
RowPitch: layouts[i].Footprint.RowPitch as usize,
2023-02-06 08:17:23 +11:00
SlicePitch: ((layouts[i].Footprint.RowPitch) * num_rows[i]) as usize,
2023-01-25 17:32:10 +11:00
};
memcpy_subresource(
&dest_data,
&source_data[i],
row_sizes_in_bytes[i],
num_rows[i],
layouts[i].Footprint.Depth,
);
}
intermediate_resource.Unmap(0, None);
}
unsafe {
let destination_desc = destination_resource.GetDesc();
if destination_desc.Dimension == D3D12_RESOURCE_DIMENSION_BUFFER {
cmd.CopyBufferRegion(
destination_resource,
0,
intermediate_resource,
layouts[0].Offset,
layouts[0].Footprint.Width as u64,
);
} else {
for i in 0..num_subresources as usize {
let dest_location = D3D12_TEXTURE_COPY_LOCATION {
2023-04-23 15:13:31 +10:00
pResource: ManuallyDrop::new(Some(destination_resource.clone())),
2023-01-25 17:32:10 +11:00
Type: D3D12_TEXTURE_COPY_TYPE_SUBRESOURCE_INDEX,
Anonymous: D3D12_TEXTURE_COPY_LOCATION_0 {
2023-02-06 08:17:23 +11:00
SubresourceIndex: i as u32 + first_subresouce,
2023-01-25 17:32:10 +11:00
},
};
let source_location = D3D12_TEXTURE_COPY_LOCATION {
2023-04-23 15:13:31 +10:00
pResource: ManuallyDrop::new(Some(intermediate_resource.clone())),
2023-01-25 17:32:10 +11:00
Type: D3D12_TEXTURE_COPY_TYPE_PLACED_FOOTPRINT,
Anonymous: D3D12_TEXTURE_COPY_LOCATION_0 {
2023-02-06 08:17:23 +11:00
PlacedFootprint: layouts[i],
2023-01-25 17:32:10 +11:00
},
};
2023-02-06 08:17:23 +11:00
cmd.CopyTextureRegion(&dest_location, 0, 0, 0, &source_location, None);
2023-04-23 15:13:31 +10:00
gc.dispose_resource(dest_location.pResource);
gc.dispose_resource(source_location.pResource);
2023-01-25 17:32:10 +11:00
}
}
Ok(required_size)
}
}
// this function should not leak to the public API, so
// there is no point in using struct wrappers
/// Copies `num_slices` slices of `num_rows` rows each from `src` to `dest`, copying
/// `row_sizes_in_bytes` bytes per row and stepping through each side with its own row
/// and slice pitch.
///
/// # Safety
///
/// For every slice and row index in range, the source and destination row addresses
/// derived from the respective base pointer and pitches must be valid for
/// `row_sizes_in_bytes` bytes of reading and writing respectively, and the two regions
/// must not overlap.
unsafe fn memcpy_subresource(
    dest: &D3D12_MEMCPY_DEST,
    src: &D3D12_SUBRESOURCE_DATA,
    row_sizes_in_bytes: u64,
    num_rows: u32,
    num_slices: u32,
) {
    let bytes_per_row = row_sizes_in_bytes as usize;
    let slice_count = num_slices as usize;
    let row_count = num_rows as usize;

    unsafe {
        let dest_base = dest.pData.cast::<u8>();
        let src_base = src.pData.cast::<u8>();

        for slice in 0..slice_count {
            let dest_slice = dest_base.add(dest.SlicePitch * slice);
            let src_slice = src_base.offset(src.SlicePitch * slice as isize);

            for row in 0..row_count {
                let src_row = src_slice.offset(src.RowPitch * row as isize);
                let dest_row = dest_slice.add(dest.RowPitch * row);
                std::ptr::copy_nonoverlapping(src_row, dest_row, bytes_per_row);
            }
        }
    }
}