mirror of
https://github.com/italicsjenga/vello.git
synced 2025-01-25 18:56:35 +11:00
Merge branch 'master' into mtl_guest
This commit is contained in:
commit
012d679e3d
18 changed files with 132 additions and 49 deletions
|
@ -225,6 +225,12 @@ pub trait CmdBuf<D: Device> {
|
||||||
/// Prepare the timestamps for reading. This isn't required on Vulkan but
|
/// Prepare the timestamps for reading. This isn't required on Vulkan but
|
||||||
/// is required on (at least) DX12.
|
/// is required on (at least) DX12.
|
||||||
unsafe fn finish_timestamps(&mut self, _pool: &D::QueryPool) {}
|
unsafe fn finish_timestamps(&mut self, _pool: &D::QueryPool) {}
|
||||||
|
|
||||||
|
/// Begin a labeled section for debugging and profiling purposes.
|
||||||
|
unsafe fn begin_debug_label(&mut self, label: &str) {}
|
||||||
|
|
||||||
|
/// End a section opened by `begin_debug_label`.
|
||||||
|
unsafe fn end_debug_label(&mut self) {}
|
||||||
}
|
}
|
||||||
|
|
||||||
/// A builder for descriptor sets with more complex layouts.
|
/// A builder for descriptor sets with more complex layouts.
|
||||||
|
|
|
@ -598,6 +598,16 @@ impl CmdBuf {
|
||||||
self.cmd_buf().finish_timestamps(pool);
|
self.cmd_buf().finish_timestamps(pool);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/// Begin a labeled section for debugging and profiling purposes.
|
||||||
|
pub unsafe fn begin_debug_label(&mut self, label: &str) {
|
||||||
|
self.cmd_buf().begin_debug_label(label);
|
||||||
|
}
|
||||||
|
|
||||||
|
/// End a section opened by `begin_debug_label`.
|
||||||
|
pub unsafe fn end_debug_label(&mut self) {
|
||||||
|
self.cmd_buf().end_debug_label();
|
||||||
|
}
|
||||||
|
|
||||||
/// Make sure the resource lives until the command buffer completes.
|
/// Make sure the resource lives until the command buffer completes.
|
||||||
///
|
///
|
||||||
/// The submitted command buffer will hold this reference until the corresponding
|
/// The submitted command buffer will hold this reference until the corresponding
|
||||||
|
|
|
@ -772,6 +772,22 @@ impl CmdBuf {
|
||||||
CmdBuf::Mtl(c) => c.finish_timestamps(pool.mtl()),
|
CmdBuf::Mtl(c) => c.finish_timestamps(pool.mtl()),
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
pub unsafe fn begin_debug_label(&mut self, label: &str) {
|
||||||
|
mux_match! { self;
|
||||||
|
CmdBuf::Vk(c) => c.begin_debug_label(label),
|
||||||
|
CmdBuf::Dx12(c) => c.begin_debug_label(label),
|
||||||
|
CmdBuf::Mtl(c) => c.begin_debug_label(label),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pub unsafe fn end_debug_label(&mut self) {
|
||||||
|
mux_match! { self;
|
||||||
|
CmdBuf::Vk(c) => c.end_debug_label(),
|
||||||
|
CmdBuf::Dx12(c) => c.end_debug_label(),
|
||||||
|
CmdBuf::Mtl(c) => c.end_debug_label(),
|
||||||
|
}
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
impl Buffer {
|
impl Buffer {
|
||||||
|
|
|
@ -8,6 +8,7 @@ use std::sync::Arc;
|
||||||
|
|
||||||
use ash::extensions::{ext::DebugUtils, khr};
|
use ash::extensions::{ext::DebugUtils, khr};
|
||||||
use ash::{vk, Device, Entry, Instance};
|
use ash::{vk, Device, Entry, Instance};
|
||||||
|
use ash::vk::DebugUtilsLabelEXT;
|
||||||
|
|
||||||
use smallvec::SmallVec;
|
use smallvec::SmallVec;
|
||||||
|
|
||||||
|
@ -23,7 +24,7 @@ pub struct VkInstance {
|
||||||
entry: Entry,
|
entry: Entry,
|
||||||
instance: Instance,
|
instance: Instance,
|
||||||
vk_version: u32,
|
vk_version: u32,
|
||||||
_dbg_loader: Option<DebugUtils>,
|
dbg_loader: Option<DebugUtils>,
|
||||||
_dbg_callbk: Option<vk::DebugUtilsMessengerEXT>,
|
_dbg_callbk: Option<vk::DebugUtilsMessengerEXT>,
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -39,6 +40,7 @@ pub struct VkDevice {
|
||||||
|
|
||||||
struct RawDevice {
|
struct RawDevice {
|
||||||
device: Device,
|
device: Device,
|
||||||
|
dbg_loader: Option<DebugUtils>,
|
||||||
}
|
}
|
||||||
|
|
||||||
pub struct VkSurface {
|
pub struct VkSurface {
|
||||||
|
@ -202,7 +204,7 @@ impl VkInstance {
|
||||||
None,
|
None,
|
||||||
)?;
|
)?;
|
||||||
|
|
||||||
let (_dbg_loader, _dbg_callbk) = if has_debug_ext {
|
let (dbg_loader, _dbg_callbk) = if has_debug_ext {
|
||||||
let dbg_info = vk::DebugUtilsMessengerCreateInfoEXT::builder()
|
let dbg_info = vk::DebugUtilsMessengerCreateInfoEXT::builder()
|
||||||
.message_severity(
|
.message_severity(
|
||||||
vk::DebugUtilsMessageSeverityFlagsEXT::ERROR
|
vk::DebugUtilsMessageSeverityFlagsEXT::ERROR
|
||||||
|
@ -231,7 +233,7 @@ impl VkInstance {
|
||||||
entry,
|
entry,
|
||||||
instance,
|
instance,
|
||||||
vk_version,
|
vk_version,
|
||||||
_dbg_loader,
|
dbg_loader,
|
||||||
_dbg_callbk,
|
_dbg_callbk,
|
||||||
};
|
};
|
||||||
|
|
||||||
|
@ -317,7 +319,7 @@ impl VkInstance {
|
||||||
let queue_index = 0;
|
let queue_index = 0;
|
||||||
let queue = device.get_device_queue(qfi, queue_index);
|
let queue = device.get_device_queue(qfi, queue_index);
|
||||||
|
|
||||||
let device = Arc::new(RawDevice { device });
|
let device = Arc::new(RawDevice { device, dbg_loader: self.dbg_loader.clone() });
|
||||||
|
|
||||||
let props = self.instance.get_physical_device_properties(pdevice);
|
let props = self.instance.get_physical_device_properties(pdevice);
|
||||||
let timestamp_period = props.limits.timestamp_period;
|
let timestamp_period = props.limits.timestamp_period;
|
||||||
|
@ -1112,6 +1114,20 @@ impl crate::backend::CmdBuf<VkDevice> for CmdBuf {
|
||||||
query,
|
query,
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
unsafe fn begin_debug_label(&mut self, label: &str) {
|
||||||
|
if let Some(utils) = &self.device.dbg_loader {
|
||||||
|
let label_cstr = CString::new(label).unwrap();
|
||||||
|
let label_ext = DebugUtilsLabelEXT::builder().label_name(&label_cstr).build();
|
||||||
|
utils.cmd_begin_debug_utils_label(self.cmd_buf, &label_ext);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
unsafe fn end_debug_label(&mut self) {
|
||||||
|
if let Some(utils) = &self.device.dbg_loader {
|
||||||
|
utils.cmd_end_debug_utils_label(self.cmd_buf);
|
||||||
|
}
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
impl crate::backend::DescriptorSetBuilder<VkDevice> for DescriptorSetBuilder {
|
impl crate::backend::DescriptorSetBuilder<VkDevice> for DescriptorSetBuilder {
|
||||||
|
|
5
piet-gpu/shader/.clang-format
Normal file
5
piet-gpu/shader/.clang-format
Normal file
|
@ -0,0 +1,5 @@
|
||||||
|
BasedOnStyle: LLVM
|
||||||
|
IndentWidth: 4
|
||||||
|
ColumnLimit: 120
|
||||||
|
AllowShortFunctionsOnASingleLine: None
|
||||||
|
SortIncludes: false
|
|
@ -77,7 +77,8 @@ void main() {
|
||||||
// long as it doesn't cross the left edge.
|
// long as it doesn't cross the left edge.
|
||||||
row_count = 0;
|
row_count = 0;
|
||||||
}
|
}
|
||||||
Alloc path_alloc = new_alloc(path.tiles.offset, (path.bbox.z - path.bbox.x) * (path.bbox.w - path.bbox.y) * Tile_size, mem_ok);
|
Alloc path_alloc = new_alloc(
|
||||||
|
path.tiles.offset, (path.bbox.z - path.bbox.x) * (path.bbox.w - path.bbox.y) * Tile_size, mem_ok);
|
||||||
sh_row_alloc[th_ix] = path_alloc;
|
sh_row_alloc[th_ix] = path_alloc;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -81,7 +81,8 @@ void main() {
|
||||||
x1 = clamp(x1, x0, int(width_in_bins));
|
x1 = clamp(x1, x0, int(width_in_bins));
|
||||||
y0 = clamp(y0, 0, int(height_in_bins));
|
y0 = clamp(y0, 0, int(height_in_bins));
|
||||||
y1 = clamp(y1, y0, int(height_in_bins));
|
y1 = clamp(y1, y0, int(height_in_bins));
|
||||||
if (x0 == x1) y1 = y0;
|
if (x0 == x1)
|
||||||
|
y1 = y0;
|
||||||
int x = x0, y = y0;
|
int x = x0, y = y0;
|
||||||
uint my_slice = gl_LocalInvocationID.x / 32;
|
uint my_slice = gl_LocalInvocationID.x / 32;
|
||||||
uint my_mask = 1u << (gl_LocalInvocationID.x & 31);
|
uint my_mask = 1u << (gl_LocalInvocationID.x & 31);
|
||||||
|
|
|
@ -118,3 +118,7 @@ build gen/draw_leaf.spv: glsl draw_leaf.comp | scene.h drawtag.h annotated.h set
|
||||||
build gen/draw_leaf.hlsl: hlsl gen/draw_leaf.spv
|
build gen/draw_leaf.hlsl: hlsl gen/draw_leaf.spv
|
||||||
build gen/draw_leaf.dxil: dxil gen/draw_leaf.hlsl
|
build gen/draw_leaf.dxil: dxil gen/draw_leaf.hlsl
|
||||||
build gen/draw_leaf.msl: msl gen/draw_leaf.spv
|
build gen/draw_leaf.msl: msl gen/draw_leaf.spv
|
||||||
|
|
||||||
|
build spv: phony gen/backdrop_lg.spv gen/backdrop.spv gen/bbox_clear.spv gen/binning.spv gen/coarse.spv gen/draw_leaf.spv gen/draw_reduce.spv gen/draw_root.spv gen/kernel4.spv gen/path_coarse.spv gen/pathseg.spv gen/pathtag_reduce.spv gen/pathtag_root.spv gen/tile_alloc.spv gen/transform_leaf.spv gen/transform_reduce.spv gen/transform_root.spv
|
||||||
|
build dxil: phony gen/backdrop.hlsl gen/backdrop_lg.hlsl gen/bbox_clear.hlsl gen/binning.hlsl gen/coarse.hlsl gen/draw_leaf.hlsl gen/draw_reduce.hlsl gen/draw_root.hlsl gen/kernel4.hlsl gen/path_coarse.hlsl gen/pathseg.hlsl gen/pathtag_reduce.hlsl gen/pathtag_root.hlsl gen/tile_alloc.hlsl gen/transform_leaf.hlsl gen/transform_reduce.hlsl gen/transform_root.hlsl
|
||||||
|
build msl: phony gen/backdrop_lg.msl gen/backdrop.msl gen/bbox_clear.msl gen/binning.msl gen/coarse.msl gen/draw_leaf.msl gen/draw_reduce.msl gen/draw_root.msl gen/kernel4.msl gen/path_coarse.msl gen/pathseg.msl gen/pathtag_reduce.msl gen/pathtag_root.msl gen/tile_alloc.msl gen/transform_leaf.msl gen/transform_reduce.msl gen/transform_root.msl
|
||||||
|
|
|
@ -8,7 +8,8 @@
|
||||||
// Each workgroup operating on one bin by stream compacting
|
// Each workgroup operating on one bin by stream compacting
|
||||||
// the elements corresponding to the bin.
|
// the elements corresponding to the bin.
|
||||||
//
|
//
|
||||||
// As output we have an ordered command stream per tile. Every tile from a path (backdrop + segment list) will be encoded.
|
// As output we have an ordered command stream per tile. Every tile from a path (backdrop + segment list) will be
|
||||||
|
// encoded.
|
||||||
|
|
||||||
#version 450
|
#version 450
|
||||||
#extension GL_GOOGLE_include_directive : enable
|
#extension GL_GOOGLE_include_directive : enable
|
||||||
|
@ -245,7 +246,8 @@ void main() {
|
||||||
// base relative to bin
|
// base relative to bin
|
||||||
uint base = path.tiles.offset - uint(dy * stride + dx) * Tile_size;
|
uint base = path.tiles.offset - uint(dy * stride + dx) * Tile_size;
|
||||||
sh_tile_base[th_ix] = base;
|
sh_tile_base[th_ix] = base;
|
||||||
Alloc path_alloc = new_alloc(path.tiles.offset, (path.bbox.z - path.bbox.x) * (path.bbox.w - path.bbox.y) * Tile_size, mem_ok);
|
Alloc path_alloc = new_alloc(path.tiles.offset,
|
||||||
|
(path.bbox.z - path.bbox.x) * (path.bbox.w - path.bbox.y) * Tile_size, mem_ok);
|
||||||
write_tile_alloc(th_ix, path_alloc);
|
write_tile_alloc(th_ix, path_alloc);
|
||||||
break;
|
break;
|
||||||
default:
|
default:
|
||||||
|
@ -284,7 +286,8 @@ void main() {
|
||||||
if (tag == Annotated_BeginClip || tag == Annotated_EndClip) {
|
if (tag == Annotated_BeginClip || tag == Annotated_EndClip) {
|
||||||
include_tile = true;
|
include_tile = true;
|
||||||
} else if (mem_ok) {
|
} else if (mem_ok) {
|
||||||
Tile tile = Tile_read(read_tile_alloc(el_ix, mem_ok), TileRef(sh_tile_base[el_ix] + (sh_tile_stride[el_ix] * y + x) * Tile_size));
|
Tile tile = Tile_read(read_tile_alloc(el_ix, mem_ok),
|
||||||
|
TileRef(sh_tile_base[el_ix] + (sh_tile_stride[el_ix] * y + x) * Tile_size));
|
||||||
// Include the path in the tile if
|
// Include the path in the tile if
|
||||||
// - the tile contains at least a segment (tile offset non-zero)
|
// - the tile contains at least a segment (tile offset non-zero)
|
||||||
// - the tile is completely covered (backdrop non-zero)
|
// - the tile is completely covered (backdrop non-zero)
|
||||||
|
@ -329,8 +332,9 @@ void main() {
|
||||||
if (clip_zero_depth == 0) {
|
if (clip_zero_depth == 0) {
|
||||||
switch (tag.tag) {
|
switch (tag.tag) {
|
||||||
case Annotated_Color:
|
case Annotated_Color:
|
||||||
Tile tile = Tile_read(read_tile_alloc(element_ref_ix, mem_ok), TileRef(sh_tile_base[element_ref_ix]
|
Tile tile = Tile_read(read_tile_alloc(element_ref_ix, mem_ok),
|
||||||
+ (sh_tile_stride[element_ref_ix] * tile_y + tile_x) * Tile_size));
|
TileRef(sh_tile_base[element_ref_ix] +
|
||||||
|
(sh_tile_stride[element_ref_ix] * tile_y + tile_x) * Tile_size));
|
||||||
AnnoColor fill = Annotated_Color_read(conf.anno_alloc, ref);
|
AnnoColor fill = Annotated_Color_read(conf.anno_alloc, ref);
|
||||||
if (!alloc_cmd(cmd_alloc, cmd_ref, cmd_limit)) {
|
if (!alloc_cmd(cmd_alloc, cmd_ref, cmd_limit)) {
|
||||||
break;
|
break;
|
||||||
|
@ -340,8 +344,9 @@ void main() {
|
||||||
cmd_ref.offset += 4 + CmdColor_size;
|
cmd_ref.offset += 4 + CmdColor_size;
|
||||||
break;
|
break;
|
||||||
case Annotated_LinGradient:
|
case Annotated_LinGradient:
|
||||||
tile = Tile_read(read_tile_alloc(element_ref_ix, mem_ok), TileRef(sh_tile_base[element_ref_ix]
|
tile = Tile_read(read_tile_alloc(element_ref_ix, mem_ok),
|
||||||
+ (sh_tile_stride[element_ref_ix] * tile_y + tile_x) * Tile_size));
|
TileRef(sh_tile_base[element_ref_ix] +
|
||||||
|
(sh_tile_stride[element_ref_ix] * tile_y + tile_x) * Tile_size));
|
||||||
AnnoLinGradient lin = Annotated_LinGradient_read(conf.anno_alloc, ref);
|
AnnoLinGradient lin = Annotated_LinGradient_read(conf.anno_alloc, ref);
|
||||||
if (!alloc_cmd(cmd_alloc, cmd_ref, cmd_limit)) {
|
if (!alloc_cmd(cmd_alloc, cmd_ref, cmd_limit)) {
|
||||||
break;
|
break;
|
||||||
|
@ -356,8 +361,9 @@ void main() {
|
||||||
cmd_ref.offset += 4 + CmdLinGrad_size;
|
cmd_ref.offset += 4 + CmdLinGrad_size;
|
||||||
break;
|
break;
|
||||||
case Annotated_Image:
|
case Annotated_Image:
|
||||||
tile = Tile_read(read_tile_alloc(element_ref_ix, mem_ok), TileRef(sh_tile_base[element_ref_ix]
|
tile = Tile_read(read_tile_alloc(element_ref_ix, mem_ok),
|
||||||
+ (sh_tile_stride[element_ref_ix] * tile_y + tile_x) * Tile_size));
|
TileRef(sh_tile_base[element_ref_ix] +
|
||||||
|
(sh_tile_stride[element_ref_ix] * tile_y + tile_x) * Tile_size));
|
||||||
AnnoImage fill_img = Annotated_Image_read(conf.anno_alloc, ref);
|
AnnoImage fill_img = Annotated_Image_read(conf.anno_alloc, ref);
|
||||||
if (!alloc_cmd(cmd_alloc, cmd_ref, cmd_limit)) {
|
if (!alloc_cmd(cmd_alloc, cmd_ref, cmd_limit)) {
|
||||||
break;
|
break;
|
||||||
|
@ -367,8 +373,9 @@ void main() {
|
||||||
cmd_ref.offset += 4 + CmdImage_size;
|
cmd_ref.offset += 4 + CmdImage_size;
|
||||||
break;
|
break;
|
||||||
case Annotated_BeginClip:
|
case Annotated_BeginClip:
|
||||||
tile = Tile_read(read_tile_alloc(element_ref_ix, mem_ok), TileRef(sh_tile_base[element_ref_ix]
|
tile = Tile_read(read_tile_alloc(element_ref_ix, mem_ok),
|
||||||
+ (sh_tile_stride[element_ref_ix] * tile_y + tile_x) * Tile_size));
|
TileRef(sh_tile_base[element_ref_ix] +
|
||||||
|
(sh_tile_stride[element_ref_ix] * tile_y + tile_x) * Tile_size));
|
||||||
if (tile.tile.offset == 0 && tile.backdrop == 0) {
|
if (tile.tile.offset == 0 && tile.backdrop == 0) {
|
||||||
clip_zero_depth = clip_depth + 1;
|
clip_zero_depth = clip_depth + 1;
|
||||||
} else if (tile.tile.offset == 0 && clip_depth < 32) {
|
} else if (tile.tile.offset == 0 && clip_depth < 32) {
|
||||||
|
@ -418,7 +425,8 @@ void main() {
|
||||||
barrier();
|
barrier();
|
||||||
|
|
||||||
rd_ix += N_TILE;
|
rd_ix += N_TILE;
|
||||||
if (rd_ix >= ready_ix && partition_ix >= n_partitions) break;
|
if (rd_ix >= ready_ix && partition_ix >= n_partitions)
|
||||||
|
break;
|
||||||
}
|
}
|
||||||
if (bin_tile_x + tile_x < conf.width_in_tiles && bin_tile_y + tile_y < conf.height_in_tiles) {
|
if (bin_tile_x + tile_x < conf.width_in_tiles && bin_tile_y + tile_y < conf.height_in_tiles) {
|
||||||
Cmd_End_write(cmd_alloc, cmd_ref);
|
Cmd_End_write(cmd_alloc, cmd_ref);
|
||||||
|
|
|
@ -3,7 +3,6 @@
|
||||||
// The leaf scan pass for draw tag scan implemented as a tree reduction.
|
// The leaf scan pass for draw tag scan implemented as a tree reduction.
|
||||||
// This stage can be fused with its consumer but is separate now.
|
// This stage can be fused with its consumer but is separate now.
|
||||||
|
|
||||||
|
|
||||||
#version 450
|
#version 450
|
||||||
#extension GL_GOOGLE_include_directive : enable
|
#extension GL_GOOGLE_include_directive : enable
|
||||||
|
|
||||||
|
|
|
@ -14,7 +14,7 @@
|
||||||
|
|
||||||
#define CHUNK_X 2
|
#define CHUNK_X 2
|
||||||
#define CHUNK_Y 4
|
#define CHUNK_Y 4
|
||||||
#define CHUNK CHUNK_X * CHUNK_Y
|
#define CHUNK (CHUNK_X * CHUNK_Y)
|
||||||
#define CHUNK_DX (TILE_WIDTH_PX / CHUNK_X)
|
#define CHUNK_DX (TILE_WIDTH_PX / CHUNK_X)
|
||||||
#define CHUNK_DY (TILE_HEIGHT_PX / CHUNK_Y)
|
#define CHUNK_DY (TILE_HEIGHT_PX / CHUNK_Y)
|
||||||
layout(local_size_x = CHUNK_DX, local_size_y = CHUNK_DY) in;
|
layout(local_size_x = CHUNK_DX, local_size_y = CHUNK_DY) in;
|
||||||
|
@ -86,7 +86,8 @@ void main() {
|
||||||
Alloc cmd_alloc = slice_mem(conf.ptcl_alloc, tile_ix * PTCL_INITIAL_ALLOC, PTCL_INITIAL_ALLOC);
|
Alloc cmd_alloc = slice_mem(conf.ptcl_alloc, tile_ix * PTCL_INITIAL_ALLOC, PTCL_INITIAL_ALLOC);
|
||||||
CmdRef cmd_ref = CmdRef(cmd_alloc.offset);
|
CmdRef cmd_ref = CmdRef(cmd_alloc.offset);
|
||||||
|
|
||||||
uvec2 xy_uint = uvec2(gl_LocalInvocationID.x + TILE_WIDTH_PX * gl_WorkGroupID.x, gl_LocalInvocationID.y + TILE_HEIGHT_PX * gl_WorkGroupID.y);
|
uvec2 xy_uint = uvec2(gl_LocalInvocationID.x + TILE_WIDTH_PX * gl_WorkGroupID.x,
|
||||||
|
gl_LocalInvocationID.y + TILE_HEIGHT_PX * gl_WorkGroupID.y);
|
||||||
vec2 xy = vec2(xy_uint);
|
vec2 xy = vec2(xy_uint);
|
||||||
mediump vec4 rgba[CHUNK];
|
mediump vec4 rgba[CHUNK];
|
||||||
uint blend_stack[MAX_BLEND_STACK][CHUNK];
|
uint blend_stack[MAX_BLEND_STACK][CHUNK];
|
||||||
|
@ -108,7 +109,8 @@ void main() {
|
||||||
// Calculate distance field from all the line segments in this tile.
|
// Calculate distance field from all the line segments in this tile.
|
||||||
CmdStroke stroke = Cmd_Stroke_read(cmd_alloc, cmd_ref);
|
CmdStroke stroke = Cmd_Stroke_read(cmd_alloc, cmd_ref);
|
||||||
mediump float df[CHUNK];
|
mediump float df[CHUNK];
|
||||||
for (uint k = 0; k < CHUNK; k++) df[k] = 1e9;
|
for (uint k = 0; k < CHUNK; k++)
|
||||||
|
df[k] = 1e9;
|
||||||
TileSegRef tile_seg_ref = TileSegRef(stroke.tile_ref);
|
TileSegRef tile_seg_ref = TileSegRef(stroke.tile_ref);
|
||||||
do {
|
do {
|
||||||
TileSeg seg = TileSeg_read(new_alloc(tile_seg_ref.offset, TileSeg_size, mem_ok), tile_seg_ref);
|
TileSeg seg = TileSeg_read(new_alloc(tile_seg_ref.offset, TileSeg_size, mem_ok), tile_seg_ref);
|
||||||
|
@ -128,7 +130,8 @@ void main() {
|
||||||
break;
|
break;
|
||||||
case Cmd_Fill:
|
case Cmd_Fill:
|
||||||
CmdFill fill = Cmd_Fill_read(cmd_alloc, cmd_ref);
|
CmdFill fill = Cmd_Fill_read(cmd_alloc, cmd_ref);
|
||||||
for (uint k = 0; k < CHUNK; k++) area[k] = float(fill.backdrop);
|
for (uint k = 0; k < CHUNK; k++)
|
||||||
|
area[k] = float(fill.backdrop);
|
||||||
tile_seg_ref = TileSegRef(fill.tile_ref);
|
tile_seg_ref = TileSegRef(fill.tile_ref);
|
||||||
// Calculate coverage based on backdrop + coverage of each line segment
|
// Calculate coverage based on backdrop + coverage of each line segment
|
||||||
do {
|
do {
|
||||||
|
|
|
@ -139,7 +139,8 @@ void main() {
|
||||||
bool is_stroke = fill_mode_from_flags(tag.flags) == MODE_STROKE;
|
bool is_stroke = fill_mode_from_flags(tag.flags) == MODE_STROKE;
|
||||||
uint path_ix = cubic.path_ix;
|
uint path_ix = cubic.path_ix;
|
||||||
Path path = Path_read(conf.tile_alloc, PathRef(conf.tile_alloc.offset + path_ix * Path_size));
|
Path path = Path_read(conf.tile_alloc, PathRef(conf.tile_alloc.offset + path_ix * Path_size));
|
||||||
Alloc path_alloc = new_alloc(path.tiles.offset, (path.bbox.z - path.bbox.x) * (path.bbox.w - path.bbox.y) * Tile_size, mem_ok);
|
Alloc path_alloc =
|
||||||
|
new_alloc(path.tiles.offset, (path.bbox.z - path.bbox.x) * (path.bbox.w - path.bbox.y) * Tile_size, mem_ok);
|
||||||
ivec4 bbox = ivec4(path.bbox);
|
ivec4 bbox = ivec4(path.bbox);
|
||||||
vec2 p0 = cubic.p0;
|
vec2 p0 = cubic.p0;
|
||||||
qp0 = cubic.p0;
|
qp0 = cubic.p0;
|
||||||
|
|
|
@ -46,8 +46,7 @@ Monoid combine_monoid(Monoid a, Monoid b) {
|
||||||
if ((a.flags & FLAG_RESET_BBOX) == 0 && b.bbox.z <= b.bbox.x && b.bbox.w <= b.bbox.y) {
|
if ((a.flags & FLAG_RESET_BBOX) == 0 && b.bbox.z <= b.bbox.x && b.bbox.w <= b.bbox.y) {
|
||||||
c.bbox = a.bbox;
|
c.bbox = a.bbox;
|
||||||
} else if ((a.flags & FLAG_RESET_BBOX) == 0 && (b.flags & FLAG_SET_BBOX) == 0 &&
|
} else if ((a.flags & FLAG_RESET_BBOX) == 0 && (b.flags & FLAG_SET_BBOX) == 0 &&
|
||||||
(a.bbox.z > a.bbox.x || a.bbox.w > a.bbox.y))
|
(a.bbox.z > a.bbox.x || a.bbox.w > a.bbox.y)) {
|
||||||
{
|
|
||||||
c.bbox.xy = min(a.bbox.xy, c.bbox.xy);
|
c.bbox.xy = min(a.bbox.xy, c.bbox.xy);
|
||||||
c.bbox.zw = max(a.bbox.zw, c.bbox.zw);
|
c.bbox.zw = max(a.bbox.zw, c.bbox.zw);
|
||||||
}
|
}
|
||||||
|
|
|
@ -388,6 +388,7 @@ impl Renderer {
|
||||||
cmd_buf.image_barrier(&self.gradients, ImageLayout::BlitDst, ImageLayout::General);
|
cmd_buf.image_barrier(&self.gradients, ImageLayout::BlitDst, ImageLayout::General);
|
||||||
cmd_buf.reset_query_pool(&query_pool);
|
cmd_buf.reset_query_pool(&query_pool);
|
||||||
cmd_buf.write_timestamp(&query_pool, 0);
|
cmd_buf.write_timestamp(&query_pool, 0);
|
||||||
|
cmd_buf.begin_debug_label("Element bounding box calculation");
|
||||||
self.element_stage.record(
|
self.element_stage.record(
|
||||||
cmd_buf,
|
cmd_buf,
|
||||||
&self.element_code,
|
&self.element_code,
|
||||||
|
@ -397,43 +398,53 @@ impl Renderer {
|
||||||
self.n_pathtag as u32,
|
self.n_pathtag as u32,
|
||||||
self.n_drawobj as u64,
|
self.n_drawobj as u64,
|
||||||
);
|
);
|
||||||
|
cmd_buf.end_debug_label();
|
||||||
cmd_buf.write_timestamp(&query_pool, 1);
|
cmd_buf.write_timestamp(&query_pool, 1);
|
||||||
cmd_buf.memory_barrier();
|
cmd_buf.memory_barrier();
|
||||||
|
cmd_buf.begin_debug_label("Tile allocation");
|
||||||
cmd_buf.dispatch(
|
cmd_buf.dispatch(
|
||||||
&self.tile_pipeline,
|
&self.tile_pipeline,
|
||||||
&self.tile_ds,
|
&self.tile_ds,
|
||||||
(((self.n_paths + 255) / 256) as u32, 1, 1),
|
(((self.n_paths + 255) / 256) as u32, 1, 1),
|
||||||
(256, 1, 1),
|
(256, 1, 1),
|
||||||
);
|
);
|
||||||
|
cmd_buf.end_debug_label();
|
||||||
cmd_buf.write_timestamp(&query_pool, 2);
|
cmd_buf.write_timestamp(&query_pool, 2);
|
||||||
cmd_buf.memory_barrier();
|
cmd_buf.memory_barrier();
|
||||||
|
cmd_buf.begin_debug_label("Path flattening");
|
||||||
cmd_buf.dispatch(
|
cmd_buf.dispatch(
|
||||||
&self.path_pipeline,
|
&self.path_pipeline,
|
||||||
&self.path_ds,
|
&self.path_ds,
|
||||||
(((self.n_pathseg + 31) / 32) as u32, 1, 1),
|
(((self.n_pathseg + 31) / 32) as u32, 1, 1),
|
||||||
(32, 1, 1),
|
(32, 1, 1),
|
||||||
);
|
);
|
||||||
|
cmd_buf.end_debug_label();
|
||||||
cmd_buf.write_timestamp(&query_pool, 3);
|
cmd_buf.write_timestamp(&query_pool, 3);
|
||||||
cmd_buf.memory_barrier();
|
cmd_buf.memory_barrier();
|
||||||
|
cmd_buf.begin_debug_label("Backdrop propagation");
|
||||||
cmd_buf.dispatch(
|
cmd_buf.dispatch(
|
||||||
&self.backdrop_pipeline,
|
&self.backdrop_pipeline,
|
||||||
&self.backdrop_ds,
|
&self.backdrop_ds,
|
||||||
(((self.n_paths + 255) / 256) as u32, 1, 1),
|
(((self.n_paths + 255) / 256) as u32, 1, 1),
|
||||||
(256, self.backdrop_y, 1),
|
(256, self.backdrop_y, 1),
|
||||||
);
|
);
|
||||||
|
cmd_buf.end_debug_label();
|
||||||
cmd_buf.write_timestamp(&query_pool, 4);
|
cmd_buf.write_timestamp(&query_pool, 4);
|
||||||
// Note: this barrier is not needed as an actual dependency between
|
// Note: this barrier is not needed as an actual dependency between
|
||||||
// pipeline stages, but I am keeping it in so that timer queries are
|
// pipeline stages, but I am keeping it in so that timer queries are
|
||||||
// easier to interpret.
|
// easier to interpret.
|
||||||
cmd_buf.memory_barrier();
|
cmd_buf.memory_barrier();
|
||||||
|
cmd_buf.begin_debug_label("Element binning");
|
||||||
cmd_buf.dispatch(
|
cmd_buf.dispatch(
|
||||||
&self.bin_pipeline,
|
&self.bin_pipeline,
|
||||||
&self.bin_ds,
|
&self.bin_ds,
|
||||||
(((self.n_paths + 255) / 256) as u32, 1, 1),
|
(((self.n_paths + 255) / 256) as u32, 1, 1),
|
||||||
(256, 1, 1),
|
(256, 1, 1),
|
||||||
);
|
);
|
||||||
|
cmd_buf.end_debug_label();
|
||||||
cmd_buf.write_timestamp(&query_pool, 5);
|
cmd_buf.write_timestamp(&query_pool, 5);
|
||||||
cmd_buf.memory_barrier();
|
cmd_buf.memory_barrier();
|
||||||
|
cmd_buf.begin_debug_label("Coarse raster");
|
||||||
cmd_buf.dispatch(
|
cmd_buf.dispatch(
|
||||||
&self.coarse_pipeline,
|
&self.coarse_pipeline,
|
||||||
&self.coarse_ds,
|
&self.coarse_ds,
|
||||||
|
@ -444,8 +455,10 @@ impl Renderer {
|
||||||
),
|
),
|
||||||
(256, 1, 1),
|
(256, 1, 1),
|
||||||
);
|
);
|
||||||
|
cmd_buf.end_debug_label();
|
||||||
cmd_buf.write_timestamp(&query_pool, 6);
|
cmd_buf.write_timestamp(&query_pool, 6);
|
||||||
cmd_buf.memory_barrier();
|
cmd_buf.memory_barrier();
|
||||||
|
cmd_buf.begin_debug_label("Fine raster");
|
||||||
cmd_buf.dispatch(
|
cmd_buf.dispatch(
|
||||||
&self.k4_pipeline,
|
&self.k4_pipeline,
|
||||||
&self.k4_ds,
|
&self.k4_ds,
|
||||||
|
@ -456,6 +469,7 @@ impl Renderer {
|
||||||
),
|
),
|
||||||
(8, 4, 1),
|
(8, 4, 1),
|
||||||
);
|
);
|
||||||
|
cmd_buf.end_debug_label();
|
||||||
cmd_buf.write_timestamp(&query_pool, 7);
|
cmd_buf.write_timestamp(&query_pool, 7);
|
||||||
cmd_buf.memory_barrier();
|
cmd_buf.memory_barrier();
|
||||||
cmd_buf.image_barrier(&self.image_dev, ImageLayout::General, ImageLayout::BlitSrc);
|
cmd_buf.image_barrier(&self.image_dev, ImageLayout::General, ImageLayout::BlitSrc);
|
||||||
|
|
Loading…
Add table
Reference in a new issue