//! Take an encoded scene and create a graph to render it use bytemuck::{Pod, Zeroable}; use crate::{ encoding::Encoding, engine::{BufProxy, ImageFormat, ImageProxy, Recording, ResourceProxy}, shaders::{self, FullShaders, Shaders}, Scene, }; const TAG_MONOID_SIZE: u64 = 12; const TAG_MONOID_FULL_SIZE: u64 = 20; const PATH_BBOX_SIZE: u64 = 24; const CUBIC_SIZE: u64 = 48; const DRAWMONOID_SIZE: u64 = 16; const MAX_DRAWINFO_SIZE: u64 = 44; const CLIP_BIC_SIZE: u64 = 8; const CLIP_EL_SIZE: u64 = 32; const CLIP_INP_SIZE: u64 = 8; const CLIP_BBOX_SIZE: u64 = 16; const PATH_SIZE: u64 = 32; const DRAW_BBOX_SIZE: u64 = 16; const BUMP_SIZE: u64 = 16; const BIN_HEADER_SIZE: u64 = 8; #[repr(C)] #[derive(Clone, Copy, Debug, Default, Zeroable, Pod)] struct Config { width_in_tiles: u32, height_in_tiles: u32, target_width: u32, target_height: u32, n_drawobj: u32, n_path: u32, n_clip: u32, bin_data_start: u32, pathtag_base: u32, pathdata_base: u32, drawtag_base: u32, drawdata_base: u32, transform_base: u32, linewidth_base: u32, } fn size_to_words(byte_size: usize) -> u32 { (byte_size / std::mem::size_of::()) as u32 } pub const fn next_multiple_of(val: u32, rhs: u32) -> u32 { match val % rhs { 0 => val, r => val + (rhs - r), } } #[allow(unused)] fn render(scene: &Scene, shaders: &Shaders) -> (Recording, BufProxy) { let mut recording = Recording::default(); let data = scene.data(); let n_pathtag = data.path_tags.len(); let pathtag_padded = align_up(n_pathtag, 4 * shaders::PATHTAG_REDUCE_WG); let pathtag_wgs = pathtag_padded / (4 * shaders::PATHTAG_REDUCE_WG as usize); let mut scene: Vec = Vec::with_capacity(pathtag_padded); let pathtag_base = size_to_words(scene.len()); scene.extend(bytemuck::cast_slice(&data.path_tags)); scene.resize(pathtag_padded, 0); let pathdata_base = size_to_words(scene.len()); scene.extend(&data.path_data); let config = Config { width_in_tiles: 64, height_in_tiles: 64, target_width: 64 * 16, target_height: 64 * 16, pathtag_base, pathdata_base, ..Default::default() }; let scene_buf = recording.upload(scene); let config_buf = recording.upload_uniform(bytemuck::bytes_of(&config)); let reduced_buf = BufProxy::new(pathtag_wgs as u64 * TAG_MONOID_SIZE); // TODO: really only need pathtag_wgs - 1 recording.dispatch( shaders.pathtag_reduce, (pathtag_wgs as u32, 1, 1), [config_buf, scene_buf, reduced_buf], ); let tagmonoid_buf = BufProxy::new(pathtag_wgs as u64 * shaders::PATHTAG_REDUCE_WG as u64 * TAG_MONOID_SIZE); recording.dispatch( shaders.pathtag_scan, (pathtag_wgs as u32, 1, 1), [config_buf, scene_buf, reduced_buf, tagmonoid_buf], ); let path_coarse_wgs = (n_pathtag as u32 + shaders::PATH_COARSE_WG - 1) / shaders::PATH_COARSE_WG; // TODO: more principled size calc let tiles_buf = BufProxy::new(4097 * 8); let segments_buf = BufProxy::new(256 * 24); recording.clear_all(tiles_buf); recording.dispatch( shaders.path_coarse, (path_coarse_wgs, 1, 1), [ config_buf, scene_buf, tagmonoid_buf, tiles_buf, segments_buf, ], ); recording.dispatch( shaders.backdrop, (config.height_in_tiles, 1, 1), [config_buf, tiles_buf], ); let out_buf_size = config.width_in_tiles * config.height_in_tiles * 256; let out_buf = BufProxy::new(out_buf_size as u64); recording.dispatch( shaders.fine, (config.width_in_tiles, config.height_in_tiles, 1), [config_buf, tiles_buf, segments_buf, out_buf], ); recording.download(out_buf); (recording, out_buf) } pub fn render_full( scene: &Scene, shaders: &FullShaders, width: u32, height: u32, ) -> (Recording, ResourceProxy) { render_encoding_full(scene.data(), shaders, width, height) } pub fn render_encoding_full( encoding: &Encoding, shaders: &FullShaders, width: u32, height: u32, ) -> (Recording, ResourceProxy) { use crate::encoding::{resource::ResourceCache, PackedEncoding}; let mut recording = Recording::default(); let mut resources = ResourceCache::new(); let mut packed = PackedEncoding::default(); packed.pack(encoding, &mut resources); let (ramp_data, ramps_width, ramps_height) = resources.ramps(packed.resources).unwrap(); let gradient_image = if encoding.patches.is_empty() { ResourceProxy::new_image(1, 1, ImageFormat::Rgba8) } else { let data: &[u8] = bytemuck::cast_slice(ramp_data); ResourceProxy::Image(recording.upload_image( ramps_width, ramps_height, ImageFormat::Rgba8, data, )) }; // TODO: calculate for real when we do rectangles let n_pathtag = encoding.path_tags.len(); let pathtag_padded = align_up(encoding.path_tags.len(), 4 * shaders::PATHTAG_REDUCE_WG); let n_paths = encoding.n_paths; let n_drawobj = n_paths; let n_clip = encoding.n_clips; let new_width = next_multiple_of(width, 16); let new_height = next_multiple_of(height, 16); let config = crate::encoding::Config { width_in_tiles: new_width / 16, height_in_tiles: new_height / 16, target_width: width, target_height: height, layout: packed.layout, }; // println!("{:?}", config); let scene_buf = ResourceProxy::Buf(recording.upload(packed.data)); let config_buf = ResourceProxy::Buf(recording.upload_uniform(bytemuck::bytes_of(&config))); let pathtag_wgs = pathtag_padded / (4 * shaders::PATHTAG_REDUCE_WG as usize); let pathtag_large = pathtag_wgs > shaders::PATHTAG_REDUCE_WG as usize; let reduced_size = if pathtag_large { align_up(pathtag_wgs, shaders::PATHTAG_REDUCE_WG) } else { pathtag_wgs }; let reduced_buf = ResourceProxy::new_buf(reduced_size as u64 * TAG_MONOID_FULL_SIZE); // TODO: really only need pathtag_wgs - 1 recording.dispatch( shaders.pathtag_reduce, (pathtag_wgs as u32, 1, 1), [config_buf, scene_buf, reduced_buf], ); let mut pathtag_parent = reduced_buf; if pathtag_large { let reduced2_size = shaders::PATHTAG_REDUCE_WG as usize; let reduced2_buf = ResourceProxy::new_buf(reduced2_size as u64 * TAG_MONOID_FULL_SIZE); recording.dispatch( shaders.pathtag_reduce2, (reduced2_size as u32, 1, 1), [reduced_buf, reduced2_buf], ); let reduced_scan_buf = ResourceProxy::new_buf(pathtag_wgs as u64 * TAG_MONOID_FULL_SIZE); recording.dispatch( shaders.pathtag_scan1, (reduced_size as u32 / shaders::PATHTAG_REDUCE_WG, 1, 1), [reduced_buf, reduced2_buf, reduced_scan_buf], ); pathtag_parent = reduced_scan_buf; } let tagmonoid_buf = ResourceProxy::new_buf( pathtag_wgs as u64 * shaders::PATHTAG_REDUCE_WG as u64 * TAG_MONOID_FULL_SIZE, ); let pathtag_scan = if pathtag_large { shaders.pathtag_scan_large } else { shaders.pathtag_scan }; recording.dispatch( pathtag_scan, (pathtag_wgs as u32, 1, 1), [config_buf, scene_buf, pathtag_parent, tagmonoid_buf], ); let drawobj_wgs = (n_drawobj + shaders::PATH_BBOX_WG - 1) / shaders::PATH_BBOX_WG; let path_bbox_buf = ResourceProxy::new_buf(n_paths as u64 * PATH_BBOX_SIZE); recording.dispatch( shaders.bbox_clear, (drawobj_wgs, 1, 1), [config_buf, path_bbox_buf], ); let cubic_buf = ResourceProxy::new_buf(n_pathtag as u64 * CUBIC_SIZE); let path_coarse_wgs = (n_pathtag as u32 + shaders::PATH_COARSE_WG - 1) / shaders::PATH_COARSE_WG; recording.dispatch( shaders.pathseg, (path_coarse_wgs, 1, 1), [ config_buf, scene_buf, tagmonoid_buf, path_bbox_buf, cubic_buf, ], ); let draw_reduced_buf = ResourceProxy::new_buf(drawobj_wgs as u64 * DRAWMONOID_SIZE); recording.dispatch( shaders.draw_reduce, (drawobj_wgs, 1, 1), [config_buf, scene_buf, draw_reduced_buf], ); let draw_monoid_buf = ResourceProxy::new_buf(n_drawobj as u64 * DRAWMONOID_SIZE); let info_bin_data_buf = ResourceProxy::new_buf(1 << 20); let clip_inp_buf = ResourceProxy::new_buf(encoding.n_clips as u64 * CLIP_INP_SIZE); recording.dispatch( shaders.draw_leaf, (drawobj_wgs, 1, 1), [ config_buf, scene_buf, draw_reduced_buf, path_bbox_buf, draw_monoid_buf, info_bin_data_buf, clip_inp_buf, ], ); let clip_el_buf = ResourceProxy::new_buf(encoding.n_clips as u64 * CLIP_EL_SIZE); let clip_bic_buf = ResourceProxy::new_buf((n_clip / shaders::CLIP_REDUCE_WG) as u64 * CLIP_BIC_SIZE); let clip_wg_reduce = n_clip.saturating_sub(1) / shaders::CLIP_REDUCE_WG; if clip_wg_reduce > 0 { recording.dispatch( shaders.clip_reduce, (clip_wg_reduce, 1, 1), [ config_buf, clip_inp_buf, path_bbox_buf, clip_bic_buf, clip_el_buf, ], ); } let clip_wg = (n_clip + shaders::CLIP_REDUCE_WG - 1) / shaders::CLIP_REDUCE_WG; let clip_bbox_buf = ResourceProxy::new_buf(n_clip as u64 * CLIP_BBOX_SIZE); if clip_wg > 0 { recording.dispatch( shaders.clip_leaf, (clip_wg, 1, 1), [ config_buf, clip_inp_buf, path_bbox_buf, clip_bic_buf, clip_el_buf, draw_monoid_buf, clip_bbox_buf, ], ); } let draw_bbox_buf = ResourceProxy::new_buf(n_paths as u64 * DRAW_BBOX_SIZE); let bump_buf = BufProxy::new(BUMP_SIZE); let width_in_bins = (config.width_in_tiles + 15) / 16; let height_in_bins = (config.height_in_tiles + 15) / 16; let bin_header_buf = ResourceProxy::new_buf((256 * drawobj_wgs) as u64 * BIN_HEADER_SIZE); recording.clear_all(bump_buf); let bump_buf = ResourceProxy::Buf(bump_buf); recording.dispatch( shaders.binning, (drawobj_wgs, 1, 1), [ config_buf, draw_monoid_buf, path_bbox_buf, clip_bbox_buf, draw_bbox_buf, bump_buf, info_bin_data_buf, bin_header_buf, ], ); // Note: this only needs to be rounded up because of the workaround to store the tile_offset // in storage rather than workgroup memory. let n_path_aligned = align_up(n_paths as usize, 256); let path_buf = ResourceProxy::new_buf(n_path_aligned as u64 * PATH_SIZE); let tile_buf = ResourceProxy::new_buf(1 << 24); let path_wgs = (n_paths + shaders::PATH_BBOX_WG - 1) / shaders::PATH_BBOX_WG; recording.dispatch( shaders.tile_alloc, (path_wgs, 1, 1), [ config_buf, scene_buf, draw_bbox_buf, bump_buf, path_buf, tile_buf, ], ); let segments_buf = ResourceProxy::new_buf(1 << 24); recording.dispatch( shaders.path_coarse, (path_coarse_wgs, 1, 1), [ config_buf, scene_buf, tagmonoid_buf, cubic_buf, path_buf, bump_buf, tile_buf, segments_buf, ], ); recording.dispatch( shaders.backdrop, (path_wgs, 1, 1), [config_buf, path_buf, tile_buf], ); let ptcl_buf = ResourceProxy::new_buf(1 << 24); recording.dispatch( shaders.coarse, (width_in_bins, height_in_bins, 1), [ config_buf, scene_buf, draw_monoid_buf, bin_header_buf, info_bin_data_buf, path_buf, tile_buf, bump_buf, ptcl_buf, ], ); let out_image = ImageProxy::new(width, height, ImageFormat::Rgba8); recording.dispatch( shaders.fine, (config.width_in_tiles, config.height_in_tiles, 1), [ config_buf, tile_buf, segments_buf, ResourceProxy::Image(out_image), ptcl_buf, gradient_image, info_bin_data_buf, ], ); (recording, ResourceProxy::Image(out_image)) } pub fn align_up(len: usize, alignment: u32) -> usize { len + (len.wrapping_neg() & (alignment as usize - 1)) }