// SPDX-License-Identifier: Apache-2.0 OR MIT OR Unlicense // Finish prefix sum of drawtags, decode draw objects. #import config #import clip #import drawtag #import bbox @group(0) @binding(0) var config: Config; @group(0) @binding(1) var scene: array; @group(0) @binding(2) var reduced: array; @group(0) @binding(3) var path_bbox: array; @group(0) @binding(4) var draw_monoid: array; @group(0) @binding(5) var info: array; @group(0) @binding(6) var clip_inp: array; let WG_SIZE = 256u; // Possibly dedup? struct Transform { matrx: vec4, translate: vec2, } fn read_transform(transform_base: u32, ix: u32) -> Transform { let base = transform_base + ix * 6u; let c0 = bitcast(scene[base]); let c1 = bitcast(scene[base + 1u]); let c2 = bitcast(scene[base + 2u]); let c3 = bitcast(scene[base + 3u]); let c4 = bitcast(scene[base + 4u]); let c5 = bitcast(scene[base + 5u]); let matrx = vec4(c0, c1, c2, c3); let translate = vec2(c4, c5); return Transform(matrx, translate); } var sh_scratch: array; @compute @workgroup_size(256) fn main( @builtin(global_invocation_id) global_id: vec3, @builtin(local_invocation_id) local_id: vec3, @builtin(workgroup_id) wg_id: vec3, ) { let ix = global_id.x; // Reduce prefix of workgroups up to this one var agg = draw_monoid_identity(); if local_id.x < wg_id.x { agg = reduced[local_id.x]; } sh_scratch[local_id.x] = agg; for (var i = 0u; i < firstTrailingBit(WG_SIZE); i += 1u) { workgroupBarrier(); if local_id.x + (1u << i) < WG_SIZE { let other = sh_scratch[local_id.x + (1u << i)]; agg = combine_draw_monoid(agg, other); } workgroupBarrier(); sh_scratch[local_id.x] = agg; } // Two barriers can be eliminated if we use separate shared arrays // for prefix and intra-workgroup prefix sum. workgroupBarrier(); var m = sh_scratch[0]; workgroupBarrier(); let tag_word = scene[config.drawtag_base + ix]; agg = map_draw_tag(tag_word); sh_scratch[local_id.x] = agg; for (var i = 0u; i < firstTrailingBit(WG_SIZE); i += 1u) { workgroupBarrier(); if local_id.x >= 1u << i { let other = sh_scratch[local_id.x - (1u << i)]; agg = combine_draw_monoid(agg, other); } workgroupBarrier(); sh_scratch[local_id.x] = agg; } workgroupBarrier(); if local_id.x > 0u { m = combine_draw_monoid(m, sh_scratch[local_id.x - 1u]); } // m now contains exclusive prefix sum of draw monoid draw_monoid[ix] = m; let dd = config.drawdata_base + m.scene_offset; let di = m.info_offset; if tag_word == DRAWTAG_FILL_COLOR || tag_word == DRAWTAG_FILL_LIN_GRADIENT || tag_word == DRAWTAG_FILL_RAD_GRADIENT || tag_word == DRAWTAG_FILL_IMAGE || tag_word == DRAWTAG_BEGIN_CLIP { let bbox = path_bbox[m.path_ix]; // TODO: bbox is mostly yagni here, sort that out. Maybe clips? // let x0 = f32(bbox.x0); // let y0 = f32(bbox.y0); // let x1 = f32(bbox.x1); // let y1 = f32(bbox.y1); // let bbox_f = vec4(x0, y0, x1, y1); let fill_mode = u32(bbox.linewidth >= 0.0); var matrx: vec4; var translate: vec2; var linewidth = bbox.linewidth; if linewidth >= 0.0 || tag_word == DRAWTAG_FILL_LIN_GRADIENT || tag_word == DRAWTAG_FILL_RAD_GRADIENT || tag_word == DRAWTAG_FILL_IMAGE { let transform = read_transform(config.transform_base, bbox.trans_ix); matrx = transform.matrx; translate = transform.translate; } if linewidth >= 0.0 { // Note: doesn't deal with anisotropic case linewidth *= sqrt(abs(matrx.x * matrx.w - matrx.y * matrx.z)); } switch tag_word { // DRAWTAG_FILL_COLOR case 0x44u: { info[di] = bitcast(linewidth); } // DRAWTAG_FILL_LIN_GRADIENT case 0x114u: { info[di] = bitcast(linewidth); var p0 = bitcast>(vec2(scene[dd + 1u], scene[dd + 2u])); var p1 = bitcast>(vec2(scene[dd + 3u], scene[dd + 4u])); p0 = matrx.xy * p0.x + matrx.zw * p0.y + translate; p1 = matrx.xy * p1.x + matrx.zw * p1.y + translate; let dxy = p1 - p0; let scale = 1.0 / dot(dxy, dxy); let line_xy = dxy * scale; let line_c = -dot(p0, line_xy); info[di + 1u] = bitcast(line_xy.x); info[di + 2u] = bitcast(line_xy.y); info[di + 3u] = bitcast(line_c); } // DRAWTAG_FILL_RAD_GRADIENT case 0x2dcu: { info[di] = bitcast(linewidth); var p0 = bitcast>(vec2(scene[dd + 1u], scene[dd + 2u])); var p1 = bitcast>(vec2(scene[dd + 3u], scene[dd + 4u])); let r0 = bitcast(scene[dd + 5u]); let r1 = bitcast(scene[dd + 6u]); let inv_det = 1.0 / (matrx.x * matrx.w - matrx.y * matrx.z); let inv_mat = inv_det * vec4(matrx.w, -matrx.y, -matrx.z, matrx.x); let inv_tr = mat2x2(inv_mat.xy, inv_mat.zw) * -translate - p0; let center1 = p1 - p0; let rr = r1 / (r1 - r0); let ra_inv = rr / (r1 * r1 - dot(center1, center1)); let c1 = center1 * ra_inv; let ra = rr * ra_inv; let roff = rr - 1.0; info[di + 1u] = bitcast(inv_mat.x); info[di + 2u] = bitcast(inv_mat.y); info[di + 3u] = bitcast(inv_mat.z); info[di + 4u] = bitcast(inv_mat.w); info[di + 5u] = bitcast(inv_tr.x); info[di + 6u] = bitcast(inv_tr.y); info[di + 7u] = bitcast(c1.x); info[di + 8u] = bitcast(c1.y); info[di + 9u] = bitcast(ra); info[di + 10u] = bitcast(roff); } // DRAWTAG_FILL_IMAGE case 0x248u: { info[di] = bitcast(linewidth); let inv_det = 1.0 / (matrx.x * matrx.w - matrx.y * matrx.z); let inv_mat = inv_det * vec4(matrx.w, -matrx.y, -matrx.z, matrx.x); let inv_tr = mat2x2(inv_mat.xy, inv_mat.zw) * -translate; info[di + 1u] = bitcast(inv_mat.x); info[di + 2u] = bitcast(inv_mat.y); info[di + 3u] = bitcast(inv_mat.z); info[di + 4u] = bitcast(inv_mat.w); info[di + 5u] = bitcast(inv_tr.x); info[di + 6u] = bitcast(inv_tr.y); info[di + 7u] = scene[dd]; info[di + 8u] = scene[dd + 1u]; } default: {} } } if tag_word == DRAWTAG_BEGIN_CLIP || tag_word == DRAWTAG_END_CLIP { var path_ix = ~ix; if tag_word == DRAWTAG_BEGIN_CLIP { path_ix = m.path_ix; } clip_inp[m.clip_ix] = ClipInp(ix, i32(path_ix)); } }