2020-12-11 15:01:48 +01:00
|
|
|
// SPDX-License-Identifier: Apache-2.0 OR MIT OR Unlicense
|
|
|
|
|
2020-06-02 17:10:20 -07:00
|
|
|
// Allocation and initialization of tiles for paths.
|
|
|
|
|
|
|
|
#version 450
|
|
|
|
#extension GL_GOOGLE_include_directive : enable
|
|
|
|
|
2020-12-11 18:30:20 +01:00
|
|
|
#include "mem.h"
|
2020-12-24 12:00:53 +01:00
|
|
|
#include "setup.h"
|
2020-06-02 17:10:20 -07:00
|
|
|
|
2020-09-13 12:58:47 +02:00
|
|
|
#define LG_TILE_ALLOC_WG (7 + LG_WG_FACTOR)
|
2020-06-03 13:04:52 -07:00
|
|
|
#define TILE_ALLOC_WG (1 << LG_TILE_ALLOC_WG)
|
2020-06-02 17:10:20 -07:00
|
|
|
|
|
|
|
layout(local_size_x = TILE_ALLOC_WG, local_size_y = 1) in;
|
|
|
|
|
2020-12-11 18:30:20 +01:00
|
|
|
layout(set = 0, binding = 1) readonly buffer ConfigBuf {
|
|
|
|
Config conf;
|
2020-06-02 17:10:20 -07:00
|
|
|
};
|
|
|
|
|
2022-03-02 14:44:03 -08:00
|
|
|
layout(binding = 2) readonly buffer SceneBuf {
|
|
|
|
uint[] scene;
|
|
|
|
};
|
|
|
|
|
|
|
|
#include "drawtag.h"
|
2020-06-02 17:10:20 -07:00
|
|
|
#include "tile.h"
|
|
|
|
|
|
|
|
// scale factors useful for converting coordinates to tiles
|
|
|
|
#define SX (1.0 / float(TILE_WIDTH_PX))
|
|
|
|
#define SY (1.0 / float(TILE_HEIGHT_PX))
|
|
|
|
|
2020-06-03 13:04:52 -07:00
|
|
|
shared uint sh_tile_count[TILE_ALLOC_WG];
|
2022-06-23 08:48:26 -07:00
|
|
|
shared uint sh_tile_offset;
|
2020-06-03 13:04:52 -07:00
|
|
|
|
2022-03-02 14:44:03 -08:00
|
|
|
vec4 load_draw_bbox(uint draw_ix) {
|
|
|
|
uint base = (conf.draw_bbox_alloc.offset >> 2) + 4 * draw_ix;
|
|
|
|
float x0 = uintBitsToFloat(memory[base]);
|
|
|
|
float y0 = uintBitsToFloat(memory[base + 1]);
|
|
|
|
float x1 = uintBitsToFloat(memory[base + 2]);
|
|
|
|
float y1 = uintBitsToFloat(memory[base + 3]);
|
|
|
|
vec4 bbox = vec4(x0, y0, x1, y1);
|
|
|
|
return bbox;
|
|
|
|
}
|
|
|
|
|
2020-06-02 17:10:20 -07:00
|
|
|
void main() {
|
2022-06-23 08:48:26 -07:00
|
|
|
if (!check_deps(STAGE_BINNING)) {
|
|
|
|
return;
|
|
|
|
}
|
2020-06-03 13:04:52 -07:00
|
|
|
uint th_ix = gl_LocalInvocationID.x;
|
2020-06-02 17:10:20 -07:00
|
|
|
uint element_ix = gl_GlobalInvocationID.x;
|
2022-03-02 14:44:03 -08:00
|
|
|
// At the moment, element_ix == path_ix. The clip-intersected bounding boxes
|
|
|
|
// for elements (draw objects) are computed in the binning stage, but at some
|
|
|
|
// point we'll probably want to break that correspondence. Tiles should be
|
|
|
|
// allocated for paths, not draw objs. EndClip doesn't need an allocation.
|
2020-12-24 12:00:53 +01:00
|
|
|
PathRef path_ref = PathRef(conf.tile_alloc.offset + element_ix * Path_size);
|
2022-03-02 14:44:03 -08:00
|
|
|
uint drawtag_base = conf.drawtag_offset >> 2;
|
2020-06-02 17:10:20 -07:00
|
|
|
|
2022-03-02 14:44:03 -08:00
|
|
|
uint drawtag = Drawtag_Nop;
|
2020-12-11 18:30:20 +01:00
|
|
|
if (element_ix < conf.n_elements) {
|
2022-03-02 14:44:03 -08:00
|
|
|
drawtag = scene[drawtag_base + element_ix];
|
2020-06-02 17:10:20 -07:00
|
|
|
}
|
|
|
|
int x0 = 0, y0 = 0, x1 = 0, y1 = 0;
|
2022-03-02 14:44:03 -08:00
|
|
|
// Allocate an empty path for EndClip; at some point we'll change
|
|
|
|
// this to be per path rather than per draw object.
|
|
|
|
if (drawtag != Drawtag_Nop && drawtag != Drawtag_EndClip) {
|
|
|
|
vec4 bbox = load_draw_bbox(element_ix);
|
|
|
|
x0 = int(floor(bbox.x * SX));
|
|
|
|
y0 = int(floor(bbox.y * SY));
|
|
|
|
x1 = int(ceil(bbox.z * SX));
|
|
|
|
y1 = int(ceil(bbox.w * SY));
|
2020-06-02 17:10:20 -07:00
|
|
|
}
|
2020-12-18 00:55:21 +01:00
|
|
|
x0 = clamp(x0, 0, int(conf.width_in_tiles));
|
|
|
|
y0 = clamp(y0, 0, int(conf.height_in_tiles));
|
|
|
|
x1 = clamp(x1, 0, int(conf.width_in_tiles));
|
|
|
|
y1 = clamp(y1, 0, int(conf.height_in_tiles));
|
2020-06-02 17:10:20 -07:00
|
|
|
|
|
|
|
Path path;
|
|
|
|
path.bbox = uvec4(x0, y0, x1, y1);
|
2020-06-03 13:04:52 -07:00
|
|
|
uint tile_count = (x1 - x0) * (y1 - y0);
|
|
|
|
|
|
|
|
sh_tile_count[th_ix] = tile_count;
|
2020-12-24 12:00:53 +01:00
|
|
|
uint total_tile_count = tile_count;
|
2020-06-03 13:04:52 -07:00
|
|
|
// Prefix sum of sh_tile_count
|
|
|
|
for (uint i = 0; i < LG_TILE_ALLOC_WG; i++) {
|
|
|
|
barrier();
|
2021-12-08 10:42:35 -08:00
|
|
|
if (th_ix >= (1u << i)) {
|
2021-12-03 15:49:58 -08:00
|
|
|
total_tile_count += sh_tile_count[th_ix - (1u << i)];
|
2020-06-02 17:10:20 -07:00
|
|
|
}
|
2020-06-03 13:04:52 -07:00
|
|
|
barrier();
|
2020-12-24 12:00:53 +01:00
|
|
|
sh_tile_count[th_ix] = total_tile_count;
|
2020-06-03 13:04:52 -07:00
|
|
|
}
|
|
|
|
if (th_ix == TILE_ALLOC_WG - 1) {
|
2022-06-23 08:48:26 -07:00
|
|
|
sh_tile_offset = malloc_stage(total_tile_count * Tile_size, conf.mem_size, STAGE_TILE_ALLOC);
|
2020-06-02 17:10:20 -07:00
|
|
|
}
|
2020-06-03 13:04:52 -07:00
|
|
|
barrier();
|
2022-06-23 08:48:26 -07:00
|
|
|
uint offset_start = sh_tile_offset;
|
|
|
|
if (offset_start == MALLOC_FAILED) {
|
2020-12-11 18:30:20 +01:00
|
|
|
return;
|
|
|
|
}
|
2020-06-03 13:04:52 -07:00
|
|
|
|
2020-12-11 18:30:20 +01:00
|
|
|
if (element_ix < conf.n_elements) {
|
2020-06-04 15:58:38 -07:00
|
|
|
uint tile_subix = th_ix > 0 ? sh_tile_count[th_ix - 1] : 0;
|
2022-06-23 08:48:26 -07:00
|
|
|
path.tiles = TileRef(offset_start + Tile_size * tile_subix);
|
2020-12-24 12:00:53 +01:00
|
|
|
Path_write(conf.tile_alloc, path_ref, path);
|
2020-06-04 15:58:38 -07:00
|
|
|
}
|
2020-06-03 13:04:52 -07:00
|
|
|
|
|
|
|
// Zero out allocated tiles efficiently
|
|
|
|
uint total_count = sh_tile_count[TILE_ALLOC_WG - 1] * (Tile_size / 4);
|
2022-06-23 08:48:26 -07:00
|
|
|
uint start_ix = offset_start >> 2;
|
2020-06-03 13:04:52 -07:00
|
|
|
for (uint i = th_ix; i < total_count; i += TILE_ALLOC_WG) {
|
2022-06-23 08:48:26 -07:00
|
|
|
memory[start_ix + i] = 0;
|
2020-06-03 13:04:52 -07:00
|
|
|
}
|
2020-06-02 17:10:20 -07:00
|
|
|
}
|