mirror of
https://github.com/italicsjenga/vello.git
synced 2025-01-10 20:51:29 +11:00
acb3933d94
This patch switches to a variable size encoding of draw objects. In addition to the CPU-side scene encoding, it changes the representation of intermediate per draw object state from the `Annotated` struct to a variable "info" encoding. In addition, the bounding boxes are moved to a separate array (for a more "structure of arrays" approach). Data that's unchanged from the scene encoding is not copied. Rather, downstream stages can access the data from the scene buffer (reducing allocation and copying). Prefix sums, computed in `DrawMonoid`, track the offset of both scene and intermediate data. The tags for the CPU-side encoding have been split into their own stream (again a change from AoS to SoA style). This is not necessarily the final form. There's some stuff (including at least one piet-gpu-derive type) that can be deleted. In addition, the linewidth field should probably move from the info to path-specific. Also, the 1:1 correspondence between draw object and path has not yet been broken. Closes #152
100 lines
3 KiB
GLSL
100 lines
3 KiB
GLSL
// SPDX-License-Identifier: Apache-2.0 OR MIT OR Unlicense

// Various constants for the sizes of groups and tiles.

// Much of this will be made dynamic in various ways, but for now it's easiest
// to hardcode and keep all in one place.

// A LG_WG_FACTOR of n scales workgroup sizes by 2^n. Use 0 for a
// maximum workgroup size of 128, or 1 for a maximum size of 256.
#define LG_WG_FACTOR 1
// The scale factor itself, i.e. 2^LG_WG_FACTOR.
#define WG_FACTOR (1<<LG_WG_FACTOR)

// Tile dimensions, in pixels.
#define TILE_WIDTH_PX 16
#define TILE_HEIGHT_PX 16

// NOTE(review): presumably the initial size of a per-tile command list
// allocation; the unit (bytes vs. words) is not visible here -- confirm.
#define PTCL_INITIAL_ALLOC 1024

// These should probably be renamed and/or reworked. In the binning
// kernel, they represent the number of bins. Also, the workgroup size
// of that kernel is equal to the number of bins, but should probably
// be more flexible (it's 512 in the K&L paper).
#define N_TILE_X 16
#define N_TILE_Y (8 * WG_FACTOR)
#define N_TILE (N_TILE_X * N_TILE_Y)
// log2(N_TILE): 16 * 8 * 2^LG_WG_FACTOR == 2^(7 + LG_WG_FACTOR).
#define LG_N_TILE (7 + LG_WG_FACTOR)
// N_TILE divided into groups of 32 (presumably one bit per tile packed
// into 32-bit words -- confirm against the binning kernel).
#define N_SLICE (N_TILE / 32)

// NOTE(review): presumably the number of samples in a gradient ramp -- confirm.
#define GRADIENT_WIDTH 512

// Configuration record: element counts, buffer allocations, and offsets of
// the individual streams inside the scene buffer.
//
// The struct is only declared when ERR_MALLOC_FAILED is defined.
// NOTE(review): presumably that macro comes from the header that also
// declares `Alloc`, so this acts as an "Alloc is available" guard -- confirm.
//
// Field order and types are part of the layout; do not reorder.
#ifdef ERR_MALLOC_FAILED
struct Config {
    uint n_elements; // paths
    uint n_pathseg;
    uint width_in_tiles;
    uint height_in_tiles;
    Alloc tile_alloc;
    Alloc bin_alloc;
    Alloc ptcl_alloc;
    Alloc pathseg_alloc;
    Alloc anno_alloc;
    Alloc trans_alloc;
    // new element pipeline stuff follows

    // Bounding boxes of paths, stored as int (so atomics work)
    Alloc path_bbox_alloc;
    // Monoid for draw objects
    Alloc drawmonoid_alloc;

    // BeginClip(path_ix) / EndClip
    Alloc clip_alloc;
    // Intermediate bicyclic semigroup
    Alloc clip_bic_alloc;
    // Intermediate stack
    Alloc clip_stack_alloc;
    // Clip processing results (path_ix + bbox)
    Alloc clip_bbox_alloc;
    // Bounding box per draw object
    Alloc draw_bbox_alloc;
    // Info computed in draw stage, per draw object
    Alloc drawinfo_alloc;

    // Number of transforms in scene
    // This is probably not needed.
    uint n_trans;
    // This *should* count only actual paths, but in the current
    // implementation is redundant with n_elements.
    uint n_path;
    // Total number of BeginClip and EndClip draw objects.
    uint n_clip;

    // Note: one of these offsets *could* be hardcoded to zero (as was the
    // original element stream), but for now retain flexibility.

    // Offset (in bytes) of transform stream in scene buffer
    uint trans_offset;
    // Offset (in bytes) of linewidth stream in scene
    uint linewidth_offset;
    // Offset (in bytes) of path tag stream in scene
    uint pathtag_offset;
    // Offset (in bytes) of path segment stream in scene
    uint pathseg_offset;
    // Offset (in bytes) of draw object tag stream in scene; see drawtag.h
    uint drawtag_offset;
    // Offset (in bytes) of draw payload stream in scene
    uint drawdata_offset;
};
#endif

// Fill modes.
#define MODE_NONZERO 0
#define MODE_STROKE 1

// Size of kernel4 clip state, in words.
#define CLIP_STATE_SIZE 2

// fill_mode_from_flags extracts the fill mode from tag flags.
//
// Only the least significant bit of `flags` is kept, so the result is
// always 0 or 1 (the values of MODE_NONZERO and MODE_STROKE); all other
// bits of `flags` are ignored.
uint fill_mode_from_flags(uint flags) {
    // Unsigned literal keeps both operands of `&` the same type.
    return flags & 0x1u;
}