src/render.rs - external/github.com/linebender/vello - Git at Google

 //! Take an encoded scene and create a graph to render it

 use bytemuck::{Pod, Zeroable};

 use crate::{
     encoding::Encoding,
     engine::{BufProxy, ImageFormat, ImageProxy, Recording, ResourceProxy},
     shaders::{self, FullShaders, Shaders},
     Scene,
 };

 const TAG_MONOID_SIZE: u64 = 12;
 const TAG_MONOID_FULL_SIZE: u64 = 20;
 const PATH_BBOX_SIZE: u64 = 24;
 const CUBIC_SIZE: u64 = 48;
 const DRAWMONOID_SIZE: u64 = 16;
 const MAX_DRAWINFO_SIZE: u64 = 44;
 const CLIP_BIC_SIZE: u64 = 8;
 const CLIP_EL_SIZE: u64 = 32;
 const CLIP_INP_SIZE: u64 = 8;
 const CLIP_BBOX_SIZE: u64 = 16;
 const PATH_SIZE: u64 = 32;
 const DRAW_BBOX_SIZE: u64 = 16;
 const BUMP_SIZE: u64 = 16;
 const BIN_HEADER_SIZE: u64 = 8;
 const BBOX_MONOID_SIZE: u64 = 32;

 // Note: this is defined here as it's still used by the reduced pipeline,
 // but for the full pipeline, use the version in `encoding`.
 #[repr(C)]
 #[derive(Clone, Copy, Debug, Default, Zeroable, Pod)]
 struct Config {
     width_in_tiles: u32,
     height_in_tiles: u32,
     target_width: u32,
     target_height: u32,
     n_drawobj: u32,
     n_path: u32,
     n_clip: u32,
     n_pathtag: u32,
     bin_data_start: u32,
     pathtag_base: u32,
     pathdata_base: u32,
     drawtag_base: u32,
     drawdata_base: u32,
     transform_base: u32,
     linewidth_base: u32,
 }

 fn size_to_words(byte_size: usize) -> u32 {
     (byte_size / std::mem::size_of::<u32>()) as u32
 }

 pub const fn next_multiple_of(val: u32, rhs: u32) -> u32 {
     match val % rhs {
         0 => val,
         r => val + (rhs - r),
     }
 }

 #[allow(unused)]
 fn render(scene: &Scene, shaders: &Shaders) -> (Recording, BufProxy) {
     let mut recording = Recording::default();
     let data = scene.data();
     let n_pathtag = data.path_tags.len();
     let pathtag_padded = align_up(n_pathtag, 4 * shaders::PATHTAG_REDUCE_WG);
     let pathtag_wgs = pathtag_padded / (4 * shaders::PATHTAG_REDUCE_WG as usize);
     let mut scene: Vec<u8> = Vec::with_capacity(pathtag_padded);
     let pathtag_base = size_to_words(scene.len());
     scene.extend(bytemuck::cast_slice(&data.path_tags));
     scene.resize(pathtag_padded, 0);
     let pathdata_base = size_to_words(scene.len());
     scene.extend(&data.path_data);

     let config = Config {
         width_in_tiles: 64,
         height_in_tiles: 64,
         target_width: 64 * 16,
         target_height: 64 * 16,
         pathtag_base,
         pathdata_base,
         ..Default::default()
     };
     let scene_buf = recording.upload(scene);
     let config_buf = recording.upload_uniform(bytemuck::bytes_of(&config));

     let reduced_buf = BufProxy::new(pathtag_wgs as u64 * TAG_MONOID_SIZE);
     // TODO: really only need pathtag_wgs - 1
     recording.dispatch(
         shaders.pathtag_reduce,
         (pathtag_wgs as u32, 1, 1),
         [config_buf, scene_buf, reduced_buf],
     );

     let tagmonoid_buf =
         BufProxy::new(pathtag_wgs as u64 * shaders::PATHTAG_REDUCE_WG as u64 * TAG_MONOID_SIZE);
     recording.dispatch(
         shaders.pathtag_scan,
         (pathtag_wgs as u32, 1, 1),
         [config_buf, scene_buf, reduced_buf, tagmonoid_buf],
     );

     let path_coarse_wgs =
         (n_pathtag as u32 + shaders::PATH_COARSE_WG - 1) / shaders::PATH_COARSE_WG;
     // TODO: more principled size calc
     let tiles_buf = BufProxy::new(4097 * 8);
     let segments_buf = BufProxy::new(256 * 24);
     recording.clear_all(tiles_buf);
     recording.dispatch(
         shaders.path_coarse,
         (path_coarse_wgs, 1, 1),
         [
             config_buf,
             scene_buf,
             tagmonoid_buf,
             tiles_buf,
             segments_buf,
         ],
     );
     recording.dispatch(
         shaders.backdrop,
         (config.height_in_tiles, 1, 1),
         [config_buf, tiles_buf],
     );
     let out_buf_size = config.width_in_tiles * config.height_in_tiles * 256;
     let out_buf = BufProxy::new(out_buf_size as u64);
     recording.dispatch(
         shaders.fine,
         (config.width_in_tiles, config.height_in_tiles, 1),
         [config_buf, tiles_buf, segments_buf, out_buf],
     );

     recording.download(out_buf);
     (recording, out_buf)
 }

 pub fn render_full(
     scene: &Scene,
     shaders: &FullShaders,
     width: u32,
     height: u32,
 ) -> (Recording, ResourceProxy) {
     render_encoding_full(&scene.data(), shaders, width, height)
 }

 pub fn render_encoding_full(
     encoding: &Encoding,
     shaders: &FullShaders,
     width: u32,
     height: u32,
 ) -> (Recording, ResourceProxy) {
     use crate::encoding::{resource::ResourceCache, PackedEncoding};
     let mut recording = Recording::default();
     let mut resources = ResourceCache::new();
     let mut packed = PackedEncoding::default();
     packed.pack(&encoding, &mut resources);
     let (ramp_data, ramps_width, ramps_height) = resources.ramps(packed.resources).unwrap();
     let gradient_image = if encoding.patches.is_empty() {
         ResourceProxy::new_image(1, 1, ImageFormat::Rgba8)
     } else {
         let data: &[u8] = bytemuck::cast_slice(ramp_data);
         ResourceProxy::Image(recording.upload_image(
             ramps_width,
             ramps_height,
             ImageFormat::Rgba8,
             data,
         ))
     };
     // TODO: calculate for real when we do rectangles
     let n_pathtag = encoding.path_tags.len();
     let pathtag_padded = align_up(encoding.path_tags.len(), 4 * shaders::PATHTAG_REDUCE_WG);
     let n_paths = encoding.n_paths;
     let n_drawobj = n_paths;
     let n_clip = encoding.n_clips;

     let new_width = next_multiple_of(width, 16);
     let new_height = next_multiple_of(height, 16);

     let config = crate::encoding::Config {
         width_in_tiles: new_width / 16,
         height_in_tiles: new_height / 16,
         target_width: width,
         target_height: height,
         layout: packed.layout,
     };
     // println!("{:?}", config);
     let scene_buf = ResourceProxy::Buf(recording.upload(packed.data));
     let config_buf = ResourceProxy::Buf(recording.upload_uniform(bytemuck::bytes_of(&config)));

     let pathtag_wgs = pathtag_padded / (4 * shaders::PATHTAG_REDUCE_WG as usize);
     let reduced_buf = ResourceProxy::new_buf(pathtag_wgs as u64 * TAG_MONOID_FULL_SIZE);
     // TODO: really only need pathtag_wgs - 1
     recording.dispatch(
         shaders.pathtag_reduce,
         (pathtag_wgs as u32, 1, 1),
         [config_buf, scene_buf, reduced_buf],
     );

     let tagmonoid_buf = ResourceProxy::new_buf(
         pathtag_wgs as u64 * shaders::PATHTAG_REDUCE_WG as u64 * TAG_MONOID_FULL_SIZE,
     );
     recording.dispatch(
         shaders.pathtag_scan,
         (pathtag_wgs as u32, 1, 1),
         [config_buf, scene_buf, reduced_buf, tagmonoid_buf],
     );
     let drawobj_wgs = (n_drawobj + shaders::PATH_BBOX_WG - 1) / shaders::PATH_BBOX_WG;
     let path_bbox_buf = ResourceProxy::new_buf(n_paths as u64 * PATH_BBOX_SIZE);
     let cubic_buf = ResourceProxy::new_buf(n_pathtag as u64 * CUBIC_SIZE);
     let path_coarse_wgs =
         (n_pathtag as u32 + shaders::PATH_COARSE_WG - 1) / shaders::PATH_COARSE_WG;
     let bbox_reduced_buf = ResourceProxy::new_buf(path_coarse_wgs as u64 * BBOX_MONOID_SIZE);
     recording.dispatch(
         shaders.pathseg,
         (path_coarse_wgs, 1, 1),
         [
             config_buf,
             scene_buf,
             tagmonoid_buf,
             path_bbox_buf,
             cubic_buf,
             bbox_reduced_buf,
         ],
     );
     recording.dispatch(
         shaders.bbox_fixup,
         (1, 1, 1),
         [config_buf, tagmonoid_buf, bbox_reduced_buf, path_bbox_buf],
     );
     let draw_reduced_buf = ResourceProxy::new_buf(drawobj_wgs as u64 * DRAWMONOID_SIZE);
     recording.dispatch(
         shaders.draw_reduce,
         (drawobj_wgs, 1, 1),
         [config_buf, scene_buf, draw_reduced_buf],
     );
     let draw_monoid_buf = ResourceProxy::new_buf(n_drawobj as u64 * DRAWMONOID_SIZE);
     let info_bin_data_buf = ResourceProxy::new_buf(1 << 20);
     let clip_inp_buf = ResourceProxy::new_buf(encoding.n_clips as u64 * CLIP_INP_SIZE);
     recording.dispatch(
         shaders.draw_leaf,
         (drawobj_wgs, 1, 1),
         [
             config_buf,
             scene_buf,
             draw_reduced_buf,
             path_bbox_buf,
             draw_monoid_buf,
             info_bin_data_buf,
             clip_inp_buf,
         ],
     );
     let clip_el_buf = ResourceProxy::new_buf(encoding.n_clips as u64 * CLIP_EL_SIZE);
     let clip_bic_buf =
         ResourceProxy::new_buf((n_clip / shaders::CLIP_REDUCE_WG) as u64 * CLIP_BIC_SIZE);
     let clip_wg_reduce = n_clip.saturating_sub(1) / shaders::CLIP_REDUCE_WG;
     if clip_wg_reduce > 0 {
         recording.dispatch(
             shaders.clip_reduce,
             (clip_wg_reduce, 1, 1),
             [
                 config_buf,
                 clip_inp_buf,
                 path_bbox_buf,
                 clip_bic_buf,
                 clip_el_buf,
             ],
         );
     }
     let clip_wg = (n_clip + shaders::CLIP_REDUCE_WG - 1) / shaders::CLIP_REDUCE_WG;
     let clip_bbox_buf = ResourceProxy::new_buf(n_clip as u64 * CLIP_BBOX_SIZE);
     if clip_wg > 0 {
         recording.dispatch(
             shaders.clip_leaf,
             (clip_wg, 1, 1),
             [
                 config_buf,
                 clip_inp_buf,
                 path_bbox_buf,
                 clip_bic_buf,
                 clip_el_buf,
                 draw_monoid_buf,
                 clip_bbox_buf,
             ],
         );
     }
     let draw_bbox_buf = ResourceProxy::new_buf(n_paths as u64 * DRAW_BBOX_SIZE);
     let bump_buf = BufProxy::new(BUMP_SIZE);
     let width_in_bins = (config.width_in_tiles + 15) / 16;
     let height_in_bins = (config.height_in_tiles + 15) / 16;
     let bin_header_buf = ResourceProxy::new_buf((256 * drawobj_wgs) as u64 * BIN_HEADER_SIZE);
     recording.clear_all(bump_buf);
     let bump_buf = ResourceProxy::Buf(bump_buf);
     recording.dispatch(
         shaders.binning,
         (drawobj_wgs, 1, 1),
         [
             config_buf,
             draw_monoid_buf,
             path_bbox_buf,
             clip_bbox_buf,
             draw_bbox_buf,
             bump_buf,
             info_bin_data_buf,
             bin_header_buf,
         ],
     );
     // Note: this only needs to be rounded up because of the workaround to store the tile_offset
     // in storage rather than workgroup memory.
     let n_path_aligned = align_up(n_paths as usize, 256);
     let path_buf = ResourceProxy::new_buf(n_path_aligned as u64 * PATH_SIZE);
     let tile_buf = ResourceProxy::new_buf(1 << 20);
     let path_wgs = (n_paths + shaders::PATH_BBOX_WG - 1) / shaders::PATH_BBOX_WG;
     recording.dispatch(
         shaders.tile_alloc,
         (path_wgs, 1, 1),
         [
             config_buf,
             scene_buf,
             draw_bbox_buf,
             bump_buf,
             path_buf,
             tile_buf,
         ],
     );

     let segments_buf = ResourceProxy::new_buf(1 << 24);
     recording.dispatch(
         shaders.path_coarse,
         (path_coarse_wgs, 1, 1),
         [
             config_buf,
             scene_buf,
             tagmonoid_buf,
             cubic_buf,
             path_buf,
             bump_buf,
             tile_buf,
             segments_buf,
         ],
     );
     recording.dispatch(
         shaders.backdrop,
         (path_wgs, 1, 1),
         [config_buf, path_buf, tile_buf],
     );
     let ptcl_buf = ResourceProxy::new_buf(1 << 24);
     recording.dispatch(
         shaders.coarse,
         (width_in_bins, height_in_bins, 1),
         [
             config_buf,
             scene_buf,
             draw_monoid_buf,
             bin_header_buf,
             info_bin_data_buf,
             path_buf,
             tile_buf,
             bump_buf,
             ptcl_buf,
         ],
     );
     let out_image = ImageProxy::new(width, height, ImageFormat::Rgba8);
     recording.dispatch(
         shaders.fine,
         (config.width_in_tiles, config.height_in_tiles, 1),
         [
             config_buf,
             tile_buf,
             segments_buf,
             ResourceProxy::Image(out_image),
             ptcl_buf,
             gradient_image,
             info_bin_data_buf,
         ],
     );
     (recording, ResourceProxy::Image(out_image))
 }

 pub fn align_up(len: usize, alignment: u32) -> usize {
     len + (len.wrapping_neg() & alignment as usize - 1)
 }
	//! Take an encoded scene and create a graph to render it

	use bytemuck::{Pod, Zeroable};

	use crate::{
	encoding::Encoding,
	engine::{BufProxy, ImageFormat, ImageProxy, Recording, ResourceProxy},
	shaders::{self, FullShaders, Shaders},
	Scene,
	};

	const TAG_MONOID_SIZE: u64 = 12;
	const TAG_MONOID_FULL_SIZE: u64 = 20;
	const PATH_BBOX_SIZE: u64 = 24;
	const CUBIC_SIZE: u64 = 48;
	const DRAWMONOID_SIZE: u64 = 16;
	const MAX_DRAWINFO_SIZE: u64 = 44;
	const CLIP_BIC_SIZE: u64 = 8;
	const CLIP_EL_SIZE: u64 = 32;
	const CLIP_INP_SIZE: u64 = 8;
	const CLIP_BBOX_SIZE: u64 = 16;
	const PATH_SIZE: u64 = 32;
	const DRAW_BBOX_SIZE: u64 = 16;
	const BUMP_SIZE: u64 = 16;
	const BIN_HEADER_SIZE: u64 = 8;
	const BBOX_MONOID_SIZE: u64 = 32;

	// Note: this is defined here as it's still used by the reduced pipeline,
	// but for the full pipeline, use the version in `encoding`.
	#[repr(C)]
	#[derive(Clone, Copy, Debug, Default, Zeroable, Pod)]
	struct Config {
	width_in_tiles: u32,
	height_in_tiles: u32,
	target_width: u32,
	target_height: u32,
	n_drawobj: u32,
	n_path: u32,
	n_clip: u32,
	n_pathtag: u32,
	bin_data_start: u32,
	pathtag_base: u32,
	pathdata_base: u32,
	drawtag_base: u32,
	drawdata_base: u32,
	transform_base: u32,
	linewidth_base: u32,
	}

	fn size_to_words(byte_size: usize) -> u32 {
	(byte_size / std::mem::size_of::<u32>()) as u32
	}

	pub const fn next_multiple_of(val: u32, rhs: u32) -> u32 {
	match val % rhs {
	0 => val,
	r => val + (rhs - r),
	}
	}

	#[allow(unused)]
	fn render(scene: &Scene, shaders: &Shaders) -> (Recording, BufProxy) {
	let mut recording = Recording::default();
	let data = scene.data();
	let n_pathtag = data.path_tags.len();
	let pathtag_padded = align_up(n_pathtag, 4 * shaders::PATHTAG_REDUCE_WG);
	let pathtag_wgs = pathtag_padded / (4 * shaders::PATHTAG_REDUCE_WG as usize);
	let mut scene: Vec<u8> = Vec::with_capacity(pathtag_padded);
	let pathtag_base = size_to_words(scene.len());
	scene.extend(bytemuck::cast_slice(&data.path_tags));
	scene.resize(pathtag_padded, 0);
	let pathdata_base = size_to_words(scene.len());
	scene.extend(&data.path_data);

	let config = Config {
	width_in_tiles: 64,
	height_in_tiles: 64,
	target_width: 64 * 16,
	target_height: 64 * 16,
	pathtag_base,
	pathdata_base,
	..Default::default()
	};
	let scene_buf = recording.upload(scene);
	let config_buf = recording.upload_uniform(bytemuck::bytes_of(&config));

	let reduced_buf = BufProxy::new(pathtag_wgs as u64 * TAG_MONOID_SIZE);
	// TODO: really only need pathtag_wgs - 1
	recording.dispatch(
	shaders.pathtag_reduce,
	(pathtag_wgs as u32, 1, 1),
	[config_buf, scene_buf, reduced_buf],
	);

	let tagmonoid_buf =
	BufProxy::new(pathtag_wgs as u64 * shaders::PATHTAG_REDUCE_WG as u64 * TAG_MONOID_SIZE);
	recording.dispatch(
	shaders.pathtag_scan,
	(pathtag_wgs as u32, 1, 1),
	[config_buf, scene_buf, reduced_buf, tagmonoid_buf],
	);

	let path_coarse_wgs =
	(n_pathtag as u32 + shaders::PATH_COARSE_WG - 1) / shaders::PATH_COARSE_WG;
	// TODO: more principled size calc
	let tiles_buf = BufProxy::new(4097 * 8);
	let segments_buf = BufProxy::new(256 * 24);
	recording.clear_all(tiles_buf);
	recording.dispatch(
	shaders.path_coarse,
	(path_coarse_wgs, 1, 1),
	[
	config_buf,
	scene_buf,
	tagmonoid_buf,
	tiles_buf,
	segments_buf,
	],
	);
	recording.dispatch(
	shaders.backdrop,
	(config.height_in_tiles, 1, 1),
	[config_buf, tiles_buf],
	);
	let out_buf_size = config.width_in_tiles * config.height_in_tiles * 256;
	let out_buf = BufProxy::new(out_buf_size as u64);
	recording.dispatch(
	shaders.fine,
	(config.width_in_tiles, config.height_in_tiles, 1),
	[config_buf, tiles_buf, segments_buf, out_buf],
	);

	recording.download(out_buf);
	(recording, out_buf)
	}

	pub fn render_full(
	scene: &Scene,
	shaders: &FullShaders,
	width: u32,
	height: u32,
	) -> (Recording, ResourceProxy) {
	render_encoding_full(&scene.data(), shaders, width, height)
	}

	pub fn render_encoding_full(
	encoding: &Encoding,
	shaders: &FullShaders,
	width: u32,
	height: u32,
	) -> (Recording, ResourceProxy) {
	use crate::encoding::{resource::ResourceCache, PackedEncoding};
	let mut recording = Recording::default();
	let mut resources = ResourceCache::new();
	let mut packed = PackedEncoding::default();
	packed.pack(&encoding, &mut resources);
	let (ramp_data, ramps_width, ramps_height) = resources.ramps(packed.resources).unwrap();
	let gradient_image = if encoding.patches.is_empty() {
	ResourceProxy::new_image(1, 1, ImageFormat::Rgba8)
	} else {
	let data: &[u8] = bytemuck::cast_slice(ramp_data);
	ResourceProxy::Image(recording.upload_image(
	ramps_width,
	ramps_height,
	ImageFormat::Rgba8,
	data,
	))
	};
	// TODO: calculate for real when we do rectangles
	let n_pathtag = encoding.path_tags.len();
	let pathtag_padded = align_up(encoding.path_tags.len(), 4 * shaders::PATHTAG_REDUCE_WG);
	let n_paths = encoding.n_paths;
	let n_drawobj = n_paths;
	let n_clip = encoding.n_clips;

	let new_width = next_multiple_of(width, 16);
	let new_height = next_multiple_of(height, 16);

	let config = crate::encoding::Config {
	width_in_tiles: new_width / 16,
	height_in_tiles: new_height / 16,
	target_width: width,
	target_height: height,
	layout: packed.layout,
	};
	// println!("{:?}", config);
	let scene_buf = ResourceProxy::Buf(recording.upload(packed.data));
	let config_buf = ResourceProxy::Buf(recording.upload_uniform(bytemuck::bytes_of(&config)));

	let pathtag_wgs = pathtag_padded / (4 * shaders::PATHTAG_REDUCE_WG as usize);
	let reduced_buf = ResourceProxy::new_buf(pathtag_wgs as u64 * TAG_MONOID_FULL_SIZE);
	// TODO: really only need pathtag_wgs - 1
	recording.dispatch(
	shaders.pathtag_reduce,
	(pathtag_wgs as u32, 1, 1),
	[config_buf, scene_buf, reduced_buf],
	);

	let tagmonoid_buf = ResourceProxy::new_buf(
	pathtag_wgs as u64 * shaders::PATHTAG_REDUCE_WG as u64 * TAG_MONOID_FULL_SIZE,
	);
	recording.dispatch(
	shaders.pathtag_scan,
	(pathtag_wgs as u32, 1, 1),
	[config_buf, scene_buf, reduced_buf, tagmonoid_buf],
	);
	let drawobj_wgs = (n_drawobj + shaders::PATH_BBOX_WG - 1) / shaders::PATH_BBOX_WG;
	let path_bbox_buf = ResourceProxy::new_buf(n_paths as u64 * PATH_BBOX_SIZE);
	let cubic_buf = ResourceProxy::new_buf(n_pathtag as u64 * CUBIC_SIZE);
	let path_coarse_wgs =
	(n_pathtag as u32 + shaders::PATH_COARSE_WG - 1) / shaders::PATH_COARSE_WG;
	let bbox_reduced_buf = ResourceProxy::new_buf(path_coarse_wgs as u64 * BBOX_MONOID_SIZE);
	recording.dispatch(
	shaders.pathseg,
	(path_coarse_wgs, 1, 1),
	[
	config_buf,
	scene_buf,
	tagmonoid_buf,
	path_bbox_buf,
	cubic_buf,
	bbox_reduced_buf,
	],
	);
	recording.dispatch(
	shaders.bbox_fixup,
	(1, 1, 1),
	[config_buf, tagmonoid_buf, bbox_reduced_buf, path_bbox_buf],
	);
	let draw_reduced_buf = ResourceProxy::new_buf(drawobj_wgs as u64 * DRAWMONOID_SIZE);
	recording.dispatch(
	shaders.draw_reduce,
	(drawobj_wgs, 1, 1),
	[config_buf, scene_buf, draw_reduced_buf],
	);
	let draw_monoid_buf = ResourceProxy::new_buf(n_drawobj as u64 * DRAWMONOID_SIZE);
	let info_bin_data_buf = ResourceProxy::new_buf(1 << 20);
	let clip_inp_buf = ResourceProxy::new_buf(encoding.n_clips as u64 * CLIP_INP_SIZE);
	recording.dispatch(
	shaders.draw_leaf,
	(drawobj_wgs, 1, 1),
	[
	config_buf,
	scene_buf,
	draw_reduced_buf,
	path_bbox_buf,
	draw_monoid_buf,
	info_bin_data_buf,
	clip_inp_buf,
	],
	);
	let clip_el_buf = ResourceProxy::new_buf(encoding.n_clips as u64 * CLIP_EL_SIZE);
	let clip_bic_buf =
	ResourceProxy::new_buf((n_clip / shaders::CLIP_REDUCE_WG) as u64 * CLIP_BIC_SIZE);
	let clip_wg_reduce = n_clip.saturating_sub(1) / shaders::CLIP_REDUCE_WG;
	if clip_wg_reduce > 0 {
	recording.dispatch(
	shaders.clip_reduce,
	(clip_wg_reduce, 1, 1),
	[
	config_buf,
	clip_inp_buf,
	path_bbox_buf,
	clip_bic_buf,
	clip_el_buf,
	],
	);
	}
	let clip_wg = (n_clip + shaders::CLIP_REDUCE_WG - 1) / shaders::CLIP_REDUCE_WG;
	let clip_bbox_buf = ResourceProxy::new_buf(n_clip as u64 * CLIP_BBOX_SIZE);
	if clip_wg > 0 {
	recording.dispatch(
	shaders.clip_leaf,
	(clip_wg, 1, 1),
	[
	config_buf,
	clip_inp_buf,
	path_bbox_buf,
	clip_bic_buf,
	clip_el_buf,
	draw_monoid_buf,
	clip_bbox_buf,
	],
	);
	}
	let draw_bbox_buf = ResourceProxy::new_buf(n_paths as u64 * DRAW_BBOX_SIZE);
	let bump_buf = BufProxy::new(BUMP_SIZE);
	let width_in_bins = (config.width_in_tiles + 15) / 16;
	let height_in_bins = (config.height_in_tiles + 15) / 16;
	let bin_header_buf = ResourceProxy::new_buf((256 * drawobj_wgs) as u64 * BIN_HEADER_SIZE);
	recording.clear_all(bump_buf);
	let bump_buf = ResourceProxy::Buf(bump_buf);
	recording.dispatch(
	shaders.binning,
	(drawobj_wgs, 1, 1),
	[
	config_buf,
	draw_monoid_buf,
	path_bbox_buf,
	clip_bbox_buf,
	draw_bbox_buf,
	bump_buf,
	info_bin_data_buf,
	bin_header_buf,
	],
	);
	// Note: this only needs to be rounded up because of the workaround to store the tile_offset
	// in storage rather than workgroup memory.
	let n_path_aligned = align_up(n_paths as usize, 256);
	let path_buf = ResourceProxy::new_buf(n_path_aligned as u64 * PATH_SIZE);
	let tile_buf = ResourceProxy::new_buf(1 << 20);
	let path_wgs = (n_paths + shaders::PATH_BBOX_WG - 1) / shaders::PATH_BBOX_WG;
	recording.dispatch(
	shaders.tile_alloc,
	(path_wgs, 1, 1),
	[
	config_buf,
	scene_buf,
	draw_bbox_buf,
	bump_buf,
	path_buf,
	tile_buf,
	],
	);

	let segments_buf = ResourceProxy::new_buf(1 << 24);
	recording.dispatch(
	shaders.path_coarse,
	(path_coarse_wgs, 1, 1),
	[
	config_buf,
	scene_buf,
	tagmonoid_buf,
	cubic_buf,
	path_buf,
	bump_buf,
	tile_buf,
	segments_buf,
	],
	);
	recording.dispatch(
	shaders.backdrop,
	(path_wgs, 1, 1),
	[config_buf, path_buf, tile_buf],
	);
	let ptcl_buf = ResourceProxy::new_buf(1 << 24);
	recording.dispatch(
	shaders.coarse,
	(width_in_bins, height_in_bins, 1),
	[
	config_buf,
	scene_buf,
	draw_monoid_buf,
	bin_header_buf,
	info_bin_data_buf,
	path_buf,
	tile_buf,
	bump_buf,
	ptcl_buf,
	],
	);
	let out_image = ImageProxy::new(width, height, ImageFormat::Rgba8);
	recording.dispatch(
	shaders.fine,
	(config.width_in_tiles, config.height_in_tiles, 1),
	[
	config_buf,
	tile_buf,
	segments_buf,
	ResourceProxy::Image(out_image),
	ptcl_buf,
	gradient_image,
	info_bin_data_buf,
	],
	);
	(recording, ResourceProxy::Image(out_image))
	}

	pub fn align_up(len: usize, alignment: u32) -> usize {
	len + (len.wrapping_neg() & alignment as usize - 1)
	}