| // SPDX-License-Identifier: Apache-2.0 OR MIT OR Unlicense |
| |
| #import config |
| #import pathtag |
| |
| @group(0) @binding(0) |
| var<uniform> config: Config; |
| |
| @group(0) @binding(1) |
| var<storage> scene: array<u32>; |
| |
| @group(0) @binding(2) |
| var<storage> reduced: array<TagMonoid>; |
| |
| @group(0) @binding(3) |
| var<storage, read_write> tag_monoids: array<TagMonoid>; |
| |
| let LG_WG_SIZE = 8u; |
| let WG_SIZE = 256u; |
| |
| #ifdef small |
| var<workgroup> sh_parent: array<TagMonoid, WG_SIZE>; |
| #endif |
| // These could be combined? |
| var<workgroup> sh_monoid: array<TagMonoid, WG_SIZE>; |
| |
| @compute @workgroup_size(256) |
| fn main( |
| @builtin(global_invocation_id) global_id: vec3<u32>, |
| @builtin(local_invocation_id) local_id: vec3<u32>, |
| @builtin(workgroup_id) wg_id: vec3<u32>, |
| ) { |
| #ifdef small |
| var agg = tag_monoid_identity(); |
| if local_id.x < wg_id.x { |
| agg = reduced[local_id.x]; |
| } |
| sh_parent[local_id.x] = agg; |
| for (var i = 0u; i < LG_WG_SIZE; i += 1u) { |
| workgroupBarrier(); |
| if local_id.x + (1u << i) < WG_SIZE { |
| let other = sh_parent[local_id.x + (1u << i)]; |
| agg = combine_tag_monoid(agg, other); |
| } |
| workgroupBarrier(); |
| sh_parent[local_id.x] = agg; |
| } |
| #endif |
| |
| let ix = global_id.x; |
| let tag_word = scene[config.pathtag_base + ix]; |
| var agg_part = reduce_tag(tag_word); |
| sh_monoid[local_id.x] = agg_part; |
| for (var i = 0u; i < LG_WG_SIZE; i += 1u) { |
| workgroupBarrier(); |
| if local_id.x >= 1u << i { |
| let other = sh_monoid[local_id.x - (1u << i)]; |
| agg_part = combine_tag_monoid(other, agg_part); |
| } |
| workgroupBarrier(); |
| sh_monoid[local_id.x] = agg_part; |
| } |
| workgroupBarrier(); |
| // prefix up to this workgroup |
| #ifdef small |
| var tm = sh_parent[0]; |
| #else |
| var tm = reduced[wg_id.x]; |
| #endif |
| if local_id.x > 0u { |
| tm = combine_tag_monoid(tm, sh_monoid[local_id.x - 1u]); |
| } |
| // exclusive prefix sum, granularity of 4 tag bytes |
| tag_monoids[ix] = tm; |
| } |