Skip to content

Commit 7e113d6

Browse files
authored
Tweak Particle Sample (#492)
I was investigating why this sample didn't work on compat mode in Chrome. I found 1 issue in the code which is the shader that makes the probability map only worked if the source image is was a multiple of 64 pixels wide. This was because it was not conditionally skipping out of bounds pixels and so processing those pixels would end up overwriting other results. This issue does not come up in the sample but if you change the image to some image that is not a multiple of 64 pixels across the issue comes up. In debugging why GL was failing, one my paths was to make a 16x16 pixel `F` using the canvas 2D api and passing that in so that I could print all of the data. With that I ran into this issue. So, I added the skipping. Thank's to Peter McNeeley for finding that issue. While pursing the code I find somethings I though maybe should be refactored? * Calculating the number of mip level was done in a loop. Changed it to just math. * Moving some calculations to use properties on the texture. I can revert these changes. They were useful when I switched the source image to a canvas since then the code didn't depend on variables that were no longer available. * Getting rid of `struct Buffer` I can revert these changes. I get the impression that this was a limitation of an earlier version of WGSL? It seems more confusing to me personally to have a struct with a single array in it than to just have the array. * Simpler math I can revert this but, changed `sum = dot(vec4f(a, b, c, d), vec4f(1.0))` to `sum = a + b + c + d`. Note that, even with the change for the first pass, the code only works for square power-of-2 images. Both the probability generation and the usage of that data require each mip level to be exactly 1/2 the size of the previous level. So, added some asserts so people copying this won't stumble into issues.
1 parent 7dfbacd commit 7e113d6

File tree

2 files changed

+58
-60
lines changed

2 files changed

+58
-60
lines changed

sample/particles/main.ts

+36-39
Original file line numberDiff line numberDiff line change
@@ -182,39 +182,30 @@ quadVertexBuffer.unmap();
182182
//////////////////////////////////////////////////////////////////////////////
183183
// Texture
184184
//////////////////////////////////////////////////////////////////////////////
185-
let texture: GPUTexture;
186-
let textureWidth = 1;
187-
let textureHeight = 1;
188-
let numMipLevels = 1;
189-
{
190-
const response = await fetch('../../assets/img/webgpu.png');
191-
const imageBitmap = await createImageBitmap(await response.blob());
192-
193-
// Calculate number of mip levels required to generate the probability map
194-
while (
195-
textureWidth < imageBitmap.width ||
196-
textureHeight < imageBitmap.height
197-
) {
198-
textureWidth *= 2;
199-
textureHeight *= 2;
200-
numMipLevels++;
201-
}
202-
texture = device.createTexture({
203-
size: [imageBitmap.width, imageBitmap.height, 1],
204-
mipLevelCount: numMipLevels,
205-
format: 'rgba8unorm',
206-
usage:
207-
GPUTextureUsage.TEXTURE_BINDING |
208-
GPUTextureUsage.STORAGE_BINDING |
209-
GPUTextureUsage.COPY_DST |
210-
GPUTextureUsage.RENDER_ATTACHMENT,
211-
});
212-
device.queue.copyExternalImageToTexture(
213-
{ source: imageBitmap },
214-
{ texture: texture },
215-
[imageBitmap.width, imageBitmap.height]
216-
);
217-
}
185+
const isPowerOf2 = (v: number) => Math.log2(v) % 1 === 0;
186+
const response = await fetch('../../assets/img/webgpu.png');
187+
const imageBitmap = await createImageBitmap(await response.blob());
188+
assert(imageBitmap.width === imageBitmap.height, 'image must be square');
189+
assert(isPowerOf2(imageBitmap.width), 'image must be a power of 2');
190+
191+
// Calculate number of mip levels required to generate the probability map
192+
const mipLevelCount =
193+
(Math.log2(Math.max(imageBitmap.width, imageBitmap.height)) + 1) | 0;
194+
const texture = device.createTexture({
195+
size: [imageBitmap.width, imageBitmap.height, 1],
196+
mipLevelCount,
197+
format: 'rgba8unorm',
198+
usage:
199+
GPUTextureUsage.TEXTURE_BINDING |
200+
GPUTextureUsage.STORAGE_BINDING |
201+
GPUTextureUsage.COPY_DST |
202+
GPUTextureUsage.RENDER_ATTACHMENT,
203+
});
204+
device.queue.copyExternalImageToTexture(
205+
{ source: imageBitmap },
206+
{ texture: texture },
207+
[imageBitmap.width, imageBitmap.height]
208+
);
218209

219210
//////////////////////////////////////////////////////////////////////////////
220211
// Probability map generation
@@ -247,22 +238,22 @@ let numMipLevels = 1;
247238
usage: GPUBufferUsage.UNIFORM | GPUBufferUsage.COPY_DST,
248239
});
249240
const buffer_a = device.createBuffer({
250-
size: textureWidth * textureHeight * 4,
241+
size: texture.width * texture.height * 4,
251242
usage: GPUBufferUsage.STORAGE,
252243
});
253244
const buffer_b = device.createBuffer({
254-
size: textureWidth * textureHeight * 4,
245+
size: buffer_a.size,
255246
usage: GPUBufferUsage.STORAGE,
256247
});
257248
device.queue.writeBuffer(
258249
probabilityMapUBOBuffer,
259250
0,
260-
new Int32Array([textureWidth])
251+
new Uint32Array([texture.width])
261252
);
262253
const commandEncoder = device.createCommandEncoder();
263-
for (let level = 0; level < numMipLevels; level++) {
264-
const levelWidth = textureWidth >> level;
265-
const levelHeight = textureHeight >> level;
254+
for (let level = 0; level < texture.mipLevelCount; level++) {
255+
const levelWidth = Math.max(1, texture.width >> level);
256+
const levelHeight = Math.max(1, texture.height >> level);
266257
const pipeline =
267258
level == 0
268259
? probabilityMapImportLevelPipeline.getBindGroupLayout(0)
@@ -472,3 +463,9 @@ function frame() {
472463
}
473464
configureContext();
474465
requestAnimationFrame(frame);
466+
467+
function assert(cond: boolean, msg = '') {
468+
if (!cond) {
469+
throw new Error(msg);
470+
}
471+
}

sample/particles/probabilityMap.wgsl

+22-21
Original file line numberDiff line numberDiff line change
@@ -2,17 +2,12 @@ struct UBO {
22
width : u32,
33
}
44

5-
struct Buffer {
6-
weights : array<f32>,
7-
}
8-
95
@binding(0) @group(0) var<uniform> ubo : UBO;
10-
@binding(1) @group(0) var<storage, read> buf_in : Buffer;
11-
@binding(2) @group(0) var<storage, read_write> buf_out : Buffer;
6+
@binding(1) @group(0) var<storage, read> buf_in : array<f32>;
7+
@binding(2) @group(0) var<storage, read_write> buf_out : array<f32>;
128
@binding(3) @group(0) var tex_in : texture_2d<f32>;
139
@binding(3) @group(0) var tex_out : texture_storage_2d<rgba8unorm, write>;
1410

15-
1611
////////////////////////////////////////////////////////////////////////////////
1712
// import_level
1813
//
@@ -21,9 +16,13 @@ struct Buffer {
2116
////////////////////////////////////////////////////////////////////////////////
2217
@compute @workgroup_size(64)
2318
fn import_level(@builtin(global_invocation_id) coord : vec3u) {
24-
_ = &buf_in;
19+
_ = &buf_in; // so the bindGroups are similar.
20+
if (!all(coord.xy < vec2u(textureDimensions(tex_in)))) {
21+
return;
22+
}
23+
2524
let offset = coord.x + coord.y * ubo.width;
26-
buf_out.weights[offset] = textureLoad(tex_in, vec2i(coord.xy), 0).w;
25+
buf_out[offset] = textureLoad(tex_in, vec2i(coord.xy), 0).w;
2726
}
2827

2928
////////////////////////////////////////////////////////////////////////////////
@@ -36,19 +35,21 @@ fn import_level(@builtin(global_invocation_id) coord : vec3u) {
3635
////////////////////////////////////////////////////////////////////////////////
3736
@compute @workgroup_size(64)
3837
fn export_level(@builtin(global_invocation_id) coord : vec3u) {
39-
if (all(coord.xy < vec2u(textureDimensions(tex_out)))) {
40-
let dst_offset = coord.x + coord.y * ubo.width;
41-
let src_offset = coord.x*2u + coord.y*2u * ubo.width;
38+
if (!all(coord.xy < vec2u(textureDimensions(tex_out)))) {
39+
return;
40+
}
4241

43-
let a = buf_in.weights[src_offset + 0u];
44-
let b = buf_in.weights[src_offset + 1u];
45-
let c = buf_in.weights[src_offset + 0u + ubo.width];
46-
let d = buf_in.weights[src_offset + 1u + ubo.width];
47-
let sum = dot(vec4f(a, b, c, d), vec4f(1.0));
42+
let dst_offset = coord.x + coord.y * ubo.width;
43+
let src_offset = coord.x*2u + coord.y*2u * ubo.width;
4844

49-
buf_out.weights[dst_offset] = sum / 4.0;
45+
let a = buf_in[src_offset + 0u];
46+
let b = buf_in[src_offset + 1u];
47+
let c = buf_in[src_offset + 0u + ubo.width];
48+
let d = buf_in[src_offset + 1u + ubo.width];
49+
let sum = a + b + c + d;
5050

51-
let probabilities = vec4f(a, a+b, a+b+c, sum) / max(sum, 0.0001);
52-
textureStore(tex_out, vec2i(coord.xy), probabilities);
53-
}
51+
buf_out[dst_offset] = sum / 4.0;
52+
53+
let probabilities = vec4f(a, a+b, a+b+c, sum) / max(sum, 0.0001);
54+
textureStore(tex_out, vec2i(coord.xy), probabilities);
5455
}

0 commit comments

Comments
 (0)