From 4cfc2c101e4cfe2a57223ee5e593247fdc72c874 Mon Sep 17 00:00:00 2001 From: Gregg Tavares Date: Mon, 16 Dec 2024 11:50:01 +0900 Subject: [PATCH] Refactor discard test for no storage buffers --- .../execution/statement/discard.spec.ts | 229 ++++++++++++------ 1 file changed, 157 insertions(+), 72 deletions(-) diff --git a/src/webgpu/shader/execution/statement/discard.spec.ts b/src/webgpu/shader/execution/statement/discard.spec.ts index 53f03b7edca0..4e0589bf34e7 100644 --- a/src/webgpu/shader/execution/statement/discard.spec.ts +++ b/src/webgpu/shader/execution/statement/discard.spec.ts @@ -15,10 +15,10 @@ Conditions that still occur: import { makeTestGroup } from '../../../../common/framework/test_group.js'; import { iterRange } from '../../../../common/util/util.js'; -import { GPUTest } from '../../../gpu_test.js'; +import { GPUTest, MaxLimitsTestMixin } from '../../../gpu_test.js'; import { checkElementsPassPredicate } from '../../../util/check_contents.js'; -export const g = makeTestGroup(GPUTest); +export const g = makeTestGroup(MaxLimitsTestMixin(GPUTest)); // Framebuffer dimensions const kWidth = 64; @@ -27,7 +27,7 @@ const kHeight = 64; const kSharedCode = ` @group(0) @binding(0) var output: array; @group(0) @binding(1) var atomicIndex : atomic; -@group(0) @binding(2) var uniformValues : array; +@group(0) @binding(2) var uniformValues : array; @vertex fn vsMain(@builtin(vertex_index) index : u32) -> @builtin(position) vec4f { @@ -48,6 +48,10 @@ fn vsMain(@builtin(vertex_index) index : u32) -> @builtin(position) vec4f { } `; +function hasStorageBuffers(t: GPUTest) { + return t.isCompatibility ? t.device.limits.maxStorageBuffersInFragmentStage! >= 2 : true; +} + function drawFullScreen( t: GPUTest, code: string, @@ -63,7 +67,7 @@ function drawFullScreen( fragment: { module: t.device.createShaderModule({ code }), entryPoint: 'fsMain', - targets: [{ format: 'r32uint' }], + targets: [{ format: 'rg32uint' }], }, primitive: { topology: 'triangle-list', @@ -78,13 +82,13 @@ function drawFullScreen( GPUTextureUsage.COPY_DST | GPUTextureUsage.RENDER_ATTACHMENT | GPUTextureUsage.TEXTURE_BINDING, - format: 'r32uint', + format: 'rg32uint', }); // Create a buffer to copy the framebuffer contents into. // Initialize with a sentinel value and load this buffer to detect unintended writes. const fbBuffer = t.makeBufferWithContents( - new Uint32Array([...iterRange(kWidth * kHeight, x => kWidth * kHeight)]), + new Uint32Array([...iterRange(kWidth * kHeight * 2, x => kWidth * kHeight)]), GPUBufferUsage.COPY_SRC | GPUBufferUsage.COPY_DST ); @@ -98,33 +102,44 @@ function drawFullScreen( usage: GPUBufferUsage.COPY_SRC | GPUBufferUsage.COPY_DST | GPUBufferUsage.STORAGE, }); - const uniformSize = bytesPerWord * 5; + const uniformSize = bytesPerWord * 5 * 4; const uniformBuffer = t.makeBufferWithContents( // Loop bound, [derivative constants]. - new Uint32Array([4, 1, 4, 4, 7]), - GPUBufferUsage.COPY_DST | GPUBufferUsage.STORAGE + // prettier-ignore + new Uint32Array([ + 4, 0, 0, 0, + 1, 0, 0, 0, + 4, 0, 0, 0, + 4, 0, 0, 0, + 7, 0, 0, 0, + ]), + GPUBufferUsage.COPY_DST | GPUBufferUsage.UNIFORM ); // 'atomicIndex' packed at the end of the buffer. const bg = t.device.createBindGroup({ layout: pipeline.getBindGroupLayout(0), entries: [ - { - binding: 0, - resource: { - buffer: dataBuffer, - offset: 0, - size: dataSize, - }, - }, - { - binding: 1, - resource: { - buffer: dataBuffer, - offset: dataSize, - size: bytesPerWord, - }, - }, + ...(hasStorageBuffers(t) + ? [ + { + binding: 0, + resource: { + buffer: dataBuffer, + offset: 0, + size: dataSize, + }, + }, + { + binding: 1, + resource: { + buffer: dataBuffer, + offset: dataSize, + size: bytesPerWord, + }, + }, + ] + : []), { binding: 2, resource: { @@ -141,7 +156,7 @@ function drawFullScreen( { buffer: fbBuffer, offset: 0, - bytesPerRow: kWidth * bytesPerWord, + bytesPerRow: kWidth * bytesPerWord * 2, rowsPerImage: kHeight, }, { texture: framebuffer }, @@ -165,21 +180,23 @@ function drawFullScreen( { buffer: fbBuffer, offset: 0, - bytesPerRow: kWidth * bytesPerWord, + bytesPerRow: kWidth * bytesPerWord * 2, rowsPerImage: kHeight, }, { width: kWidth, height: kHeight } ); t.queue.submit([encoder.finish()]); - t.expectGPUBufferValuesPassCheck(dataBuffer, dataChecker, { - type: Float32Array, - typedLength: dataSize / bytesPerWord, - }); + if (hasStorageBuffers(t)) { + t.expectGPUBufferValuesPassCheck(dataBuffer, dataChecker, { + type: Float32Array, + typedLength: dataSize / bytesPerWord, + }); + } t.expectGPUBufferValuesPassCheck(fbBuffer, framebufferChecker, { type: Uint32Array, - typedLength: kWidth * kHeight, + typedLength: kWidth * kHeight * 2, }); } @@ -190,12 +207,18 @@ g.test('all') ${kSharedCode} @fragment -fn fsMain(@builtin(position) pos : vec4f) -> @location(0) u32 { +fn fsMain(@builtin(position) pos : vec4f) -> @location(0) vec2u { _ = uniformValues[0]; discard; + ${ + hasStorageBuffers(t) + ? ` let idx = atomicAdd(&atomicIndex, 1); output[idx] = pos.xy; - return 1; + ` + : '' + } + return vec2u(1); } `; @@ -249,14 +272,23 @@ g.test('three_quarters') ${kSharedCode} @fragment -fn fsMain(@builtin(position) pos : vec4f) -> @location(0) u32 { +fn fsMain(@builtin(position) pos : vec4f) -> @location(0) vec2u { _ = uniformValues[0]; if (pos.x >= 0.5 * ${kWidth} || pos.y >= 0.5 * ${kHeight}) { discard; } + ${ + hasStorageBuffers(t) + ? ` let idx = atomicAdd(&atomicIndex, 1); output[idx] = pos.xy; - return idx; + return vec2u(idx); + ` + : ` + return vec2(u32(pos.x), u32(pos.y)); + + ` + } } `; @@ -301,17 +333,22 @@ fn fsMain(@builtin(position) pos : vec4f) -> @location(0) u32 { ); }; const fbChecker = (a: Uint32Array) => { + const discarded = (x: number, y: number) => x >= kWidth / 2 || y >= kHeight / 2; return checkElementsPassPredicate( a, (idx: number, value: number | bigint) => { - const x = idx % kWidth; - const y = Math.floor(idx / kWidth); - if (x < kWidth / 2 && y < kHeight / 2) { - return value < (kWidth * kHeight) / 4; - } else { + const fragId = (idx / 2) | 0; + const x = fragId % kWidth; + const y = (fragId / kWidth) | 0; + if (discarded(x, y)) { return value === kWidth * kHeight; + } else { + if (hasStorageBuffers(t)) { + return value < (kWidth * kHeight) / 4; + } else { + return value === (idx % 2 ? y : x); + } } - return value < (kWidth * kHeight) / 4; }, { predicatePrinter: [ @@ -320,10 +357,10 @@ fn fsMain(@builtin(position) pos : vec4f) -> @location(0) u32 { getValueForCell: (idx: number) => { const x = idx % kWidth; const y = Math.floor(idx / kWidth); - if (x < kWidth / 2 && y < kHeight / 2) { - return 'any'; - } else { + if (discarded(x, y)) { return 0; + } else { + return hasStorageBuffers(t) ? 'any' : idx % 2 ? y : x; } }, }, @@ -352,12 +389,20 @@ fn foo(pos : vec2f) { } @fragment -fn fsMain(@builtin(position) pos : vec4f) -> @location(0) u32 { +fn fsMain(@builtin(position) pos : vec4f) -> @location(0) vec2u { _ = uniformValues[0]; foo(pos.xy); + ${ + hasStorageBuffers(t) + ? ` let idx = atomicAdd(&atomicIndex, 1); output[idx] = pos.xy; - return idx; + return vec2u(idx); + ` + : ` + return vec2u(u32(pos.x), u32(pos.y)); + ` + } } `; @@ -396,15 +441,22 @@ fn fsMain(@builtin(position) pos : vec4f) -> @location(0) u32 { ); }; const fbChecker = (a: Uint32Array) => { + const discarded = (x: number, y: number) => + (x >= kWidth / 2 && y >= kHeight / 2) || (x <= kWidth / 2 && y <= kHeight / 2); return checkElementsPassPredicate( a, (idx: number, value: number | bigint) => { - const x = idx % kWidth; - const y = Math.floor(idx / kWidth); - if ((x >= kWidth / 2 && y >= kHeight / 2) || (x <= kWidth / 2 && y <= kHeight / 2)) { + const fragId = (idx / 2) | 0; + const x = fragId % kWidth; + const y = (fragId / kWidth) | 0; + if (discarded(x, y)) { return value === kWidth * kHeight; } else { - return value < (kWidth * kHeight) / 2; + if (hasStorageBuffers(t)) { + return value < (kWidth * kHeight) / 2; + } else { + return value === (idx % 2 ? y : x); + } } }, { @@ -414,13 +466,10 @@ fn fsMain(@builtin(position) pos : vec4f) -> @location(0) u32 { getValueForCell: (idx: number) => { const x = idx % kWidth; const y = Math.floor(idx / kWidth); - if ( - (x <= kWidth / 2 && y <= kHeight / 2) || - (x >= kWidth / 2 && y >= kHeight / 2) - ) { + if (discarded(x, y)) { return kWidth * kHeight; } - return 'any'; + return hasStorageBuffers(t) ? 'any' : idx % 2 ? y : x; }, }, ], @@ -438,16 +487,22 @@ g.test('loop') ${kSharedCode} @fragment -fn fsMain(@builtin(position) pos : vec4f) -> @location(0) u32 { +fn fsMain(@builtin(position) pos : vec4f) -> @location(0) vec2u { _ = uniformValues[0]; for (var i = 0; i < 2; i++) { if i > 0 { discard; } } + ${ + hasStorageBuffers(t) + ? ` let idx = atomicAdd(&atomicIndex, 1); output[idx] = pos.xy; - return 1; + ` + : '' + } + return vec2u(1); } `; @@ -501,7 +556,7 @@ g.test('continuing') ${kSharedCode} @fragment -fn fsMain(@builtin(position) pos : vec4f) -> @location(0) u32 { +fn fsMain(@builtin(position) pos : vec4f) -> @location(0) vec2u { _ = uniformValues[0]; var i = 0; loop { @@ -513,9 +568,15 @@ fn fsMain(@builtin(position) pos : vec4f) -> @location(0) u32 { break if i >= 2; } } + ${ + hasStorageBuffers(t) + ? ` let idx = atomicAdd(&atomicIndex, 1); output[idx] = pos.xy; - return 1; + ` + : '' + } + return vec2u(1); } `; @@ -569,13 +630,19 @@ g.test('uniform_read_loop') ${kSharedCode} @fragment -fn fsMain(@builtin(position) pos : vec4f) -> @location(0) u32 { +fn fsMain(@builtin(position) pos : vec4f) -> @location(0) vec2u { discard; - for (var i = 0u; i < uniformValues[0]; i++) { + for (var i = 0u; i < uniformValues[0].x; i++) { } + ${ + hasStorageBuffers(t) + ? ` let idx = atomicAdd(&atomicIndex, 1); output[idx] = pos.xy; - return 1; + ` + : '' + } + return vec2u(1); } `; @@ -629,7 +696,7 @@ g.test('derivatives') ${kSharedCode} @fragment -fn fsMain(@builtin(position) pos : vec4f) -> @location(0) u32 { +fn fsMain(@builtin(position) pos : vec4f) -> @location(0) vec2u { let ipos = vec2i(pos.xy); let lsb = ipos & vec2(0x1); let left_sel = select(2, 4, lsb.y == 1); @@ -639,12 +706,20 @@ fn fsMain(@builtin(position) pos : vec4f) -> @location(0) u32 { discard; } - let v = uniformValues[uidx]; - let idx = atomicAdd(&atomicIndex, 1); + let v = uniformValues[uidx].x; let dx = dpdx(f32(v)); let dy = dpdy(f32(v)); + ${ + hasStorageBuffers(t) + ? ` + let idx = atomicAdd(&atomicIndex, 1); output[idx] = vec2(dx, dy); - return idx; + return vec2u(idx); + ` + : ` + return bitcast(vec2f(dx, dy)); + ` + } } `; @@ -678,15 +753,25 @@ fn fsMain(@builtin(position) pos : vec4f) -> @location(0) u32 { // 3/4 of the fragments are written. const fbChecker = (a: Uint32Array) => { + const discarded = (x: number, y: number) => ((x | y) & 0x1) === 0; + const asF32 = new Float32Array(1); + const asU32 = new Uint32Array(asF32.buffer); return checkElementsPassPredicate( a, (idx: number, value: number | bigint) => { - const x = idx % kWidth; - const y = Math.floor(idx / kWidth); - if (((x | y) & 0x1) === 0) { + const fragId = (idx / 2) | 0; + const x = fragId % kWidth; + const y = (fragId / kWidth) | 0; + if (discarded(x, y)) { return value === kWidth * kHeight; } else { - return value < (3 * (kWidth * kHeight)) / 4; + if (hasStorageBuffers(t)) { + return value < (3 * (kWidth * kHeight)) / 4; + } else { + asU32[0] = value as number; + const v = asF32[0]; + return v === -3 || v === 3; + } } }, { @@ -699,7 +784,7 @@ fn fsMain(@builtin(position) pos : vec4f) -> @location(0) u32 { if (((x | y) & 0x1) === 0) { return kWidth * kHeight; } else { - return 'any'; + return hasStorageBuffers(t) ? 'any' : '+/- 3'; } }, },