-
Notifications
You must be signed in to change notification settings - Fork 86
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Execution tests for subgroupElect (#4089)
- Loading branch information
1 parent
80edca8
commit 726f4dd
Showing
2 changed files
with
388 additions
and
0 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
384 changes: 384 additions & 0 deletions
384
src/webgpu/shader/execution/expression/call/builtin/subgroupElect.spec.ts
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,384 @@ | ||
export const description = ` | ||
Execution tests for subgroupElect | ||
`; | ||
|
||
import { makeTestGroup } from '../../../../../../common/framework/test_group.js'; | ||
import { keysOf } from '../../../../../../common/util/data_tables.js'; | ||
import { iterRange } from '../../../../../../common/util/util.js'; | ||
|
||
import { | ||
SubgroupTest, | ||
kFramebufferSizes, | ||
getUintsPerFramebuffer, | ||
kWGSizes, | ||
kDataSentinel, | ||
runComputeTest, | ||
runFragmentTest, | ||
kPredicateCases, | ||
} from './subgroup_util.js'; | ||
|
||
export const g = makeTestGroup(SubgroupTest); | ||
|
||
/** | ||
* Checks subgroupElect compute shader results | ||
* | ||
* @param metadata An array of uint32s containing: | ||
* * subgroup_invocation_id in first half | ||
* * subgroup_size in second half | ||
* @param output An array of uint32s containing elect results | ||
* @param filter A functor to determine active invocations | ||
*/ | ||
function checkCompute( | ||
metadata: Uint32Array, | ||
output: Uint32Array, | ||
filter: (id: number, size: number) => boolean | ||
): Error | undefined { | ||
const size = metadata[output.length]; | ||
let elected = 129; | ||
for (let i = 0; i < 128; i++) { | ||
if (filter(i, size)) { | ||
elected = i; | ||
break; | ||
} | ||
} | ||
|
||
for (let i = 0; i < output.length; i++) { | ||
const res = output[i]; | ||
const id = metadata[i]; | ||
let expected = kDataSentinel; | ||
if (filter(id, size)) { | ||
expected = elected === id ? 1 : 0; | ||
} | ||
if (res !== expected) { | ||
return new Error(`Invocation ${i}: incorrect result | ||
- expected: ${expected} | ||
- got: ${res}`); | ||
} | ||
} | ||
|
||
return undefined; | ||
} | ||
|
||
g.test('compute,all_active') | ||
.desc('Test subgroupElect in compute shader with all active invocations') | ||
.params(u => u.combine('wgSize', kWGSizes)) | ||
.beforeAllSubcases(t => { | ||
t.selectDeviceOrSkipTestCase('subgroups' as GPUFeatureName); | ||
}) | ||
.fn(async t => { | ||
const wgThreads = t.params.wgSize[0] * t.params.wgSize[1] * t.params.wgSize[2]; | ||
|
||
const wgsl = ` | ||
enable subgroups; | ||
@group(0) @binding(0) | ||
var<storage> inputs : array<u32>; // unused | ||
@group(0) @binding(1) | ||
var<storage, read_write> outputs : array<u32>; | ||
struct Metadata { | ||
id : array<u32, ${wgThreads}>, | ||
size : array<u32, ${wgThreads}>, | ||
} | ||
@group(0) @binding(2) | ||
var<storage, read_write> metadata : Metadata; | ||
@compute @workgroup_size(${t.params.wgSize[0]}, ${t.params.wgSize[1]}, ${t.params.wgSize[2]}) | ||
fn main( | ||
@builtin(subgroup_invocation_id) id : u32, | ||
@builtin(subgroup_size) subgroupSize : u32, | ||
@builtin(local_invocation_index) lid : u32, | ||
) { | ||
// Force usage. | ||
_ = inputs[0]; | ||
let e = subgroupElect(); | ||
outputs[lid] = select(0u, 1u, e); | ||
metadata.id[lid] = id; | ||
metadata.size[lid] = subgroupSize; | ||
}`; | ||
|
||
const uintsPerOutput = 1; | ||
await runComputeTest( | ||
t, | ||
wgsl, | ||
[t.params.wgSize[0], t.params.wgSize[1], t.params.wgSize[2]], | ||
uintsPerOutput, | ||
new Uint32Array([0]), // unused | ||
(metadata: Uint32Array, output: Uint32Array) => { | ||
return checkCompute(metadata, output, (id: number, size: number) => { | ||
return true; | ||
}); | ||
} | ||
); | ||
}); | ||
|
||
g.test('compute,split') | ||
.desc('Test subgroupElect in compute shader with partially active invocations') | ||
.params(u => | ||
u.combine('predicate', keysOf(kPredicateCases)).beginSubcases().combine('wgSize', kWGSizes) | ||
) | ||
.beforeAllSubcases(t => { | ||
t.selectDeviceOrSkipTestCase('subgroups' as GPUFeatureName); | ||
}) | ||
.fn(async t => { | ||
const testcase = kPredicateCases[t.params.predicate]; | ||
const wgThreads = t.params.wgSize[0] * t.params.wgSize[1] * t.params.wgSize[2]; | ||
|
||
const wgsl = ` | ||
enable subgroups; | ||
diagnostic(off, subgroup_uniformity); | ||
@group(0) @binding(0) | ||
var<storage> inputs : array<u32>; // unused | ||
@group(0) @binding(1) | ||
var<storage, read_write> outputs : array<u32>; | ||
struct Metadata { | ||
id : array<u32, ${wgThreads}>, | ||
size : array<u32, ${wgThreads}>, | ||
} | ||
@group(0) @binding(2) | ||
var<storage, read_write> metadata : Metadata; | ||
@compute @workgroup_size(${t.params.wgSize[0]}, ${t.params.wgSize[1]}, ${t.params.wgSize[2]}) | ||
fn main( | ||
@builtin(subgroup_invocation_id) id : u32, | ||
@builtin(subgroup_size) subgroupSize : u32, | ||
@builtin(local_invocation_index) lid : u32, | ||
) { | ||
// Force usage. | ||
_ = inputs[0]; | ||
metadata.id[lid] = id; | ||
metadata.size[lid] = subgroupSize; | ||
if ${testcase.cond} { | ||
let e = subgroupElect(); | ||
outputs[lid] = select(0u, 1u, e); | ||
} else { | ||
return; | ||
} | ||
}`; | ||
|
||
const uintsPerOutput = 1; | ||
await runComputeTest( | ||
t, | ||
wgsl, | ||
[t.params.wgSize[0], t.params.wgSize[1], t.params.wgSize[2]], | ||
uintsPerOutput, | ||
new Uint32Array([0]), // unused | ||
(metadata: Uint32Array, output: Uint32Array) => { | ||
return checkCompute(metadata, output, testcase.filter); | ||
} | ||
); | ||
}); | ||
|
||
g.test('compute,each_invocation') | ||
.desc('Test subgroupElect in compute shader to elect each possible invocation') | ||
.params(u => | ||
u | ||
.combine('id', [...iterRange(128, x => x)]) | ||
.beginSubcases() | ||
.combine('wgSize', kWGSizes) | ||
) | ||
.beforeAllSubcases(t => { | ||
t.selectDeviceOrSkipTestCase('subgroups' as GPUFeatureName); | ||
}) | ||
.fn(async t => { | ||
const wgThreads = t.params.wgSize[0] * t.params.wgSize[1] * t.params.wgSize[2]; | ||
|
||
interface SubgroupProperties extends GPUAdapterInfo { | ||
subgroupMaxSize: number; | ||
} | ||
const { subgroupMaxSize } = t.device.adapterInfo as SubgroupProperties; | ||
t.skipIf(subgroupMaxSize <= t.params.id, 'No invocation selected'); | ||
|
||
const wgsl = ` | ||
enable subgroups; | ||
diagnostic(off, subgroup_uniformity); | ||
@group(0) @binding(0) | ||
var<storage> inputs : array<u32>; // unused | ||
@group(0) @binding(1) | ||
var<storage, read_write> outputs : array<u32>; | ||
struct Metadata { | ||
id : array<u32, ${wgThreads}>, | ||
size : array<u32, ${wgThreads}>, | ||
} | ||
@group(0) @binding(2) | ||
var<storage, read_write> metadata : Metadata; | ||
@compute @workgroup_size(${t.params.wgSize[0]}, ${t.params.wgSize[1]}, ${t.params.wgSize[2]}) | ||
fn main( | ||
@builtin(subgroup_invocation_id) id : u32, | ||
@builtin(subgroup_size) subgroupSize : u32, | ||
@builtin(local_invocation_index) lid : u32, | ||
) { | ||
// Force usage. | ||
_ = inputs[0]; | ||
metadata.id[lid] = id; | ||
metadata.size[lid] = subgroupSize; | ||
if id >= ${t.params.id} { | ||
let e = subgroupElect(); | ||
outputs[lid] = select(0u, 1u, e); | ||
} else { | ||
return; | ||
} | ||
}`; | ||
|
||
const uintsPerOutput = 1; | ||
await runComputeTest( | ||
t, | ||
wgsl, | ||
[t.params.wgSize[0], t.params.wgSize[1], t.params.wgSize[2]], | ||
uintsPerOutput, | ||
new Uint32Array([0]), // unused | ||
(metadata: Uint32Array, output: Uint32Array) => { | ||
return checkCompute(metadata, output, (id: number, size: number) => { | ||
return id >= t.params.id; | ||
}); | ||
} | ||
); | ||
}); | ||
|
||
/** | ||
* Checks subgroupElect results from a fragment shader. | ||
* | ||
* Avoids subgroups in last row or column to skip potential helper invocations. | ||
* @param data Framebuffer output | ||
* * component 0 is result | ||
* * component 1 is generated subgroup_invocation_id | ||
* * component 2 is generated subgroup id | ||
* @param format The framebuffer format | ||
* @param width Framebuffer width | ||
* @param height Framebuffer height | ||
*/ | ||
function checkFragment( | ||
data: Uint32Array, | ||
format: GPUTextureFormat, | ||
width: number, | ||
height: number | ||
): Error | undefined { | ||
const { uintsPerRow, uintsPerTexel } = getUintsPerFramebuffer(format, width, height); | ||
|
||
// Determine if the subgroup should be included in the checks. | ||
const inBounds = new Map<number, boolean>(); | ||
for (let row = 0; row < height; row++) { | ||
for (let col = 0; col < width; col++) { | ||
const offset = uintsPerRow * row + col * uintsPerTexel; | ||
const subgroup_id = data[offset + 2]; | ||
if (subgroup_id === 0) { | ||
return new Error(`Internal error: helper invocation at (${col}, ${row})`); | ||
} | ||
|
||
let ok = inBounds.get(subgroup_id) ?? true; | ||
ok = ok && row !== height - 1 && col !== width - 1; | ||
inBounds.set(subgroup_id, ok); | ||
} | ||
} | ||
|
||
let anyInBounds = false; | ||
for (const [_, value] of inBounds) { | ||
const ok = Boolean(value); | ||
anyInBounds = anyInBounds || ok; | ||
} | ||
if (!anyInBounds) { | ||
// This variant would not reliably test behavior. | ||
return undefined; | ||
} | ||
|
||
// Iteration skips subgroups in the last row or column to avoid helper | ||
// invocations because it is not guaranteed whether or not they participate | ||
// in the subgroup operation. | ||
for (let row = 0; row < height; row++) { | ||
for (let col = 0; col < width; col++) { | ||
const offset = uintsPerRow * row + col * uintsPerTexel; | ||
const subgroup_id = data[offset + 2]; | ||
|
||
if (subgroup_id === 0) { | ||
return new Error(`Internal error: helper invocation at (${col}, ${row})`); | ||
} | ||
|
||
const subgroupInBounds = inBounds.get(subgroup_id) ?? true; | ||
if (!subgroupInBounds) { | ||
continue; | ||
} | ||
|
||
const res = data[offset]; | ||
const id = data[offset + 1]; | ||
const expected = id === 0 ? 0x55555555 : 0xaaaaaaaa; | ||
if (res !== expected) { | ||
return new Error(`Row ${row}, col ${col}: incorrect result | ||
- expected: 0x${expected.toString(16)} | ||
- got: 0x${res.toString(16)}`); | ||
} | ||
} | ||
} | ||
|
||
return undefined; | ||
} | ||
|
||
g.test('fragment') | ||
.desc('Tests subgroupElect in fragment shaders') | ||
.params(u => | ||
u | ||
.combine('size', kFramebufferSizes) | ||
.beginSubcases() | ||
.combineWithParams([{ format: 'rgba32uint' }] as const) | ||
) | ||
.beforeAllSubcases(t => { | ||
t.selectDeviceOrSkipTestCase('subgroups' as GPUFeatureName); | ||
}) | ||
.fn(async t => { | ||
interface SubgroupProperties extends GPUAdapterInfo { | ||
subgroupMinSize: number; | ||
} | ||
const { subgroupMinSize } = t.device.adapterInfo as SubgroupProperties; | ||
const innerTexels = (t.params.size[0] - 1) * (t.params.size[1] - 1); | ||
t.skipIf(innerTexels < subgroupMinSize, 'Too few texels to be reliable'); | ||
|
||
const fsShader = ` | ||
enable subgroups; | ||
@group(0) @binding(0) | ||
var<storage, read_write> inputs : array<u32>; // unused | ||
@fragment | ||
fn main( | ||
@builtin(position) pos : vec4f, | ||
@builtin(subgroup_invocation_id) id : u32, | ||
) -> @location(0) vec4u { | ||
// Force usage | ||
_ = inputs[0]; | ||
// Generate a subgroup id based on linearized position, avoid 0. | ||
let linear = u32(pos.x) + u32(pos.y) * ${t.params.size[0]}; | ||
let subgroup_id = subgroupBroadcastFirst(linear + 1); | ||
let e = subgroupElect(); | ||
let res = select(0xaaaaaaaau, 0x55555555u, e); | ||
return vec4u(res, id, subgroup_id, 0); | ||
}`; | ||
|
||
await runFragmentTest( | ||
t, | ||
t.params.format, | ||
fsShader, | ||
t.params.size[0], | ||
t.params.size[1], | ||
new Uint32Array([0]), // unused, | ||
(data: Uint32Array) => { | ||
return checkFragment(data, t.params.format, t.params.size[0], t.params.size[1]); | ||
} | ||
); | ||
}); |