| #version 460 |
| |
| vec4 undeclared_errors(vec4 f4) |
| { |
| vec4 result; |
| gl_SubgroupSize; // ERROR, extension not enabled (basic) |
| gl_SubgroupInvocationID; // ERROR, extension not enabled (basic) |
| subgroupBarrier(); // ERROR, extension not enabled (basic) |
| subgroupMemoryBarrier(); // ERROR, extension not enabled (basic) |
| subgroupMemoryBarrierBuffer(); // ERROR, extension not enabled (basic) |
| subgroupMemoryBarrierImage(); // ERROR, extension not enabled (basic) |
| subgroupElect(); // ERROR, extension not enabled (basic) |
| gl_NumSubgroups; // ERROR, extension not enabled (basic) |
| gl_SubgroupID; // ERROR, extension not enabled (basic) |
| subgroupMemoryBarrierShared(); // ERROR, extension not enabled (basic) |
| |
| subgroupAll(true); // ERROR extension not enabled (vote) |
| subgroupAny(false); // ERROR extension not enabled (vote) |
| subgroupAllEqual(f4); // ERROR extension not enabled (vote) |
| |
| gl_SubgroupEqMask; // ERROR extension not enabled (ballot) |
| gl_SubgroupGeMask; // ERROR extension not enabled (ballot) |
| gl_SubgroupGtMask; // ERROR extension not enabled (ballot) |
| gl_SubgroupLeMask; // ERROR extension not enabled (ballot) |
| gl_SubgroupLtMask; // ERROR extension not enabled (ballot) |
| subgroupBroadcast(f4, 0); // ERROR extension not enabled (ballot) |
| subgroupBroadcastFirst(f4); // ERROR extension not enabled (ballot) |
| uvec4 ballot = subgroupBallot(false); // ERROR extension not enabled (ballot) |
| subgroupInverseBallot(uvec4(0x1)); // ERROR extension not enabled (ballot) |
| subgroupBallotBitExtract(ballot, 0); // ERROR extension not enabled (ballot) |
| subgroupBallotBitCount(ballot); // ERROR extension not enabled (ballot) |
| subgroupBallotInclusiveBitCount(ballot); // ERROR extension not enabled (ballot) |
| subgroupBallotExclusiveBitCount(ballot); // ERROR extension not enabled (ballot) |
| subgroupBallotFindLSB(ballot); // ERROR extension not enabled (ballot) |
| subgroupBallotFindMSB(ballot); // ERROR extension not enabled (ballot) |
| |
| subgroupShuffle(f4, 0); // ERROR extension not enabled (shuffle) |
| subgroupShuffleXor(f4, 0x1); // ERROR extension not enabled (shuffle) |
| subgroupShuffleUp(f4, 1); // ERROR extension not enabled (shuffle_relative) |
| subgroupShuffleDown(f4, 1); // ERROR extension not enabled (shuffle_relative) |
| |
| result = subgroupAdd(f4); // ERROR, extension not enabled (arith) |
| subgroupMul(f4); // ERROR, extension not enabled (arith) |
| subgroupMin(f4); // ERROR, extension not enabled (arith) |
| subgroupMax(f4); // ERROR, extension not enabled (arith) |
| subgroupAnd(ballot); // ERROR, extension not enabled (arith) |
| subgroupOr(ballot); // ERROR, extension not enabled (arith) |
| subgroupXor(ballot); // ERROR, extension not enabled (arith) |
| subgroupInclusiveAdd(f4); // ERROR, extension not enabled (arith) |
| subgroupInclusiveMul(f4); // ERROR, extension not enabled (arith) |
| subgroupInclusiveMin(f4); // ERROR, extension not enabled (arith) |
| subgroupInclusiveMax(f4); // ERROR, extension not enabled (arith) |
| subgroupInclusiveAnd(ballot); // ERROR, extension not enabled (arith) |
| subgroupInclusiveOr(ballot); // ERROR, extension not enabled (arith) |
| subgroupInclusiveXor(ballot); // ERROR, extension not enabled (arith) |
| subgroupExclusiveAdd(f4); // ERROR, extension not enabled (arith) |
| subgroupExclusiveMul(f4); // ERROR, extension not enabled (arith) |
| subgroupExclusiveMin(f4); // ERROR, extension not enabled (arith) |
| subgroupExclusiveMax(f4); // ERROR, extension not enabled (arith) |
| subgroupExclusiveAnd(ballot); // ERROR, extension not enabled (arith) |
| subgroupExclusiveOr(ballot); // ERROR, extension not enabled (arith) |
| subgroupExclusiveXor(ballot); // ERROR, extension not enabled (arith) |
| |
| subgroupClusteredAdd(f4, 2); // ERROR, extension not enabled (clustered) |
| subgroupClusteredMul(f4, 2); // ERROR, extension not enabled (clustered) |
| subgroupClusteredMin(f4, 2); // ERROR, extension not enabled (clustered) |
| subgroupClusteredMax(f4, 2); // ERROR, extension not enabled (clustered) |
| subgroupClusteredAnd(ballot, 2); // ERROR, extension not enabled (clustered) |
| subgroupClusteredOr(ballot, 2); // ERROR, extension not enabled (clustered) |
| subgroupClusteredXor(ballot, 2); // ERROR, extension not enabled (clustered) |
| |
| subgroupQuadBroadcast(f4, 0); // ERROR, extension not enabled (quad) |
| subgroupQuadSwapHorizontal(f4); // ERROR, extension not enabled (quad) |
| subgroupQuadSwapVertical(f4); // ERROR, extension not enabled (quad) |
| subgroupQuadSwapDiagonal(f4); // ERROR, extension not enabled (quad) |
| |
| uvec4 parti = subgroupPartitionNV(f4); // ERROR, extension not enabled (partitioned) |
| subgroupPartitionedAddNV(f4, parti); // ERROR, extension not enabled (partitioned) |
| subgroupPartitionedMulNV(f4, parti); // ERROR, extension not enabled (partitioned) |
| subgroupPartitionedMinNV(f4, parti); // ERROR, extension not enabled (partitioned) |
| subgroupPartitionedMaxNV(f4, parti); // ERROR, extension not enabled (partitioned) |
| subgroupPartitionedAndNV(ballot, parti); // ERROR, extension not enabled (partitioned) |
| subgroupPartitionedOrNV(ballot, parti); // ERROR, extension not enabled (partitioned) |
| subgroupPartitionedXorNV(ballot, parti); // ERROR, extension not enabled (partitioned) |
| subgroupPartitionedInclusiveAddNV(f4, parti); // ERROR, extension not enabled (partitioned) |
| subgroupPartitionedInclusiveMulNV(f4, parti); // ERROR, extension not enabled (partitioned) |
| subgroupPartitionedInclusiveMinNV(f4, parti); // ERROR, extension not enabled (partitioned) |
| subgroupPartitionedInclusiveMaxNV(f4, parti); // ERROR, extension not enabled (partitioned) |
| subgroupPartitionedInclusiveAndNV(ballot, parti); // ERROR, extension not enabled (partitioned) |
| subgroupPartitionedInclusiveOrNV(ballot, parti); // ERROR, extension not enabled (partitioned) |
| subgroupPartitionedInclusiveXorNV(ballot, parti); // ERROR, extension not enabled (partitioned) |
| subgroupPartitionedExclusiveAddNV(f4, parti); // ERROR, extension not enabled (partitioned) |
| subgroupPartitionedExclusiveMulNV(f4, parti); // ERROR, extension not enabled (partitioned) |
| subgroupPartitionedExclusiveMinNV(f4, parti); // ERROR, extension not enabled (partitioned) |
| subgroupPartitionedExclusiveMaxNV(f4, parti); // ERROR, extension not enabled (partitioned) |
| subgroupPartitionedExclusiveAndNV(ballot, parti); // ERROR, extension not enabled (partitioned) |
| subgroupPartitionedExclusiveOrNV(ballot, parti); // ERROR, extension not enabled (partitioned) |
| subgroupPartitionedExclusiveXorNV(ballot, parti); // ERROR, extension not enabled (partitioned) |
| |
| return result; |
| } |
| |
| #define MAX_VER 81 |
| #define MAX_PRIM 32 |
| |
| #define BARRIER() \ |
| memoryBarrierShared(); \ |
| barrier(); |
| |
| #extension GL_NV_mesh_shader : enable |
| |
| layout(local_size_x = 32) in; |
| |
| layout(max_vertices=MAX_VER) out; |
| layout(max_primitives=MAX_PRIM) out; |
| layout(triangles) out; |
| |
| // test use of builtins in mesh shaders: |
| |
| void main() |
| { |
| uint iid = gl_LocalInvocationID.x; |
| uint gid = gl_WorkGroupID.x; |
| |
| gl_MeshVerticesNV[iid].gl_Position = vec4(1.0); |
| gl_MeshVerticesNV[iid].gl_PointSize = 2.0; |
| gl_MeshVerticesNV[iid].gl_ClipDistance[3] = 3.0; |
| gl_MeshVerticesNV[iid].gl_CullDistance[2] = 4.0; |
| |
| BARRIER(); |
| |
| gl_MeshVerticesNV[iid+1].gl_Position = gl_MeshVerticesNV[iid].gl_Position; |
| gl_MeshVerticesNV[iid+1].gl_PointSize = gl_MeshVerticesNV[iid].gl_PointSize; |
| gl_MeshVerticesNV[iid+1].gl_ClipDistance[3] = gl_MeshVerticesNV[iid].gl_ClipDistance[3]; |
| gl_MeshVerticesNV[iid+1].gl_CullDistance[2] = gl_MeshVerticesNV[iid].gl_CullDistance[2]; |
| |
| BARRIER(); |
| |
| gl_MeshPrimitivesNV[iid].gl_PrimitiveID = 6; |
| gl_MeshPrimitivesNV[iid].gl_Layer = 7; |
| gl_MeshPrimitivesNV[iid].gl_ViewportIndex = 8; |
| gl_MeshPrimitivesNV[iid].gl_ViewportMask[0] = 9; |
| |
| BARRIER(); |
| |
| gl_MeshPrimitivesNV[iid+1].gl_PrimitiveID = gl_MeshPrimitivesNV[iid].gl_PrimitiveID; |
| gl_MeshPrimitivesNV[iid+1].gl_Layer = gl_MeshPrimitivesNV[iid].gl_Layer; |
| gl_MeshPrimitivesNV[iid+1].gl_ViewportIndex = gl_MeshPrimitivesNV[iid].gl_ViewportIndex; |
| gl_MeshPrimitivesNV[iid+1].gl_ViewportMask[0] = gl_MeshPrimitivesNV[iid].gl_ViewportMask[0]; |
| |
| BARRIER(); |
| |
| // check bound limits |
| gl_PrimitiveIndicesNV[0] = 257; // should truncate 257 -> 1 |
| gl_PrimitiveIndicesNV[(MAX_PRIM * 3) - 1] = 2; |
| gl_PrimitiveIndicesNV[gid] = gl_PrimitiveIndicesNV[gid-1]; |
| |
| // writes 4 indices at offset gl_DrawID |
| writePackedPrimitiveIndices4x8NV(gl_DrawID, 0x01020304); |
| |
| gl_PrimitiveCountNV = MAX_PRIM * 3; |
| |
| BARRIER(); |
| } |
| |
| #extension GL_KHR_shader_subgroup_basic: enable |
| void basic_works (void) |
| { |
| gl_SubgroupSize; |
| gl_SubgroupInvocationID; |
| subgroupBarrier(); |
| subgroupMemoryBarrier(); |
| subgroupMemoryBarrierBuffer(); |
| subgroupMemoryBarrierImage(); |
| subgroupElect(); |
| gl_NumSubgroups; // allowed in mesh |
| gl_SubgroupID; // allowed in mesh |
| subgroupMemoryBarrierShared(); // allowed in mesh |
| } |
| |
| #extension GL_KHR_shader_subgroup_ballot: enable |
| void ballot_works(vec4 f4) { |
| gl_SubgroupEqMask; |
| gl_SubgroupGeMask; |
| gl_SubgroupGtMask; |
| gl_SubgroupLeMask; |
| gl_SubgroupLtMask; |
| subgroupBroadcast(f4, 0); |
| subgroupBroadcastFirst(f4); |
| uvec4 ballot = subgroupBallot(false); |
| subgroupInverseBallot(uvec4(0x1)); |
| subgroupBallotBitExtract(ballot, 0); |
| subgroupBallotBitCount(ballot); |
| subgroupBallotInclusiveBitCount(ballot); |
| subgroupBallotExclusiveBitCount(ballot); |
| subgroupBallotFindLSB(ballot); |
| subgroupBallotFindMSB(ballot); |
| } |
| |
| #extension GL_KHR_shader_subgroup_vote: enable |
| void vote_works(vec4 f4) |
| { |
| subgroupAll(true); |
| subgroupAny(false); |
| subgroupAllEqual(f4); |
| } |
| |
| #extension GL_KHR_shader_subgroup_shuffle: enable |
| #extension GL_KHR_shader_subgroup_shuffle_relative: enable |
| void shuffle_works(vec4 f4) |
| { |
| subgroupShuffle(f4, 0); |
| subgroupShuffleXor(f4, 0x1); |
| subgroupShuffleUp(f4, 1); |
| subgroupShuffleDown(f4, 1); |
| } |
| |
| #extension GL_KHR_shader_subgroup_arithmetic: enable |
| void arith_works(vec4 f4) |
| { |
| uvec4 ballot; |
| subgroupAdd(f4); |
| subgroupMul(f4); |
| subgroupMin(f4); |
| subgroupMax(f4); |
| subgroupAnd(ballot); |
| subgroupOr(ballot); |
| subgroupXor(ballot); |
| subgroupInclusiveAdd(f4); |
| subgroupInclusiveMul(f4); |
| subgroupInclusiveMin(f4); |
| subgroupInclusiveMax(f4); |
| subgroupInclusiveAnd(ballot); |
| subgroupInclusiveOr(ballot); |
| subgroupInclusiveXor(ballot); |
| subgroupExclusiveAdd(f4); |
| subgroupExclusiveMul(f4); |
| subgroupExclusiveMin(f4); |
| subgroupExclusiveMax(f4); |
| subgroupExclusiveAnd(ballot); |
| subgroupExclusiveOr(ballot); |
| subgroupExclusiveXor(ballot); |
| } |
| |
| #extension GL_KHR_shader_subgroup_clustered: enable |
| void clustered_works(vec4 f4) |
| { |
| uvec4 ballot = uvec4(0x55,0,0,0); |
| subgroupClusteredAdd(f4, 2); |
| subgroupClusteredMul(f4, 2); |
| subgroupClusteredMin(f4, 2); |
| subgroupClusteredMax(f4, 2); |
| subgroupClusteredAnd(ballot, 2); |
| subgroupClusteredOr(ballot, 2); |
| subgroupClusteredXor(ballot, 2); |
| } |
| |
| #extension GL_KHR_shader_subgroup_quad: enable |
| void quad_works(vec4 f4) |
| { |
| subgroupQuadBroadcast(f4, 0); |
| subgroupQuadSwapHorizontal(f4); |
| subgroupQuadSwapVertical(f4); |
| subgroupQuadSwapDiagonal(f4); |
| } |
| |
| #extension GL_NV_shader_subgroup_partitioned: enable |
| void partitioned_works(vec4 f4) |
| { |
| uvec4 parti = subgroupPartitionNV(f4); |
| uvec4 ballot = uvec4(0x55,0,0,0); |
| subgroupPartitionedAddNV(f4, parti); |
| subgroupPartitionedMulNV(f4, parti); |
| subgroupPartitionedMinNV(f4, parti); |
| subgroupPartitionedMaxNV(f4, parti); |
| subgroupPartitionedAndNV(ballot, parti); |
| subgroupPartitionedOrNV(ballot, parti); |
| subgroupPartitionedXorNV(ballot, parti); |
| subgroupPartitionedInclusiveAddNV(f4, parti); |
| subgroupPartitionedInclusiveMulNV(f4, parti); |
| subgroupPartitionedInclusiveMinNV(f4, parti); |
| subgroupPartitionedInclusiveMaxNV(f4, parti); |
| subgroupPartitionedInclusiveAndNV(ballot, parti); |
| subgroupPartitionedInclusiveOrNV(ballot, parti); |
| subgroupPartitionedInclusiveXorNV(ballot, parti); |
| subgroupPartitionedExclusiveAddNV(f4, parti); |
| subgroupPartitionedExclusiveMulNV(f4, parti); |
| subgroupPartitionedExclusiveMinNV(f4, parti); |
| subgroupPartitionedExclusiveMaxNV(f4, parti); |
| subgroupPartitionedExclusiveAndNV(ballot, parti); |
| subgroupPartitionedExclusiveOrNV(ballot, parti); |
| subgroupPartitionedExclusiveXorNV(ballot, parti); |
| } |
| |
| // tests for NV_shader_sm_builtins |
| void sm_builtins_err() |
| { |
| gl_WarpsPerSMNV; // ERROR, no extension |
| gl_SMCountNV; // ERROR, no extension |
| gl_WarpIDNV; // ERROR, no extension |
| gl_SMIDNV; // ERROR, no extension |
| } |
| |
| #ifdef GL_NV_shader_sm_builtins |
| #extension GL_NV_shader_sm_builtins : enable |
| #endif |
| |
| void sm_builtins() |
| { |
| gl_WarpsPerSMNV; |
| gl_SMCountNV; |
| gl_WarpIDNV; |
| gl_SMIDNV; |
| } |