Commit 12bc9aa9 by steve-lunarg

WIP: HLSL: add Append/ConsumeBuffer support

parent 8e26feb8
...@@ -54,11 +54,14 @@ gl_FragCoord origin is upper left ...@@ -54,11 +54,14 @@ gl_FragCoord origin is upper left
0:16 Sequence 0:16 Sequence
0:16 move second child to first child ( temp uint) 0:16 move second child to first child ( temp uint)
0:16 'c2' ( temp uint) 0:16 'c2' ( temp uint)
0:16 AtomicAdd ( temp uint) 0:16 add ( temp uint)
0:16 @count: direct index for structure ( temp int) 0:16 AtomicAdd ( temp uint)
0:16 'sbuf_rw_d@count' (layout( row_major std430) buffer block{layout( row_major std430) buffer int @count}) 0:16 @count: direct index for structure ( temp int)
0:16 'sbuf_rw_d@count' (layout( row_major std430) buffer block{layout( row_major std430) buffer int @count})
0:16 Constant:
0:16 0 (const int)
0:16 Constant: 0:16 Constant:
0:16 0 (const int) 0:16 -1 (const int)
0:16 Constant: 0:16 Constant:
0:16 -1 (const int) 0:16 -1 (const int)
0:18 Branch: Return with expression 0:18 Branch: Return with expression
...@@ -155,11 +158,14 @@ gl_FragCoord origin is upper left ...@@ -155,11 +158,14 @@ gl_FragCoord origin is upper left
0:16 Sequence 0:16 Sequence
0:16 move second child to first child ( temp uint) 0:16 move second child to first child ( temp uint)
0:16 'c2' ( temp uint) 0:16 'c2' ( temp uint)
0:16 AtomicAdd ( temp uint) 0:16 add ( temp uint)
0:16 @count: direct index for structure ( temp int) 0:16 AtomicAdd ( temp uint)
0:16 'sbuf_rw_d@count' (layout( row_major std430) buffer block{layout( row_major std430) buffer int @count}) 0:16 @count: direct index for structure ( temp int)
0:16 'sbuf_rw_d@count' (layout( row_major std430) buffer block{layout( row_major std430) buffer int @count})
0:16 Constant:
0:16 0 (const int)
0:16 Constant: 0:16 Constant:
0:16 0 (const int) 0:16 -1 (const int)
0:16 Constant: 0:16 Constant:
0:16 -1 (const int) 0:16 -1 (const int)
0:18 Branch: Return with expression 0:18 Branch: Return with expression
...@@ -199,12 +205,12 @@ gl_FragCoord origin is upper left ...@@ -199,12 +205,12 @@ gl_FragCoord origin is upper left
// Module Version 10000 // Module Version 10000
// Generated by (magic number): 80001 // Generated by (magic number): 80001
// Id's are bound by 69 // Id's are bound by 70
Capability Shader Capability Shader
1: ExtInstImport "GLSL.std.450" 1: ExtInstImport "GLSL.std.450"
MemoryModel Logical GLSL450 MemoryModel Logical GLSL450
EntryPoint Fragment 4 "main" 62 65 EntryPoint Fragment 4 "main" 63 66
ExecutionMode 4 OriginUpperLeft ExecutionMode 4 OriginUpperLeft
Source HLSL 500 Source HLSL 500
Name 4 "main" Name 4 "main"
...@@ -222,10 +228,10 @@ gl_FragCoord origin is upper left ...@@ -222,10 +228,10 @@ gl_FragCoord origin is upper left
Name 36 "sbuf_rw_i@count" Name 36 "sbuf_rw_i@count"
Name 42 "c2" Name 42 "c2"
Name 43 "sbuf_rw_d@count" Name 43 "sbuf_rw_d@count"
Name 60 "pos" Name 61 "pos"
Name 62 "pos" Name 63 "pos"
Name 65 "@entryPointOutput" Name 66 "@entryPointOutput"
Name 66 "param" Name 67 "param"
Decorate 19 ArrayStride 16 Decorate 19 ArrayStride 16
MemberDecorate 20(sbuf_rw_i) 0 Offset 0 MemberDecorate 20(sbuf_rw_i) 0 Offset 0
Decorate 20(sbuf_rw_i) BufferBlock Decorate 20(sbuf_rw_i) BufferBlock
...@@ -236,8 +242,8 @@ gl_FragCoord origin is upper left ...@@ -236,8 +242,8 @@ gl_FragCoord origin is upper left
Decorate 34(sbuf_rw_i@count) BufferBlock Decorate 34(sbuf_rw_i@count) BufferBlock
Decorate 36(sbuf_rw_i@count) DescriptorSet 0 Decorate 36(sbuf_rw_i@count) DescriptorSet 0
Decorate 43(sbuf_rw_d@count) DescriptorSet 0 Decorate 43(sbuf_rw_d@count) DescriptorSet 0
Decorate 62(pos) Location 0 Decorate 63(pos) Location 0
Decorate 65(@entryPointOutput) Location 0 Decorate 66(@entryPointOutput) Location 0
2: TypeVoid 2: TypeVoid
3: TypeFunction 2 3: TypeFunction 2
6: TypeInt 32 0 6: TypeInt 32 0
...@@ -270,20 +276,20 @@ gl_FragCoord origin is upper left ...@@ -270,20 +276,20 @@ gl_FragCoord origin is upper left
40: 6(int) Constant 1 40: 6(int) Constant 1
43(sbuf_rw_d@count): 35(ptr) Variable Uniform 43(sbuf_rw_d@count): 35(ptr) Variable Uniform
45: 23(int) Constant 4294967295 45: 23(int) Constant 4294967295
61: TypePointer Input 6(int) 62: TypePointer Input 6(int)
62(pos): 61(ptr) Variable Input 63(pos): 62(ptr) Variable Input
64: TypePointer Output 9(fvec4) 65: TypePointer Output 9(fvec4)
65(@entryPointOutput): 64(ptr) Variable Output 66(@entryPointOutput): 65(ptr) Variable Output
4(main): 2 Function None 3 4(main): 2 Function None 3
5: Label 5: Label
60(pos): 7(ptr) Variable Function 61(pos): 7(ptr) Variable Function
66(param): 7(ptr) Variable Function 67(param): 7(ptr) Variable Function
63: 6(int) Load 62(pos) 64: 6(int) Load 63(pos)
Store 60(pos) 63 Store 61(pos) 64
67: 6(int) Load 60(pos) 68: 6(int) Load 61(pos)
Store 66(param) 67 Store 67(param) 68
68: 9(fvec4) FunctionCall 12(@main(u1;) 66(param) 69: 9(fvec4) FunctionCall 12(@main(u1;) 67(param)
Store 65(@entryPointOutput) 68 Store 66(@entryPointOutput) 69
Return Return
FunctionEnd FunctionEnd
12(@main(u1;): 9(fvec4) Function None 10 12(@main(u1;): 9(fvec4) Function None 10
...@@ -300,17 +306,18 @@ gl_FragCoord origin is upper left ...@@ -300,17 +306,18 @@ gl_FragCoord origin is upper left
Store 33(c1) 41 Store 33(c1) 41
44: 37(ptr) AccessChain 43(sbuf_rw_d@count) 24 44: 37(ptr) AccessChain 43(sbuf_rw_d@count) 24
46: 6(int) AtomicIAdd 44 40 17 45 46: 6(int) AtomicIAdd 44 40 17 45
Store 42(c2) 46 47: 6(int) IAdd 46 45
47: 7(ptr) AccessChain 16(result) 17 Store 42(c2) 47
48: 6(int) Load 47 48: 7(ptr) AccessChain 16(result) 17
49: 8(float) ConvertUToF 48 49: 6(int) Load 48
50: 7(ptr) AccessChain 16(result) 40 50: 8(float) ConvertUToF 49
51: 6(int) Load 50 51: 7(ptr) AccessChain 16(result) 40
52: 8(float) ConvertUToF 51 52: 6(int) Load 51
53: 6(int) Load 33(c1) 53: 8(float) ConvertUToF 52
54: 8(float) ConvertUToF 53 54: 6(int) Load 33(c1)
55: 6(int) Load 42(c2) 55: 8(float) ConvertUToF 54
56: 8(float) ConvertUToF 55 56: 6(int) Load 42(c2)
57: 9(fvec4) CompositeConstruct 49 52 54 56 57: 8(float) ConvertUToF 56
ReturnValue 57 58: 9(fvec4) CompositeConstruct 50 53 55 57
ReturnValue 58
FunctionEnd FunctionEnd
AppendStructuredBuffer<float4> sbuf_a;
ConsumeStructuredBuffer<float4> sbuf_c;
AppendStructuredBuffer<float4> sbuf_unused;
float4 main(uint pos : FOO) : SV_Target0
{
sbuf_a.Append(float4(1,2,3,4));
return sbuf_c.Consume();
}
...@@ -245,6 +245,7 @@ INSTANTIATE_TEST_CASE_P( ...@@ -245,6 +245,7 @@ INSTANTIATE_TEST_CASE_P(
{"hlsl.structarray.flatten.frag", "main"}, {"hlsl.structarray.flatten.frag", "main"},
{"hlsl.structarray.flatten.geom", "main"}, {"hlsl.structarray.flatten.geom", "main"},
{"hlsl.structbuffer.frag", "main"}, {"hlsl.structbuffer.frag", "main"},
{"hlsl.structbuffer.append.frag", "main"},
{"hlsl.structbuffer.atomics.frag", "main"}, {"hlsl.structbuffer.atomics.frag", "main"},
{"hlsl.structbuffer.byte.frag", "main"}, {"hlsl.structbuffer.byte.frag", "main"},
{"hlsl.structbuffer.coherent.frag", "main"}, {"hlsl.structbuffer.coherent.frag", "main"},
......
...@@ -2454,7 +2454,7 @@ bool HlslParseContext::hasStructBuffCounter(const TString& name) const ...@@ -2454,7 +2454,7 @@ bool HlslParseContext::hasStructBuffCounter(const TString& name) const
case EbvRWStructuredBuffer: // ... case EbvRWStructuredBuffer: // ...
return true; return true;
default: default:
return false; // other builtin types do not have. return false; // the other structuredbfufer types do not have a counter.
} }
} }
...@@ -2533,6 +2533,35 @@ void HlslParseContext::decomposeStructBufferMethods(const TSourceLoc& loc, TInte ...@@ -2533,6 +2533,35 @@ void HlslParseContext::decomposeStructBufferMethods(const TSourceLoc& loc, TInte
bufferObj = arguments->getAsSymbolNode(); bufferObj = arguments->getAsSymbolNode();
} }
if (bufferObj == nullptr || bufferObj->getAsSymbolNode() == nullptr)
return;
TString bufferName(bufferObj->getAsSymbolNode()->getName());
const auto bivIt = structBufferBuiltIn.find(bufferName);
if (bivIt == structBufferBuiltIn.end())
return;
const TBuiltInVariable builtInType = bivIt->second;
// Some methods require a hidden internal counter, obtained via getStructBufferCounter().
// This lambda adds something to it and returns the old value.
const auto incDecCounter = [&](int incval) -> TIntermTyped* {
TIntermTyped* incrementValue = intermediate.addConstantUnion(incval, loc, true);
TIntermTyped* counter = getStructBufferCounter(loc, bufferObj); // obtain the counter member
if (counter == nullptr)
return nullptr;
TIntermAggregate* counterIncrement = new TIntermAggregate(EOpAtomicAdd);
counterIncrement->setType(TType(EbtUint, EvqTemporary));
counterIncrement->setLoc(loc);
counterIncrement->getSequence().push_back(counter);
counterIncrement->getSequence().push_back(incrementValue);
return counterIncrement;
};
// Index to obtain the runtime sized array out of the buffer. // Index to obtain the runtime sized array out of the buffer.
TIntermTyped* argArray = indexStructBufferContent(loc, bufferObj); TIntermTyped* argArray = indexStructBufferContent(loc, bufferObj);
if (argArray == nullptr) if (argArray == nullptr)
...@@ -2545,7 +2574,9 @@ void HlslParseContext::decomposeStructBufferMethods(const TSourceLoc& loc, TInte ...@@ -2545,7 +2574,9 @@ void HlslParseContext::decomposeStructBufferMethods(const TSourceLoc& loc, TInte
// Byte address buffers index in bytes (only multiples of 4 permitted... not so much a byte address // Byte address buffers index in bytes (only multiples of 4 permitted... not so much a byte address
// buffer then, but that's what it calls itself. // buffer then, but that's what it calls itself.
const bool isByteAddressBuffer = (argArray->getBasicType() == EbtUint); const bool isByteAddressBuffer = (builtInType == EbvByteAddressBuffer ||
builtInType == EbvRWByteAddressBuffer);
if (isByteAddressBuffer) if (isByteAddressBuffer)
argIndex = intermediate.addBinaryNode(EOpRightShift, argIndex, intermediate.addConstantUnion(2, loc, true), argIndex = intermediate.addBinaryNode(EOpRightShift, argIndex, intermediate.addConstantUnion(2, loc, true),
loc, TType(EbtInt)); loc, TType(EbtInt));
...@@ -2746,28 +2777,50 @@ void HlslParseContext::decomposeStructBufferMethods(const TSourceLoc& loc, TInte ...@@ -2746,28 +2777,50 @@ void HlslParseContext::decomposeStructBufferMethods(const TSourceLoc& loc, TInte
} }
break; break;
case EOpMethodIncrementCounter: case EOpMethodIncrementCounter:
{
node = incDecCounter(1);
break;
}
case EOpMethodDecrementCounter: case EOpMethodDecrementCounter:
{ {
// These methods require a hidden internal counter, obtained via getStructBufferCounter() TIntermTyped* preIncValue = incDecCounter(-1); // result is original value
TIntermTyped* incrementValue = intermediate.addConstantUnion(op == EOpMethodIncrementCounter ? 1 : -1, loc, true); node = intermediate.addBinaryNode(EOpAdd, preIncValue, intermediate.addConstantUnion(-1, loc, true), loc,
TIntermTyped* counter = getStructBufferCounter(loc, bufferObj); // obtain the counter member preIncValue->getType());
break;
}
node = incrementValue; case EOpMethodAppend:
{
TIntermTyped* oldCounter = incDecCounter(1);
if (counter == nullptr) TIntermTyped* lValue = intermediate.addIndex(EOpIndexIndirect, argArray, oldCounter, loc);
break; TIntermTyped* rValue = argAggregate->getSequence()[1]->getAsTyped();
const TType derefType(argArray->getType(), 0);
lValue->setType(derefType);
node = intermediate.addAssign(EOpAssign, lValue, rValue, loc);
node->setType(TType(EbtVoid)); // Append is a void return type
break;
}
case EOpMethodConsume:
{
TIntermTyped* oldCounter = incDecCounter(-1);
TIntermTyped* newCounter = intermediate.addBinaryNode(EOpAdd, oldCounter, intermediate.addConstantUnion(-1, loc, true), loc,
oldCounter->getType());
TIntermAggregate* counterIncrement = new TIntermAggregate(EOpAtomicAdd); node = intermediate.addIndex(EOpIndexIndirect, argArray, newCounter, loc);
counterIncrement->setType(TType(EbtUint, EvqTemporary));
counterIncrement->setLoc(loc);
counterIncrement->getSequence().push_back(counter);
counterIncrement->getSequence().push_back(incrementValue);
node = counterIncrement; const TType derefType(argArray->getType(), 0);
node->setType(derefType);
break;
} }
break;
default: default:
break; // most pass through unchanged break; // most pass through unchanged
...@@ -5954,7 +6007,9 @@ const TFunction* HlslParseContext::findFunction(const TSourceLoc& loc, TFunction ...@@ -5954,7 +6007,9 @@ const TFunction* HlslParseContext::findFunction(const TSourceLoc& loc, TFunction
(candidateList[0]->getBuiltInOp() == EOpMethodAppend || (candidateList[0]->getBuiltInOp() == EOpMethodAppend ||
candidateList[0]->getBuiltInOp() == EOpMethodRestartStrip || candidateList[0]->getBuiltInOp() == EOpMethodRestartStrip ||
candidateList[0]->getBuiltInOp() == EOpMethodIncrementCounter || candidateList[0]->getBuiltInOp() == EOpMethodIncrementCounter ||
candidateList[0]->getBuiltInOp() == EOpMethodDecrementCounter)) { candidateList[0]->getBuiltInOp() == EOpMethodDecrementCounter ||
candidateList[0]->getBuiltInOp() == EOpMethodAppend ||
candidateList[0]->getBuiltInOp() == EOpMethodConsume)) {
return candidateList[0]; return candidateList[0];
} }
......
...@@ -873,6 +873,7 @@ void TBuiltInParseablesHlsl::initialize(int /*version*/, EProfile /*profile*/, c ...@@ -873,6 +873,7 @@ void TBuiltInParseablesHlsl::initialize(int /*version*/, EProfile /*profile*/, c
{ "InterlockedXor", nullptr, nullptr, "-", "-", EShLangAll, true }, { "InterlockedXor", nullptr, nullptr, "-", "-", EShLangAll, true },
{ "IncrementCounter", nullptr, nullptr, "-", "-", EShLangAll, true }, { "IncrementCounter", nullptr, nullptr, "-", "-", EShLangAll, true },
{ "DecrementCounter", nullptr, nullptr, "-", "-", EShLangAll, true }, { "DecrementCounter", nullptr, nullptr, "-", "-", EShLangAll, true },
{ "Consume", nullptr, nullptr, "-", "-", EShLangAll, true },
// Mark end of list, since we want to avoid a range-based for, as some compilers don't handle it yet. // Mark end of list, since we want to avoid a range-based for, as some compilers don't handle it yet.
{ nullptr, nullptr, nullptr, nullptr, nullptr, 0, false }, { nullptr, nullptr, nullptr, nullptr, nullptr, 0, false },
...@@ -1184,7 +1185,7 @@ void TBuiltInParseablesHlsl::identifyBuiltIns(int /*version*/, EProfile /*profil ...@@ -1184,7 +1185,7 @@ void TBuiltInParseablesHlsl::identifyBuiltIns(int /*version*/, EProfile /*profil
symbolTable.relateToOperator(BUILTIN_PREFIX "Store4", EOpMethodStore4); symbolTable.relateToOperator(BUILTIN_PREFIX "Store4", EOpMethodStore4);
symbolTable.relateToOperator(BUILTIN_PREFIX "IncrementCounter", EOpMethodIncrementCounter); symbolTable.relateToOperator(BUILTIN_PREFIX "IncrementCounter", EOpMethodIncrementCounter);
symbolTable.relateToOperator(BUILTIN_PREFIX "DecrementCounter", EOpMethodDecrementCounter); symbolTable.relateToOperator(BUILTIN_PREFIX "DecrementCounter", EOpMethodDecrementCounter);
symbolTable.relateToOperator(BUILTIN_PREFIX "Append", EOpMethodAppend); // Append is also a GS method: we don't add it twice
symbolTable.relateToOperator(BUILTIN_PREFIX "Consume", EOpMethodConsume); symbolTable.relateToOperator(BUILTIN_PREFIX "Consume", EOpMethodConsume);
symbolTable.relateToOperator(BUILTIN_PREFIX "InterlockedAdd", EOpInterlockedAdd); symbolTable.relateToOperator(BUILTIN_PREFIX "InterlockedAdd", EOpInterlockedAdd);
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment