Commit 54ac5e82 by Nicolas Capens

Fix transpose2x4().

Change-Id: I079991d257be4aa00a0aef938ccf0110cd005bcd
Reviewed-on: https://swiftshader-review.googlesource.com/8288
Tested-by: Nicolas Capens <capn@google.com>
Reviewed-by: Nicolas Capens <capn@google.com>
parent 5b41ba36
......@@ -475,18 +475,13 @@ namespace sw
void transpose2x4(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3)
{
row0 = UnpackLow(row0, row1);
row1 = Float4(row0.zw, row1.zw);
row2 = UnpackHigh(row0, row1);
row3 = Float4(row2.zw, row3.zw);
}
Float4 tmp01 = UnpackLow(row0, row1);
Float4 tmp23 = UnpackHigh(row0, row1);
void transpose2x4h(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3)
{
row0 = UnpackLow(row2, row3);
row1 = Float4(row0.zw, row1.zw);
row2 = UnpackHigh(row2, row3);
row3 = Float4(row2.zw, row3.zw);
row0 = tmp01;
row1 = Float4(tmp01.zw, row1.zw);
row2 = tmp23;
row3 = Float4(tmp23.zw, row3.zw);
}
void transpose4xN(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3, int N)
......
......@@ -87,7 +87,6 @@ namespace sw
void transpose4x2(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3);
void transpose4x1(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3);
void transpose2x4(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3);
void transpose2x4h(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3);
void transpose4xN(Float4 &row0, Float4 &row1, Float4 &row2, Float4 &row3, int N);
class Register
......
......@@ -687,7 +687,7 @@ namespace sw
}
else
{
if(state.output[i].write == 0x02)
if(state.output[i].write == 0x03)
{
transpose2x4(v.x, v.y, v.z, v.w);
}
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment