/*-------------------------------------------------------------------------
* drawElements Quality Program OpenGL ES 3.0 Module
* -------------------------------------------------
*
* Copyright 2014 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
*//*!
* \file
* \brief Shader precision tests.
*
* \note Floating-point case uses R32UI render target and uses
* floatBitsToUint() in shader to write out floating-point value bits.
* This is done since ES3 core doesn't support FP render targets.
*//*--------------------------------------------------------------------*/
#include "es3fShaderPrecisionTests.hpp"
#include "tcuVector.hpp"
#include "tcuTestLog.hpp"
#include "tcuVectorUtil.hpp"
#include "tcuFloat.hpp"
#include "tcuFormatUtil.hpp"
#include "gluRenderContext.hpp"
#include "gluShaderProgram.hpp"
#include "gluShaderUtil.hpp"
#include "gluDrawUtil.hpp"
#include "deRandom.hpp"
#include "deString.h"
#include "glwEnums.hpp"
#include "glwFunctions.hpp"
#include <algorithm>
namespace deqp
{
namespace gles3
{
namespace Functional
{
using std::string;
using std::vector;
using std::ostringstream;
using tcu::TestLog;
//! Size, in pixels, of the offscreen renderbuffer that every precision case
//! in this file allocates, renders to and reads back.
enum
{
FRAMEBUFFER_WIDTH = 32,
FRAMEBUFFER_HEIGHT = 32
};
/*--------------------------------------------------------------------*//*!
 * \brief Build the GLSL ES 3.00 program that evaluates a float expression.
 *
 * The expression \a evalOp may refer to the operands as in0 and in1. It is
 * placed in the vertex shader when \a isVertexCase is true and in the
 * fragment shader otherwise. The fragment shader always writes the bits of
 * the result, via floatBitsToUint(), to the highp uint output o_out.
 *
 * \param context		Render context the program is created in.
 * \param precision		Precision qualifier used for operands and result.
 * \param evalOp		GLSL expression to evaluate.
 * \param isVertexCase	Selects the stage that evaluates the expression.
 * \return Newly allocated program; the caller is responsible for deleting
 *		   it. Compile/link status is not checked here.
 *//*--------------------------------------------------------------------*/
static glu::ShaderProgram* createFloatPrecisionEvalProgram (const glu::RenderContext& context, glu::Precision precision, const char* evalOp, bool isVertexCase)
{
	// "<precision> <type>" prefix shared by every operand/result declaration.
	const string		valueDecl	= string(glu::getPrecisionName(precision)) + " " + glu::getDataTypeName(glu::TYPE_FLOAT);
	const char* const	resultType	= glu::getDataTypeName(glu::TYPE_UINT);
	const char* const	operandSrc	= isVertexCase ? "a_" : "v_";
	const char* const	mainHeader	= "\nvoid main (void)\n{\n";

	ostringstream		evalCode;
	ostringstream		vertSrc;
	ostringstream		fragSrc;

	// Statements that load the operands and evaluate the expression. They
	// end up in whichever stage is under test.
	evalCode << "\t" << valueDecl << " in0 = " << operandSrc << "in0;\n"
			 << "\t" << valueDecl << " in1 = " << operandSrc << "in1;\n";

	if (isVertexCase)
		evalCode << "\tv_out = " << evalOp << ";\n";
	else
		evalCode << "\t" << valueDecl << " res;\n"
				 << "\tres = " << evalOp << ";\n";

	// Declarations common to both variants.
	vertSrc << "#version 300 es\n"
			<< "in highp vec4 a_position;\n"
			<< "in " << valueDecl << " a_in0;\n"
			<< "in " << valueDecl << " a_in1;\n";

	fragSrc << "#version 300 es\n"
			<< "layout(location = 0) out highp " << resultType << " o_out;\n";

	if (isVertexCase)
	{
		// Vertex shader computes, fragment shader only forwards the bits.
		vertSrc << "flat out " << valueDecl << " v_out;\n"
				<< mainHeader
				<< " gl_Position = a_position;\n"
				<< evalCode.str()
				<< "}\n";

		fragSrc << "flat in " << valueDecl << " v_out;\n"
				<< mainHeader
				<< " o_out = floatBitsToUint(v_out);\n"
				<< "}\n";
	}
	else
	{
		// Vertex shader passes the operands through, fragment shader computes.
		vertSrc << "flat out " << valueDecl << " v_in0;\n"
				<< "flat out " << valueDecl << " v_in1;\n"
				<< mainHeader
				<< " gl_Position = a_position;\n"
				<< " v_in0 = a_in0;\n"
				<< " v_in1 = a_in1;\n"
				<< "}\n";

		fragSrc << "flat in " << valueDecl << " v_in0;\n"
				<< "flat in " << valueDecl << " v_in1;\n"
				<< mainHeader
				<< evalCode.str()
				<< " o_out = floatBitsToUint(res);\n"
				<< "}\n";
	}

	return new glu::ShaderProgram(context, glu::makeVtxFragSources(vertSrc.str(), fragSrc.str()));
}
/*--------------------------------------------------------------------*//*!
 * \brief Build the GLSL ES 3.00 program that evaluates an integer expression.
 *
 * The expression \a evalOp may refer to the operands as in0 and in1. It is
 * placed in the vertex shader when \a isVertexCase is true and in the
 * fragment shader otherwise. The result is written to the fragment output
 * o_out, which is declared with the same type and precision as the operands.
 *
 * \param context		Render context the program is created in.
 * \param type			Data type used for operands and result.
 * \param precision		Precision qualifier used for operands and result.
 * \param evalOp		GLSL expression to evaluate.
 * \param isVertexCase	Selects the stage that evaluates the expression.
 * \return Newly allocated program; the caller is responsible for deleting
 *		   it. Compile/link status is not checked here.
 *//*--------------------------------------------------------------------*/
static glu::ShaderProgram* createIntUintPrecisionEvalProgram (const glu::RenderContext& context, glu::DataType type, glu::Precision precision, const char* evalOp, bool isVertexCase)
{
	// "<precision> <type>" prefix shared by every declaration.
	const string		valueDecl	= string(glu::getPrecisionName(precision)) + " " + glu::getDataTypeName(type);
	const char* const	operandSrc	= isVertexCase ? "a_" : "v_";
	const char* const	resultDst	= isVertexCase ? "v_" : "o_";
	const char* const	mainHeader	= "\nvoid main (void)\n{\n";

	ostringstream		evalCode;
	ostringstream		vertSrc;
	ostringstream		fragSrc;

	// Operand loads and the evaluated expression, emitted into the tested stage.
	evalCode << "\t" << valueDecl << " in0 = " << operandSrc << "in0;\n"
			 << "\t" << valueDecl << " in1 = " << operandSrc << "in1;\n"
			 << "\t" << resultDst << "out = " << evalOp << ";\n";

	// Declarations common to both variants.
	vertSrc << "#version 300 es\n"
			<< "in highp vec4 a_position;\n"
			<< "in " << valueDecl << " a_in0;\n"
			<< "in " << valueDecl << " a_in1;\n";

	fragSrc << "#version 300 es\n"
			<< "layout(location = 0) out " << valueDecl << " o_out;\n";

	if (isVertexCase)
	{
		// Vertex shader computes, fragment shader copies the varying out.
		vertSrc << "flat out " << valueDecl << " v_out;\n"
				<< mainHeader
				<< " gl_Position = a_position;\n"
				<< evalCode.str()
				<< "}\n";

		fragSrc << "flat in " << valueDecl << " v_out;\n"
				<< mainHeader
				<< " o_out = v_out;\n"
				<< "}\n";
	}
	else
	{
		// Vertex shader passes the operands through, fragment shader computes.
		vertSrc << "flat out " << valueDecl << " v_in0;\n"
				<< "flat out " << valueDecl << " v_in1;\n"
				<< mainHeader
				<< " gl_Position = a_position;\n"
				<< " v_in0 = a_in0;\n"
				<< " v_in1 = a_in1;\n"
				<< "}\n";

		fragSrc << "flat in " << valueDecl << " v_in0;\n"
				<< "flat in " << valueDecl << " v_in1;\n"
				<< mainHeader
				<< evalCode.str()
				<< "}\n";
	}

	return new glu::ShaderProgram(context, glu::makeVtxFragSources(vertSrc.str(), fragSrc.str()));
}
/*--------------------------------------------------------------------*//*!
 * \brief Floating-point arithmetic precision test case.
 *
 * Evaluates a GLSL expression on random operand pairs in either the vertex
 * or the fragment shader, reads the result bits back from an R32UI render
 * target and compares them against a double-precision host reference.
 *//*--------------------------------------------------------------------*/
class ShaderFloatPrecisionCase : public TestCase
{
public:
//! Host-side reference for the tested operation, evaluated in double precision.
typedef double (*EvalFunc) (double in0, double in1);
ShaderFloatPrecisionCase (Context& context, const char* name, const char* desc, const char* op, EvalFunc evalFunc, glu::Precision precision, const tcu::Vec2& rangeA, const tcu::Vec2& rangeB, bool isVertexCase);
~ShaderFloatPrecisionCase (void);
void init (void);
void deinit (void);
IterateResult iterate (void);
protected:
//! Compares a shader result against the reference; returns true when the
//! difference is within the ULP tolerance allowed for the case precision.
bool compare (float in0, float in1, double reference, float result)
#if (DE_COMPILER == DE_COMPILER_GCC) && (DE_CPU == DE_CPU_ARM_64)
# if (__GNUC__ == 4) && (__GNUC_MINOR__ == 9) && (__GNUC_PATCHLEVEL__ == 0)
// Some prerelease GCC 4.9 versions have a bug in shift right when
// targeting ARMv8.
//
// If compiler wants to perform logical shift by variable/register
// in fp/vector registers it uses USHL that selects shift direction
// based on shift operand value. Thus for right shifts the shift
// operand needs to be negated.
//
// The bug is in right shift pattern; it doesn't mark shift operand
// as clobbered and thus later code using that same register may
// see the negated value.
//
// Workaround is to disable optimization for this function.
//
// See https://gcc.gnu.org/bugzilla/show_bug.cgi?id=61633
__attribute__((optimize(0)))
# endif
#endif
;
private:
// Copy construction and assignment are declared private to forbid copying.
ShaderFloatPrecisionCase (const ShaderFloatPrecisionCase& other);
ShaderFloatPrecisionCase& operator= (const ShaderFloatPrecisionCase& other);
// Case parameters.
std::string m_op; //!< GLSL expression evaluated in the shader (operands are in0 and in1).
EvalFunc m_evalFunc; //!< Host reference implementation of m_op.
glu::Precision m_precision; //!< Precision qualifier under test.
tcu::Vec2 m_rangeA; //!< Range for in0: x() is the lower bound, y() the upper bound.
tcu::Vec2 m_rangeB; //!< Range for in1: x() is the lower bound, y() the upper bound.
bool m_isVertexCase; //!< True when the expression is evaluated in the vertex shader.
int m_numTestsPerIter; //!< Number of random operand pairs tested per iterate() call.
int m_numIters; //!< Number of iterate() calls before the case stops.
de::Random m_rnd; //!< Operand generator, seeded from the case name.
// Iteration state.
glu::ShaderProgram* m_program; //!< Owned; created in init(), deleted in deinit().
deUint32 m_framebuffer; //!< GL framebuffer object name, 0 when not created.
deUint32 m_renderbuffer; //!< GL renderbuffer object name, 0 when not created.
int m_iterNdx; //!< Index of the next iteration to run.
};
//! Stores the case parameters. No GL objects are created here; that happens in init().
ShaderFloatPrecisionCase::ShaderFloatPrecisionCase (Context& context, const char* name, const char* desc, const char* op, EvalFunc evalFunc, glu::Precision precision, const tcu::Vec2& rangeA, const tcu::Vec2& rangeB, bool isVertexCase)
: TestCase (context, name, desc)
, m_op (op)
, m_evalFunc (evalFunc)
, m_precision (precision)
, m_rangeA (rangeA)
, m_rangeB (rangeB)
, m_isVertexCase (isVertexCase)
, m_numTestsPerIter (32)
, m_numIters (4)
, m_rnd (deStringHash(name)) // Seed derived from the case name.
, m_program (DE_NULL)
, m_framebuffer (0)
, m_renderbuffer (0)
, m_iterNdx (0)
{
}
//! Releases the program and GL objects if they are still alive.
ShaderFloatPrecisionCase::~ShaderFloatPrecisionCase (void)
{
// Class-qualified call: always runs this class's deinit().
ShaderFloatPrecisionCase::deinit();
}
void ShaderFloatPrecisionCase::init (void)
{
const glw::Functions& gl = m_context.getRenderContext().getFunctions();
TestLog& log = m_testCtx.getLog();
DE_ASSERT(!m_program && !m_framebuffer && !m_renderbuffer);
// Create program.
m_program = createFloatPrecisionEvalProgram(m_context.getRenderContext(), m_precision, m_op.c_str(), m_isVertexCase);
log << *m_program;
TCU_CHECK(m_program->isOk());
// Create framebuffer.
gl.genFramebuffers(1, &m_framebuffer);
gl.genRenderbuffers(1, &m_renderbuffer);
gl.bindRenderbuffer(GL_RENDERBUFFER, m_renderbuffer);
gl.renderbufferStorage(GL_RENDERBUFFER, GL_R32UI, FRAMEBUFFER_WIDTH, FRAMEBUFFER_HEIGHT);
gl.bindFramebuffer(GL_FRAMEBUFFER, m_framebuffer);
gl.framebufferRenderbuffer(GL_FRAMEBUFFER, GL_COLOR_ATTACHMENT0, GL_RENDERBUFFER, m_renderbuffer);
GLU_EXPECT_NO_ERROR(gl.getError(), "Post framebuffer setup");
TCU_CHECK(gl.checkFramebufferStatus(GL_FRAMEBUFFER) == GL_FRAMEBUFFER_COMPLETE);
gl.bindFramebuffer(GL_FRAMEBUFFER, m_context.getRenderContext().getDefaultFramebuffer());
// Initialize test result to pass.
m_testCtx.setTestResult(QP_TEST_RESULT_PASS, "Pass");
m_iterNdx = 0;
}
/*--------------------------------------------------------------------*//*!
 * \brief Delete the program and GL objects and reset the handles.
 *
 * Safe to call when nothing has been created: GL deletes are skipped for
 * zero handles.
 *//*--------------------------------------------------------------------*/
void ShaderFloatPrecisionCase::deinit (void)
{
	delete m_program;
	m_program = DE_NULL;

	if (m_framebuffer != 0)
	{
		m_context.getRenderContext().getFunctions().deleteFramebuffers(1, &m_framebuffer);
		m_framebuffer = 0;
	}

	if (m_renderbuffer != 0)
	{
		m_context.getRenderContext().getFunctions().deleteRenderbuffers(1, &m_renderbuffer);
		m_renderbuffer = 0;
	}
}
bool ShaderFloatPrecisionCase::compare (float in0, float in1, double reference, float result)
{
// Comparison is done using 64-bit reference value to accurately evaluate rounding mode error.
// If 32-bit reference value is used, 2 bits of rounding error must be allowed.
// For mediump and lowp types the comparison currently allows 3 bits of rounding error:
// two bits from conversions and one from actual operation.
// \todo [2013-09-30 pyry] Make this more strict: determine if rounding can actually happen.
const int mantissaBits = m_precision == glu::PRECISION_HIGHP ? 23 : 10;
const int numPrecBits = 52 - mantissaBits;
const int in0Exp = tcu::Float32(in0).exponent();
const int in1Exp = tcu::Float32(in1).exponent();
const int resExp = tcu::Float32(result).exponent();
const int numLostBits = de::max(de::max(in0Exp-resExp, in1Exp-resExp), 0); // Lost due to mantissa shift.
const int roundingUlpError = m_precision == glu::PRECISION_HIGHP ? 1 : 3;
const int maskBits = numLostBits + numPrecBits;
m_testCtx.getLog() << TestLog::Message << "Assuming " << mantissaBits << " mantissa bits, " << numLostBits << " bits lost in operation, and " << roundingUlpError << " ULP rounding error."
<< TestLog::EndMessage;
{
const deUint64 refBits = tcu::Float64(reference).bits();
const deUint64 resBits = tcu::Float64(result).bits();
const deUint64 accurateRefBits = maskBits < 64 ? refBits >> (deUint64)maskBits : 0u;
const deUint64 accurateResBits = maskBits < 64 ? resBits >> (deUint64)maskBits : 0u;
const deUint64 ulpDiff = (deUint64)de::abs((deInt64)accurateRefBits - (deInt64)accurateResBits);
if (ulpDiff > (deUint64)roundingUlpError)
{
m_testCtx.getLog() << TestLog::Message << "ERROR: comparison failed! ULP diff (ignoring lost/undefined bits) = " << ulpDiff << TestLog::EndMessage;
return false;
}
else
return true;
}
}
/*--------------------------------------------------------------------*//*!
 * \brief Run one batch of random floating-point tests.
 *
 * For each of m_numTestsPerIter operand pairs: computes the reference on
 * the host, draws a full-viewport quad into the test framebuffer, reads
 * the pixels back, checks the first pixel with compare() and then checks
 * that all other pixels carry the same bits. Stops at the first failing
 * pair. The default framebuffer binding is restored before returning.
 *
 * \return CONTINUE while iterations remain and the result is still pass,
 *		   STOP otherwise.
 *//*--------------------------------------------------------------------*/
ShaderFloatPrecisionCase::IterateResult ShaderFloatPrecisionCase::iterate (void)
{
	// Full-viewport quad drawn as two triangles.
	const float		quadPositions[]	=
	{
		-1.0f, -1.0f, 0.0f, 1.0f,
		-1.0f,  1.0f, 0.0f, 1.0f,
		 1.0f, -1.0f, 0.0f, 1.0f,
		 1.0f,  1.0f, 0.0f, 1.0f
	};
	const deUint16	quadIndices[]	= { 0, 1, 2, 2, 1, 3 };
	const int		vertexCount		= 4;

	// Per-vertex operand arrays; every vertex receives the same value.
	float			operand0[4]		= { 0.0f };
	float			operand1[4]		= { 0.0f };

	const glu::RenderContext&		renderCtx	= m_context.getRenderContext();
	const glw::Functions&			gl			= renderCtx.getFunctions();
	TestLog&						log			= m_testCtx.getLog();
	vector<glu::VertexArrayBinding>	bindings;

	// Image read from GL. The values are uint bit patterns stored in float slots.
	std::vector<float>				readback	(FRAMEBUFFER_WIDTH*FRAMEBUFFER_HEIGHT*4);

	// \todo [2012-05-03 pyry] Could be cached.
	const deUint32					programId	= m_program->getProgram();

	gl.useProgram(programId);
	gl.bindFramebuffer(GL_FRAMEBUFFER, m_framebuffer);

	bindings.push_back(glu::va::Float("a_position", 4, vertexCount, 0, &quadPositions[0]));
	bindings.push_back(glu::va::Float("a_in0", 1, vertexCount, 0, &operand0[0]));
	bindings.push_back(glu::va::Float("a_in1", 1, vertexCount, 0, &operand1[0]));

	GLU_EXPECT_NO_ERROR(gl.getError(), "After program setup");

	// Compute values and reference.
	for (int testNdx = 0; testNdx < m_numTestsPerIter; testNdx++)
	{
		const float		in0		= m_rnd.getFloat(m_rangeA.x(), m_rangeA.y());
		const float		in1		= m_rnd.getFloat(m_rangeB.x(), m_rangeB.y());
		const double	refD	= m_evalFunc((double)in0, (double)in1);
		const float		refF	= tcu::Float64(refD).asFloat(); // Uses RTE rounding mode.

		log << TestLog::Message << "iter " << m_iterNdx << ", test " << testNdx << ": "
			<< "in0 = " << in0 << " / " << tcu::toHex(tcu::Float32(in0).bits())
			<< ", in1 = " << in1 << " / " << tcu::toHex(tcu::Float32(in1).bits())
			<< TestLog::EndMessage;
		log << TestLog::Message << " reference = " << refF << " / " << tcu::toHex(tcu::Float32(refF).bits()) << TestLog::EndMessage;

		std::fill(&operand0[0], &operand0[0] + DE_LENGTH_OF_ARRAY(operand0), in0);
		std::fill(&operand1[0], &operand1[0] + DE_LENGTH_OF_ARRAY(operand1), in1);

		glu::draw(renderCtx, programId, (int)bindings.size(), &bindings[0],
				  glu::pr::Triangles(DE_LENGTH_OF_ARRAY(quadIndices), &quadIndices[0]));
		gl.readPixels(0, 0, FRAMEBUFFER_WIDTH, FRAMEBUFFER_HEIGHT, GL_RGBA_INTEGER, GL_UNSIGNED_INT, &readback[0]);
		GLU_EXPECT_NO_ERROR(gl.getError(), "After render");

		log << TestLog::Message << " result = " << readback[0] << " / " << tcu::toHex(tcu::Float32(readback[0]).bits()) << TestLog::EndMessage;

		// Verify results: first the value itself, then consistency across the framebuffer.
		if (!compare(in0, in1, refD, readback[0]))
		{
			m_testCtx.setTestResult(QP_TEST_RESULT_FAIL, "Result comparison failed");
		}
		else
		{
			const deUint32	expectedBits	= tcu::Float32(readback[0]).bits();
			bool			consistent		= true;

			// All mismatches on the first offending row are logged; later rows are skipped.
			for (int y = 0; y < FRAMEBUFFER_HEIGHT && consistent; y++)
			{
				for (int x = 0; x < FRAMEBUFFER_WIDTH; x++)
				{
					const deUint32 pixelBits = tcu::Float32(readback[(y*FRAMEBUFFER_WIDTH + x)*4]).bits();

					if (pixelBits == expectedBits)
						continue;

					log << TestLog::Message << "ERROR: Inconsistent results, got " << tcu::toHex(pixelBits) << " at (" << x << ", " << y << ")" << TestLog::EndMessage;
					consistent = false;
				}
			}

			if (!consistent)
				m_testCtx.setTestResult(QP_TEST_RESULT_FAIL, "Inconsistent values in framebuffer");
		}

		if (m_testCtx.getTestResult() != QP_TEST_RESULT_PASS)
			break;
	}

	gl.bindFramebuffer(GL_FRAMEBUFFER, renderCtx.getDefaultFramebuffer());
	GLU_EXPECT_NO_ERROR(gl.getError(), "After iteration");

	m_iterNdx += 1;

	if (m_iterNdx < m_numIters && m_testCtx.getTestResult() == QP_TEST_RESULT_PASS)
		return CONTINUE;

	return STOP;
}
/*--------------------------------------------------------------------*//*!
 * \brief Signed integer arithmetic precision test case.
 *
 * Evaluates a GLSL expression on random operand pairs in either the vertex
 * or the fragment shader, reads the result back from an R32I render target
 * and compares its low m_bits bits against a host reference.
 *//*--------------------------------------------------------------------*/
class ShaderIntPrecisionCase : public TestCase
{
public:
//! Host-side reference for the tested operation.
typedef int (*EvalFunc) (int a, int b);
ShaderIntPrecisionCase (Context& context, const char* name, const char* desc, const char* op, EvalFunc evalFunc, glu::Precision precision, int bits, const tcu::IVec2& rangeA, const tcu::IVec2& rangeB, bool isVertexCase);
~ShaderIntPrecisionCase (void);
void init (void);
void deinit (void);
IterateResult iterate (void);
private:
// Copy construction and assignment are declared private to forbid copying.
ShaderIntPrecisionCase (const ShaderIntPrecisionCase& other);
ShaderIntPrecisionCase& operator= (const ShaderIntPrecisionCase& other);
// Case parameters.
std::string m_op; //!< GLSL expression evaluated in the shader (operands are in0 and in1).
EvalFunc m_evalFunc; //!< Host reference implementation of m_op.
glu::Precision m_precision; //!< Precision qualifier under test.
int m_bits; //!< Number of low-order bits that are generated and compared.
tcu::IVec2 m_rangeA; //!< Range for in0: x() is the lower bound, y() the upper bound.
tcu::IVec2 m_rangeB; //!< Range for in1: x() is the lower bound, y() the upper bound.
bool m_isVertexCase; //!< True when the expression is evaluated in the vertex shader.
int m_numTestsPerIter; //!< Number of random operand pairs tested per iterate() call.
int m_numIters; //!< Number of iterate() calls before the case stops.
de::Random m_rnd; //!< Operand generator, seeded from the case name.
// Iteration state.
glu::ShaderProgram* m_program; //!< Owned; created in init(), deleted in deinit().
deUint32 m_framebuffer; //!< GL framebuffer object name, 0 when not created.
deUint32 m_renderbuffer; //!< GL renderbuffer object name, 0 when not created.
int m_iterNdx; //!< Index of the next iteration to run.
};
//! Stores the case parameters. No GL objects are created here; that happens in init().
ShaderIntPrecisionCase::ShaderIntPrecisionCase (Context& context, const char* name, const char* desc, const char* op, EvalFunc evalFunc, glu::Precision precision, int bits, const tcu::IVec2& rangeA, const tcu::IVec2& rangeB, bool isVertexCase)
: TestCase (context, name, desc)
, m_op (op)
, m_evalFunc (evalFunc)
, m_precision (precision)
, m_bits (bits)
, m_rangeA (rangeA)
, m_rangeB (rangeB)
, m_isVertexCase (isVertexCase)
, m_numTestsPerIter (32)
, m_numIters (4)
, m_rnd (deStringHash(name)) // Seed derived from the case name.
, m_program (DE_NULL)
, m_framebuffer (0)
, m_renderbuffer (0)
, m_iterNdx (0)
{
}
//! Releases the program and GL objects if they are still alive.
ShaderIntPrecisionCase::~ShaderIntPrecisionCase (void)
{
// Class-qualified call: always runs this class's deinit().
ShaderIntPrecisionCase::deinit();
}
void ShaderIntPrecisionCase::init (void)
{
const glw::Functions& gl = m_context.getRenderContext().getFunctions();
TestLog& log = m_testCtx.getLog();
DE_ASSERT(!m_program && !m_framebuffer && !m_renderbuffer);
// Create program.
m_program = createIntUintPrecisionEvalProgram(m_context.getRenderContext(), glu::TYPE_INT, m_precision, m_op.c_str(), m_isVertexCase);
log << *m_program;
TCU_CHECK(m_program->isOk());
// Create framebuffer.
gl.genFramebuffers(1, &m_framebuffer);
gl.genRenderbuffers(1, &m_renderbuffer);
gl.bindRenderbuffer(GL_RENDERBUFFER, m_renderbuffer);
gl.renderbufferStorage(GL_RENDERBUFFER, GL_R32I, FRAMEBUFFER_WIDTH, FRAMEBUFFER_HEIGHT);
gl.bindFramebuffer(GL_FRAMEBUFFER, m_framebuffer);
gl.framebufferRenderbuffer(GL_FRAMEBUFFER, GL_COLOR_ATTACHMENT0, GL_RENDERBUFFER, m_renderbuffer);
GLU_EXPECT_NO_ERROR(gl.getError(), "Post framebuffer setup");
TCU_CHECK(gl.checkFramebufferStatus(GL_FRAMEBUFFER) == GL_FRAMEBUFFER_COMPLETE);
gl.bindFramebuffer(GL_FRAMEBUFFER, m_context.getRenderContext().getDefaultFramebuffer());
// Initialize test result to pass.
m_testCtx.setTestResult(QP_TEST_RESULT_PASS, "Pass");
m_iterNdx = 0;
log << TestLog::Message << "Number of accurate bits assumed = " << m_bits << TestLog::EndMessage;
}
/*--------------------------------------------------------------------*//*!
 * \brief Delete the program and GL objects and reset the handles.
 *
 * Safe to call when nothing has been created: GL deletes are skipped for
 * zero handles.
 *//*--------------------------------------------------------------------*/
void ShaderIntPrecisionCase::deinit (void)
{
	delete m_program;
	m_program = DE_NULL;

	if (m_framebuffer != 0)
	{
		m_context.getRenderContext().getFunctions().deleteFramebuffers(1, &m_framebuffer);
		m_framebuffer = 0;
	}

	if (m_renderbuffer != 0)
	{
		m_context.getRenderContext().getFunctions().deleteRenderbuffers(1, &m_renderbuffer);
		m_renderbuffer = 0;
	}
}
/*--------------------------------------------------------------------*//*!
 * \brief Run one batch of random signed integer tests.
 *
 * For each of m_numTestsPerIter operand pairs: generates operands limited
 * to m_bits bits (sign-extended to 32 bits), computes the reference on the
 * host, draws a full-viewport quad into the test framebuffer, reads the
 * pixels back and compares the low m_bits bits of every pixel against the
 * reference. The first mismatch fails the case.
 *
 * The default framebuffer binding is restored on every return path, so a
 * failing case does not leave its framebuffer object bound.
 *
 * \note NOTE(review): the reference is computed with m_evalFunc on int
 *		 operands; whether full-range inputs can overflow on the host
 *		 depends on the evaluation functions, which are defined outside
 *		 this file - confirm.
 *
 * \return CONTINUE while iterations remain, STOP after the last iteration
 *		   or on failure.
 *//*--------------------------------------------------------------------*/
ShaderIntPrecisionCase::IterateResult ShaderIntPrecisionCase::iterate (void)
{
	// Constant data: full-viewport quad drawn as two triangles.
	const float position[] =
	{
		-1.0f, -1.0f, 0.0f, 1.0f,
		-1.0f,  1.0f, 0.0f, 1.0f,
		 1.0f, -1.0f, 0.0f, 1.0f,
		 1.0f,  1.0f, 0.0f, 1.0f
	};
	const deUint16 indices[] = { 0, 1, 2, 2, 1, 3 };

	const int	numVertices	= 4;
	int			in0Arr[4]	= { 0 };
	int			in1Arr[4]	= { 0 };

	TestLog&						log			= m_testCtx.getLog();
	const glw::Functions&			gl			= m_context.getRenderContext().getFunctions();
	// Selects the low m_bits bits; a 32-bit shift is avoided for the full-width case.
	deUint32						mask		= m_bits == 32 ? 0xffffffffu : ((1u<<m_bits)-1);
	vector<int>						pixels		(FRAMEBUFFER_WIDTH*FRAMEBUFFER_HEIGHT*4);
	vector<glu::VertexArrayBinding>	vertexArrays;

	deUint32						prog		= m_program->getProgram();

	// \todo [2012-05-03 pyry] A bit hacky. getInt() should work fine with ranges like this.
	bool							isMaxRangeA	= m_rangeA.x() == (int)0x80000000 && m_rangeA.y() == (int)0x7fffffff;
	bool							isMaxRangeB	= m_rangeB.x() == (int)0x80000000 && m_rangeB.y() == (int)0x7fffffff;

	gl.useProgram(prog);
	gl.bindFramebuffer(GL_FRAMEBUFFER, m_framebuffer);

	vertexArrays.push_back(glu::va::Float("a_position", 4, numVertices, 0, &position[0]));
	vertexArrays.push_back(glu::va::Int32("a_in0", 1, numVertices, 0, &in0Arr[0]));
	vertexArrays.push_back(glu::va::Int32("a_in1", 1, numVertices, 0, &in1Arr[0]));

	GLU_EXPECT_NO_ERROR(gl.getError(), "After program setup");

	// Compute values and reference.
	for (int testNdx = 0; testNdx < m_numTestsPerIter; testNdx++)
	{
		// Full 32-bit ranges take raw random bits; other ranges go through getInt().
		int		in0			= deSignExtendTo32(((isMaxRangeA ? (int)m_rnd.getUint32() : m_rnd.getInt(m_rangeA.x(), m_rangeA.y())) & mask), m_bits);
		int		in1			= deSignExtendTo32(((isMaxRangeB ? (int)m_rnd.getUint32() : m_rnd.getInt(m_rangeB.x(), m_rangeB.y())) & mask), m_bits);
		int		refMasked	= m_evalFunc(in0, in1) & mask;
		int		refOut		= deSignExtendTo32(refMasked, m_bits);

		log << TestLog::Message << "iter " << m_iterNdx << ", test " << testNdx << ": "
			<< "in0 = " << in0 << ", in1 = " << in1 << ", ref out = " << refOut << " / " << tcu::toHex(refMasked)
			<< TestLog::EndMessage;

		// Every vertex receives the same operand values.
		std::fill(&in0Arr[0], &in0Arr[0] + DE_LENGTH_OF_ARRAY(in0Arr), in0);
		std::fill(&in1Arr[0], &in1Arr[0] + DE_LENGTH_OF_ARRAY(in1Arr), in1);

		glu::draw(m_context.getRenderContext(), prog, (int)vertexArrays.size(), &vertexArrays[0],
				  glu::pr::Triangles(DE_LENGTH_OF_ARRAY(indices), &indices[0]));
		gl.readPixels(0, 0, FRAMEBUFFER_WIDTH, FRAMEBUFFER_HEIGHT, GL_RGBA_INTEGER, GL_INT, &pixels[0]);
		GLU_EXPECT_NO_ERROR(gl.getError(), "After render");

		// Compare pixels. Only the first of the four read-back components is checked.
		for (int y = 0; y < FRAMEBUFFER_HEIGHT; y++)
		{
			for (int x = 0; x < FRAMEBUFFER_WIDTH; x++)
			{
				int cmpOut		= pixels[(y*FRAMEBUFFER_WIDTH + x)*4];
				int cmpMasked	= cmpOut & mask;

				if (cmpMasked != refMasked)
				{
					log << TestLog::Message << "Comparison failed (at " << x << ", " << y << "): "
						<< "got " << cmpOut << " / " << tcu::toHex(cmpOut)
						<< TestLog::EndMessage;
					m_testCtx.setTestResult(QP_TEST_RESULT_FAIL, "Fail");

					// Do not leave the test framebuffer bound when bailing out early.
					gl.bindFramebuffer(GL_FRAMEBUFFER, m_context.getRenderContext().getDefaultFramebuffer());
					return STOP;
				}
			}
		}
	}

	gl.bindFramebuffer(GL_FRAMEBUFFER, m_context.getRenderContext().getDefaultFramebuffer());
	GLU_EXPECT_NO_ERROR(gl.getError(), "After iteration");

	m_iterNdx += 1;
	return (m_iterNdx < m_numIters) ? CONTINUE : STOP;
}
/*--------------------------------------------------------------------*//*!
 * \brief Unsigned integer arithmetic precision test case.
 *
 * Evaluates a GLSL expression on random operand pairs in either the vertex
 * or the fragment shader, reads the result back from an R32UI render
 * target and compares its low m_bits bits against a host reference.
 *//*--------------------------------------------------------------------*/
class ShaderUintPrecisionCase : public TestCase
{
public:
//! Host-side reference for the tested operation.
typedef deUint32 (*EvalFunc) (deUint32 a, deUint32 b);
ShaderUintPrecisionCase (Context& context, const char* name, const char* desc, const char* op, EvalFunc evalFunc, glu::Precision precision, int bits, const tcu::UVec2& rangeA, const tcu::UVec2& rangeB, bool isVertexCase);
~ShaderUintPrecisionCase (void);
void init (void);
void deinit (void);
IterateResult iterate (void);
private:
// Copy construction and assignment are declared private to forbid copying.
ShaderUintPrecisionCase (const ShaderUintPrecisionCase& other);
ShaderUintPrecisionCase& operator= (const ShaderUintPrecisionCase& other);
// Case parameters.
std::string m_op; //!< GLSL expression evaluated in the shader (operands are in0 and in1).
EvalFunc m_evalFunc; //!< Host reference implementation of m_op.
glu::Precision m_precision; //!< Precision qualifier under test.
int m_bits; //!< Number of low-order bits that are generated and compared.
tcu::UVec2 m_rangeA; //!< Range for in0: x() is the lower bound, y() the upper bound.
tcu::UVec2 m_rangeB; //!< Range for in1: x() is the lower bound, y() the upper bound.
bool m_isVertexCase; //!< True when the expression is evaluated in the vertex shader.
int m_numTestsPerIter; //!< Number of random operand pairs tested per iterate() call.
int m_numIters; //!< Number of iterate() calls before the case stops.
de::Random m_rnd; //!< Operand generator, seeded from the case name.
// Iteration state.
glu::ShaderProgram* m_program; //!< Owned; created in init(), deleted in deinit().
deUint32 m_framebuffer; //!< GL framebuffer object name, 0 when not created.
deUint32 m_renderbuffer; //!< GL renderbuffer object name, 0 when not created.
int m_iterNdx; //!< Index of the next iteration to run.
};
//! Stores the case parameters. No GL objects are created here; that happens in init().
ShaderUintPrecisionCase::ShaderUintPrecisionCase (Context& context, const char* name, const char* desc, const char* op, EvalFunc evalFunc, glu::Precision precision, int bits, const tcu::UVec2& rangeA, const tcu::UVec2& rangeB, bool isVertexCase)
: TestCase (context, name, desc)
, m_op (op)
, m_evalFunc (evalFunc)
, m_precision (precision)
, m_bits (bits)
, m_rangeA (rangeA)
, m_rangeB (rangeB)
, m_isVertexCase (isVertexCase)
, m_numTestsPerIter (32)
, m_numIters (4)
, m_rnd (deStringHash(name)) // Seed derived from the case name.
, m_program (DE_NULL)
, m_framebuffer (0)
, m_renderbuffer (0)
, m_iterNdx (0)
{
}
//! Releases the program and GL objects if they are still alive.
ShaderUintPrecisionCase::~ShaderUintPrecisionCase (void)
{
// Class-qualified call: always runs this class's deinit().
ShaderUintPrecisionCase::deinit();
}
void ShaderUintPrecisionCase::init (void)
{
const glw::Functions& gl = m_context.getRenderContext().getFunctions();
TestLog& log = m_testCtx.getLog();
DE_ASSERT(!m_program && !m_framebuffer && !m_renderbuffer);
// Create program.
m_program = createIntUintPrecisionEvalProgram(m_context.getRenderContext(), glu::TYPE_UINT, m_precision, m_op.c_str(), m_isVertexCase);
log << *m_program;
TCU_CHECK(m_program->isOk());
// Create framebuffer.
gl.genFramebuffers(1, &m_framebuffer);
gl.genRenderbuffers(1, &m_renderbuffer);
gl.bindRenderbuffer(GL_RENDERBUFFER, m_renderbuffer);
gl.renderbufferStorage(GL_RENDERBUFFER, GL_R32UI, FRAMEBUFFER_WIDTH, FRAMEBUFFER_HEIGHT);
gl.bindFramebuffer(GL_FRAMEBUFFER, m_framebuffer);
gl.framebufferRenderbuffer(GL_FRAMEBUFFER, GL_COLOR_ATTACHMENT0, GL_RENDERBUFFER, m_renderbuffer);
GLU_EXPECT_NO_ERROR(gl.getError(), "Post framebuffer setup");
TCU_CHECK(gl.checkFramebufferStatus(GL_FRAMEBUFFER) == GL_FRAMEBUFFER_COMPLETE);
gl.bindFramebuffer(GL_FRAMEBUFFER, m_context.getRenderContext().getDefaultFramebuffer());
// Initialize test result to pass.
m_testCtx.setTestResult(QP_TEST_RESULT_PASS, "Pass");
m_iterNdx = 0;
log << TestLog::Message << "Number of accurate bits assumed = " << m_bits << TestLog::EndMessage;
}
/*--------------------------------------------------------------------*//*!
 * \brief Delete the program and GL objects and reset the handles.
 *
 * Safe to call when nothing has been created: GL deletes are skipped for
 * zero handles.
 *//*--------------------------------------------------------------------*/
void ShaderUintPrecisionCase::deinit (void)
{
	delete m_program;
	m_program = DE_NULL;

	if (m_framebuffer != 0)
	{
		m_context.getRenderContext().getFunctions().deleteFramebuffers(1, &m_framebuffer);
		m_framebuffer = 0;
	}

	if (m_renderbuffer != 0)
	{
		m_context.getRenderContext().getFunctions().deleteRenderbuffers(1, &m_renderbuffer);
		m_renderbuffer = 0;
	}
}
/*--------------------------------------------------------------------*//*!
 * \brief Run one batch of random unsigned integer tests.
 *
 * For each of m_numTestsPerIter operand pairs: generates operands limited
 * to m_bits bits, computes the reference on the host, draws a
 * full-viewport quad into the test framebuffer, reads the pixels back and
 * compares the low m_bits bits of every pixel against the reference. The
 * first mismatch fails the case.
 *
 * The render context's default framebuffer (which is not necessarily
 * object 0) is re-bound on every return path, matching the other
 * precision cases in this file.
 *
 * \return CONTINUE while iterations remain, STOP after the last iteration
 *		   or on failure.
 *//*--------------------------------------------------------------------*/
ShaderUintPrecisionCase::IterateResult ShaderUintPrecisionCase::iterate (void)
{
	// Constant data: full-viewport quad drawn as two triangles.
	const float position[] =
	{
		-1.0f, -1.0f, 0.0f, 1.0f,
		-1.0f,  1.0f, 0.0f, 1.0f,
		 1.0f, -1.0f, 0.0f, 1.0f,
		 1.0f,  1.0f, 0.0f, 1.0f
	};
	const deUint16 indices[] = { 0, 1, 2, 2, 1, 3 };

	const int	numVertices	= 4;
	deUint32	in0Arr[4]	= { 0 };
	deUint32	in1Arr[4]	= { 0 };

	TestLog&						log			= m_testCtx.getLog();
	const glw::Functions&			gl			= m_context.getRenderContext().getFunctions();
	const deUint32					defaultFbo	= m_context.getRenderContext().getDefaultFramebuffer();
	// Selects the low m_bits bits; a 32-bit shift is avoided for the full-width case.
	deUint32						mask		= m_bits == 32 ? 0xffffffffu : ((1u<<m_bits)-1);
	vector<deUint32>				pixels		(FRAMEBUFFER_WIDTH*FRAMEBUFFER_HEIGHT*4);
	vector<glu::VertexArrayBinding>	vertexArrays;

	deUint32						prog		= m_program->getProgram();

	// \todo [2012-05-03 pyry] A bit hacky.
	// The full 32-bit range is special-cased because (max - min + 1) would wrap to 0 below.
	bool							isMaxRangeA	= m_rangeA.x() == 0 && m_rangeA.y() == 0xffffffff;
	bool							isMaxRangeB	= m_rangeB.x() == 0 && m_rangeB.y() == 0xffffffff;

	gl.useProgram(prog);
	gl.bindFramebuffer(GL_FRAMEBUFFER, m_framebuffer);

	vertexArrays.push_back(glu::va::Float("a_position", 4, numVertices, 0, &position[0]));
	vertexArrays.push_back(glu::va::Uint32("a_in0", 1, numVertices, 0, &in0Arr[0]));
	vertexArrays.push_back(glu::va::Uint32("a_in1", 1, numVertices, 0, &in1Arr[0]));

	GLU_EXPECT_NO_ERROR(gl.getError(), "After program setup");

	// Compute values and reference.
	for (int testNdx = 0; testNdx < m_numTestsPerIter; testNdx++)
	{
		deUint32	in0		= (isMaxRangeA ? m_rnd.getUint32() : (m_rangeA.x() + m_rnd.getUint32()%(m_rangeA.y()-m_rangeA.x()+1))) & mask;
		deUint32	in1		= (isMaxRangeB ? m_rnd.getUint32() : (m_rangeB.x() + m_rnd.getUint32()%(m_rangeB.y()-m_rangeB.x()+1))) & mask;
		deUint32	refOut	= m_evalFunc(in0, in1) & mask;

		log << TestLog::Message << "iter " << m_iterNdx << ", test " << testNdx << ": "
			<< "in0 = " << tcu::toHex(in0) << ", in1 = " << tcu::toHex(in1) << ", ref out = " << tcu::toHex(refOut)
			<< TestLog::EndMessage;

		// Every vertex receives the same operand values.
		std::fill(&in0Arr[0], &in0Arr[0] + DE_LENGTH_OF_ARRAY(in0Arr), in0);
		std::fill(&in1Arr[0], &in1Arr[0] + DE_LENGTH_OF_ARRAY(in1Arr), in1);

		glu::draw(m_context.getRenderContext(), prog, (int)vertexArrays.size(), &vertexArrays[0],
				  glu::pr::Triangles(DE_LENGTH_OF_ARRAY(indices), &indices[0]));
		gl.readPixels(0, 0, FRAMEBUFFER_WIDTH, FRAMEBUFFER_HEIGHT, GL_RGBA_INTEGER, GL_UNSIGNED_INT, &pixels[0]);
		GLU_EXPECT_NO_ERROR(gl.getError(), "After render");

		// Compare pixels. Only the first of the four read-back components is checked.
		for (int y = 0; y < FRAMEBUFFER_HEIGHT; y++)
		{
			for (int x = 0; x < FRAMEBUFFER_WIDTH; x++)
			{
				deUint32 cmpOut		= pixels[(y*FRAMEBUFFER_WIDTH + x)*4];
				deUint32 cmpMasked	= cmpOut & mask;

				if (cmpMasked != refOut)
				{
					log << TestLog::Message << "Comparison failed (at " << x << ", " << y << "): "
						<< "got " << tcu::toHex(cmpOut)
						<< TestLog::EndMessage;
					m_testCtx.setTestResult(QP_TEST_RESULT_FAIL, "Fail");

					// Do not leave the test framebuffer bound when bailing out early.
					gl.bindFramebuffer(GL_FRAMEBUFFER, defaultFbo);
					return STOP;
				}
			}
		}
	}

	// Re-bind the context's default framebuffer rather than assuming it is object 0.
	gl.bindFramebuffer(GL_FRAMEBUFFER, defaultFbo);
	GLU_EXPECT_NO_ERROR(gl.getError(), "After iteration");

	m_iterNdx += 1;
	return (m_iterNdx < m_numIters) ? CONTINUE : STOP;
}
//! Creates the "precision" test group; child cases are added in init().
ShaderPrecisionTests::ShaderPrecisionTests (Context& context)
: TestCaseGroup(context, "precision", "Shader precision requirements validation tests")
{
}
//! Nothing to release in this class's destructor.
ShaderPrecisionTests::~ShaderPrecisionTests (void)
{
}
/*--------------------------------------------------------------------*//*!
 * \brief Populate the group with float, int and uint precision cases.
 *
 * Three sub-groups ("float", "int", "uint") are created. Every table entry
 * yields two cases, "<name>_vertex" followed by "<name>_fragment", that
 * evaluate the same expression in the respective shader stage.
 *//*--------------------------------------------------------------------*/
void ShaderPrecisionTests::init (void)
{
	using tcu::add;
	using tcu::sub;
	using tcu::mul;
	using tcu::div;
	using tcu::Vec2;
	using tcu::IVec2;
	using tcu::UVec2;

	// Float range limits. Exp = Emax-2, Mantissa = 0
	float		minF32			= tcu::Float32((1u<<31) | (0xfdu<<23) | 0x0u).asFloat();
	float		maxF32			= tcu::Float32((0u<<31) | (0xfdu<<23) | 0x0u).asFloat();
	float		minF16			= tcu::Float16((deUint16)((1u<<15) | (0x1du<<10) | 0x0u)).asFloat();
	float		maxF16			= tcu::Float16((deUint16)((0u<<15) | (0x1du<<10) | 0x0u)).asFloat();

	// Operand ranges shared by several table entries.
	tcu::Vec2	fullRange32F	(minF32, maxF32);
	tcu::Vec2	fullRange16F	(minF16, maxF16);
	tcu::IVec2	fullRange32I	(0x80000000, 0x7fffffff);
	tcu::IVec2	fullRange16I	(-(1<<15), (1<<15)-1);
	tcu::IVec2	fullRange8I		(-(1<<7), (1<<7)-1);
	tcu::UVec2	fullRange32U	(0u, 0xffffffffu);
	tcu::UVec2	fullRange16U	(0u, 0xffffu);
	tcu::UVec2	fullRange8U		(0u, 0xffu);

	// \note Right now it is not programmatically verified that the results shouldn't end up being inf/nan but
	//       actual values used are ok.
	static const struct
	{
		const char*							name;
		const char*							op;
		ShaderFloatPrecisionCase::EvalFunc	evalFunc;
		glu::Precision						precision;
		tcu::Vec2							rangeA;
		tcu::Vec2							rangeB;
	} floatCases[] =
	{
		// Name				Op				Eval			Precision					RangeA				RangeB
		{ "highp_add",		"in0 + in1",	add<double>,	glu::PRECISION_HIGHP,		fullRange32F,		fullRange32F		},
		{ "highp_sub",		"in0 - in1",	sub<double>,	glu::PRECISION_HIGHP,		fullRange32F,		fullRange32F		},
		{ "highp_mul",		"in0 * in1",	mul<double>,	glu::PRECISION_HIGHP,		Vec2(-1e5f, 1e5f),	Vec2(-1e5f, 1e5f)	},
		{ "highp_div",		"in0 / in1",	div<double>,	glu::PRECISION_HIGHP,		Vec2(-1e5f, 1e5f),	Vec2(-1e5f, 1e5f)	},
		{ "mediump_add",	"in0 + in1",	add<double>,	glu::PRECISION_MEDIUMP,		fullRange16F,		fullRange16F		},
		{ "mediump_sub",	"in0 - in1",	sub<double>,	glu::PRECISION_MEDIUMP,		fullRange16F,		fullRange16F		},
		{ "mediump_mul",	"in0 * in1",	mul<double>,	glu::PRECISION_MEDIUMP,		Vec2(-1e2f, 1e2f),	Vec2(-1e2f, 1e2f)	},
		{ "mediump_div",	"in0 / in1",	div<double>,	glu::PRECISION_MEDIUMP,		Vec2(-1e2f, 1e2f),	Vec2(-1e2f, 1e2f)	}
	};

	static const struct
	{
		const char*							name;
		const char*							op;
		ShaderIntPrecisionCase::EvalFunc	evalFunc;
		glu::Precision						precision;
		int									bits;
		tcu::IVec2							rangeA;
		tcu::IVec2							rangeB;
	} intCases[] =
	{
		// Name				Op				Eval		Precision					Bits	RangeA			RangeB
		{ "highp_add",		"in0 + in1",	add<int>,	glu::PRECISION_HIGHP,		32,		fullRange32I,	fullRange32I		},
		{ "highp_sub",		"in0 - in1",	sub<int>,	glu::PRECISION_HIGHP,		32,		fullRange32I,	fullRange32I		},
		{ "highp_mul",		"in0 * in1",	mul<int>,	glu::PRECISION_HIGHP,		32,		fullRange32I,	fullRange32I		},
		{ "highp_div",		"in0 / in1",	div<int>,	glu::PRECISION_HIGHP,		32,		fullRange32I,	IVec2(-10000, -1)	},
		{ "mediump_add",	"in0 + in1",	add<int>,	glu::PRECISION_MEDIUMP,		16,		fullRange16I,	fullRange16I		},
		{ "mediump_sub",	"in0 - in1",	sub<int>,	glu::PRECISION_MEDIUMP,		16,		fullRange16I,	fullRange16I		},
		{ "mediump_mul",	"in0 * in1",	mul<int>,	glu::PRECISION_MEDIUMP,		16,		fullRange16I,	fullRange16I		},
		{ "mediump_div",	"in0 / in1",	div<int>,	glu::PRECISION_MEDIUMP,		16,		fullRange16I,	IVec2(1, 1000)		},
		{ "lowp_add",		"in0 + in1",	add<int>,	glu::PRECISION_LOWP,		8,		fullRange8I,	fullRange8I			},
		{ "lowp_sub",		"in0 - in1",	sub<int>,	glu::PRECISION_LOWP,		8,		fullRange8I,	fullRange8I			},
		{ "lowp_mul",		"in0 * in1",	mul<int>,	glu::PRECISION_LOWP,		8,		fullRange8I,	fullRange8I			},
		{ "lowp_div",		"in0 / in1",	div<int>,	glu::PRECISION_LOWP,		8,		fullRange8I,	IVec2(-50, -1)		}
	};

	static const struct
	{
		const char*							name;
		const char*							op;
		ShaderUintPrecisionCase::EvalFunc	evalFunc;
		glu::Precision						precision;
		int									bits;
		tcu::UVec2							rangeA;
		tcu::UVec2							rangeB;
	} uintCases[] =
	{
		// Name				Op				Eval			Precision					Bits	RangeA			RangeB
		{ "highp_add",		"in0 + in1",	add<deUint32>,	glu::PRECISION_HIGHP,		32,		fullRange32U,	fullRange32U		},
		{ "highp_sub",		"in0 - in1",	sub<deUint32>,	glu::PRECISION_HIGHP,		32,		fullRange32U,	fullRange32U		},
		{ "highp_mul",		"in0 * in1",	mul<deUint32>,	glu::PRECISION_HIGHP,		32,		fullRange32U,	fullRange32U		},
		{ "highp_div",		"in0 / in1",	div<deUint32>,	glu::PRECISION_HIGHP,		32,		fullRange32U,	UVec2(1u, 10000u)	},
		{ "mediump_add",	"in0 + in1",	add<deUint32>,	glu::PRECISION_MEDIUMP,		16,		fullRange16U,	fullRange16U		},
		{ "mediump_sub",	"in0 - in1",	sub<deUint32>,	glu::PRECISION_MEDIUMP,		16,		fullRange16U,	fullRange16U		},
		{ "mediump_mul",	"in0 * in1",	mul<deUint32>,	glu::PRECISION_MEDIUMP,		16,		fullRange16U,	fullRange16U		},
		{ "mediump_div",	"in0 / in1",	div<deUint32>,	glu::PRECISION_MEDIUMP,		16,		fullRange16U,	UVec2(1, 1000u)		},
		{ "lowp_add",		"in0 + in1",	add<deUint32>,	glu::PRECISION_LOWP,		8,		fullRange8U,	fullRange8U			},
		{ "lowp_sub",		"in0 - in1",	sub<deUint32>,	glu::PRECISION_LOWP,		8,		fullRange8U,	fullRange8U			},
		{ "lowp_mul",		"in0 * in1",	mul<deUint32>,	glu::PRECISION_LOWP,		8,		fullRange8U,	fullRange8U			},
		{ "lowp_div",		"in0 / in1",	div<deUint32>,	glu::PRECISION_LOWP,		8,		fullRange8U,	UVec2(1, 50u)		}
	};

	// Stage index 0 is the vertex variant, 1 the fragment variant; this keeps the child order
	// "<name>_vertex", "<name>_fragment" for every table entry.
	const int numStages = 2;

	// Floating-point cases.
	tcu::TestCaseGroup* floatGroup = new tcu::TestCaseGroup(m_testCtx, "float", "Floating-point precision tests");
	addChild(floatGroup);

	for (int caseNdx = 0; caseNdx < DE_LENGTH_OF_ARRAY(floatCases); caseNdx++)
	{
		for (int stageNdx = 0; stageNdx < numStages; stageNdx++)
		{
			const bool		isVertexCase	= (stageNdx == 0);
			const string	caseName		= string(floatCases[caseNdx].name) + (isVertexCase ? "_vertex" : "_fragment");

			floatGroup->addChild(new ShaderFloatPrecisionCase(m_context,
															  caseName.c_str(), "",
															  floatCases[caseNdx].op,
															  floatCases[caseNdx].evalFunc,
															  floatCases[caseNdx].precision,
															  floatCases[caseNdx].rangeA,
															  floatCases[caseNdx].rangeB,
															  isVertexCase));
		}
	}

	// Signed integer cases.
	tcu::TestCaseGroup* intGroup = new tcu::TestCaseGroup(m_testCtx, "int", "Integer precision tests");
	addChild(intGroup);

	for (int caseNdx = 0; caseNdx < DE_LENGTH_OF_ARRAY(intCases); caseNdx++)
	{
		for (int stageNdx = 0; stageNdx < numStages; stageNdx++)
		{
			const bool		isVertexCase	= (stageNdx == 0);
			const string	caseName		= string(intCases[caseNdx].name) + (isVertexCase ? "_vertex" : "_fragment");

			intGroup->addChild(new ShaderIntPrecisionCase(m_context,
														  caseName.c_str(), "",
														  intCases[caseNdx].op,
														  intCases[caseNdx].evalFunc,
														  intCases[caseNdx].precision,
														  intCases[caseNdx].bits,
														  intCases[caseNdx].rangeA,
														  intCases[caseNdx].rangeB,
														  isVertexCase));
		}
	}

	// Unsigned integer cases.
	tcu::TestCaseGroup* uintGroup = new tcu::TestCaseGroup(m_testCtx, "uint", "Unsigned integer precision tests");
	addChild(uintGroup);

	for (int caseNdx = 0; caseNdx < DE_LENGTH_OF_ARRAY(uintCases); caseNdx++)
	{
		for (int stageNdx = 0; stageNdx < numStages; stageNdx++)
		{
			const bool		isVertexCase	= (stageNdx == 0);
			const string	caseName		= string(uintCases[caseNdx].name) + (isVertexCase ? "_vertex" : "_fragment");

			uintGroup->addChild(new ShaderUintPrecisionCase(m_context,
															caseName.c_str(), "",
															uintCases[caseNdx].op,
															uintCases[caseNdx].evalFunc,
															uintCases[caseNdx].precision,
															uintCases[caseNdx].bits,
															uintCases[caseNdx].rangeA,
															uintCases[caseNdx].rangeB,
															isVertexCase));
		}
	}
}
} // Functional
} // gles3
} // deqp