modules/gles31/functional/es31fShaderSharedVarTests.cpp - third_party/vulkan-cts - Git at Google

 /*-------------------------------------------------------------------------
  * drawElements Quality Program OpenGL ES 3.1 Module
  * -------------------------------------------------
  *
  * Copyright 2014 The Android Open Source Project
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
  * You may obtain a copy of the License at
  *
  *      http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  *
  *//*!
  * \file
  * \brief GLSL Shared variable tests.
  *//*--------------------------------------------------------------------*/

 #include "es31fShaderSharedVarTests.hpp"
 #include "es31fShaderAtomicOpTests.hpp"
 #include "gluShaderProgram.hpp"
 #include "gluShaderUtil.hpp"
 #include "gluRenderContext.hpp"
 #include "gluObjectWrapper.hpp"
 #include "gluProgramInterfaceQuery.hpp"
 #include "tcuVector.hpp"
 #include "tcuTestLog.hpp"
 #include "tcuVectorUtil.hpp"
 #include "tcuFormatUtil.hpp"
 #include "deRandom.hpp"
 #include "deArrayUtil.hpp"
 #include "glwFunctions.hpp"
 #include "glwEnums.hpp"

 #include <algorithm>
 #include <set>

 namespace deqp
 {
 namespace gles31
 {
 namespace Functional
 {

 using std::string;
 using std::vector;
 using tcu::TestLog;
 using tcu::UVec3;
 using std::set;
 using namespace glu;

 enum
 {
 	MAX_VALUE_ARRAY_LENGTH	= 15	// * 2 * sizeof(mat4) + sizeof(int) = 481 uniform components (limit 512)
 };

 template<typename T, int Size>
 static inline T product (const tcu::Vector<T, Size>& v)
 {
 	T res = v[0];
 	for (int ndx = 1; ndx < Size; ndx++)
 		res *= v[ndx];
 	return res;
 }

 class SharedBasicVarCase : public TestCase
 {
 public:
 							SharedBasicVarCase		(Context& context, const char* name, DataType basicType, Precision precision, const tcu::UVec3& workGroupSize);
 							~SharedBasicVarCase		(void);

 	void					init					(void);
 	void					deinit					(void);
 	IterateResult			iterate					(void);

 private:
 							SharedBasicVarCase		(const SharedBasicVarCase& other);
 	SharedBasicVarCase&		operator=				(const SharedBasicVarCase& other);

 	const DataType			m_basicType;
 	const Precision			m_precision;
 	const tcu::UVec3		m_workGroupSize;

 	ShaderProgram*			m_program;
 };

 static std::string getBasicCaseDescription (DataType basicType, Precision precision, const tcu::UVec3& workGroupSize)
 {
 	std::ostringstream str;
 	if (precision != PRECISION_LAST)
 		str << getPrecisionName(precision) << " ";
 	str << getDataTypeName(basicType) << ", work group size = " << workGroupSize;
 	return str.str();
 }

 SharedBasicVarCase::SharedBasicVarCase (Context& context, const char* name, DataType basicType, Precision precision, const tcu::UVec3& workGroupSize)
 	: TestCase			(context, name, getBasicCaseDescription(basicType, precision, workGroupSize).c_str())
 	, m_basicType		(basicType)
 	, m_precision		(precision)
 	, m_workGroupSize	(workGroupSize)
 	, m_program			(DE_NULL)
 {
 }

 SharedBasicVarCase::~SharedBasicVarCase (void)
 {
 	SharedBasicVarCase::deinit();
 }

 void SharedBasicVarCase::init (void)
 {
 	const int			valArrayLength	= de::min<int>(MAX_VALUE_ARRAY_LENGTH, product(m_workGroupSize));
 	const char*			precName		= m_precision != glu::PRECISION_LAST ? getPrecisionName(m_precision) : "";
 	const char*			typeName		= getDataTypeName(m_basicType);
 	std::ostringstream	src;

 	src << "#version 310 es\n"
 		<< "layout (local_size_x = " << m_workGroupSize[0]
 		<< ", local_size_y = " << m_workGroupSize[1]
 		<< ", local_size_z = " << m_workGroupSize[2]
 		<< ") in;\n"
 		<< "const uint LOCAL_SIZE = gl_WorkGroupSize.x*gl_WorkGroupSize.y*gl_WorkGroupSize.z;\n"
 		<< "shared " << precName << " " << typeName << " s_var;\n"
 		<< "uniform " << precName << " " << typeName << " u_val[" << valArrayLength << "];\n"
 		<< "uniform " << precName << " " << typeName << " u_ref[" << valArrayLength << "];\n"
 		<< "uniform uint u_numIters;\n"
 		<< "layout(binding = 0) buffer Result\n"
 		<< "{\n"
 		<< "	bool isOk[LOCAL_SIZE];\n"
 		<< "};\n"
 		<< "\n"
 		<< "void main (void)\n"
 		<< "{\n"
 		<< "	bool allOk = true;\n"
 		<< "	for (uint ndx = 0u; ndx < u_numIters; ndx++)\n"
 		<< "	{\n"
 		<< "		if (ndx == gl_LocalInvocationIndex)\n"
 		<< "			s_var = u_val[ndx%uint(u_val.length())];\n"
 		<< "\n"
 		<< "		barrier();\n"
 		<< "\n"
 		<< "		if (s_var != u_ref[ndx%uint(u_ref.length())])\n"
 		<< "			allOk = false;\n"
 		<< "\n"
 		<< "		barrier();\n"
 		<< "	}\n"
 		<< "\n"
 		<< "	isOk[gl_LocalInvocationIndex] = allOk;\n"
 		<< "}\n";

 	DE_ASSERT(!m_program);
 	m_program = new ShaderProgram(m_context.getRenderContext(), ProgramSources() << ComputeSource(src.str()));

 	m_testCtx.getLog() << *m_program;

 	if (!m_program->isOk())
 	{
 		delete m_program;
 		m_program = DE_NULL;
 		throw tcu::TestError("Compile failed");
 	}
 }

 void SharedBasicVarCase::deinit (void)
 {
 	delete m_program;
 	m_program = DE_NULL;
 }

 SharedBasicVarCase::IterateResult SharedBasicVarCase::iterate (void)
 {
 	const glw::Functions&		gl				= m_context.getRenderContext().getFunctions();
 	const deUint32				program			= m_program->getProgram();
 	Buffer						outputBuffer	(m_context.getRenderContext());
 	const deUint32				outBlockNdx		= gl.getProgramResourceIndex(program, GL_SHADER_STORAGE_BLOCK, "Result");
 	const InterfaceBlockInfo	outBlockInfo	= getProgramInterfaceBlockInfo(gl, program, GL_SHADER_STORAGE_BLOCK, outBlockNdx);

 	gl.useProgram(program);

 	// Setup input values.
 	{
 		const int		numValues		= (int)product(m_workGroupSize);
 		const int		valLoc			= gl.getUniformLocation(program, "u_val[0]");
 		const int		refLoc			= gl.getUniformLocation(program, "u_ref[0]");
 		const int		iterCountLoc	= gl.getUniformLocation(program, "u_numIters");
 		const int		scalarSize		= getDataTypeScalarSize(m_basicType);

 		if (isDataTypeFloatOrVec(m_basicType))
 		{
 			const int		maxInt			= m_precision == glu::PRECISION_LOWP ? 2 : 1024;
 			const int		minInt			= -de::min(numValues/2, maxInt);
 			vector<float>	values			(numValues*scalarSize);

 			for (int ndx = 0; ndx < (int)values.size(); ndx++)
 				values[ndx] = float(minInt + (ndx % (maxInt-minInt+1)));

 			for (int uNdx = 0; uNdx < 2; uNdx++)
 			{
 				const int location = uNdx == 1 ? refLoc : valLoc;

 				if (scalarSize == 1)		gl.uniform1fv(location, numValues, &values[0]);
 				else if (scalarSize == 2)	gl.uniform2fv(location, numValues, &values[0]);
 				else if (scalarSize == 3)	gl.uniform3fv(location, numValues, &values[0]);
 				else if (scalarSize == 4)	gl.uniform4fv(location, numValues, &values[0]);
 			}
 		}
 		else if (isDataTypeIntOrIVec(m_basicType))
 		{
 			const int		maxInt			= m_precision == glu::PRECISION_LOWP ? 64 : 1024;
 			const int		minInt			= -de::min(numValues/2, maxInt);
 			vector<int>		values			(numValues*scalarSize);

 			for (int ndx = 0; ndx < (int)values.size(); ndx++)
 				values[ndx] = minInt + (ndx % (maxInt-minInt+1));

 			for (int uNdx = 0; uNdx < 2; uNdx++)
 			{
 				const int location = uNdx == 1 ? refLoc : valLoc;

 				if (scalarSize == 1)		gl.uniform1iv(location, numValues, &values[0]);
 				else if (scalarSize == 2)	gl.uniform2iv(location, numValues, &values[0]);
 				else if (scalarSize == 3)	gl.uniform3iv(location, numValues, &values[0]);
 				else if (scalarSize == 4)	gl.uniform4iv(location, numValues, &values[0]);
 			}
 		}
 		else if (isDataTypeUintOrUVec(m_basicType))
 		{
 			const deUint32		maxInt		= m_precision == glu::PRECISION_LOWP ? 128 : 1024;
 			vector<deUint32>	values		(numValues*scalarSize);

 			for (int ndx = 0; ndx < (int)values.size(); ndx++)
 				values[ndx] = ndx % (maxInt+1);

 			for (int uNdx = 0; uNdx < 2; uNdx++)
 			{
 				const int location = uNdx == 1 ? refLoc : valLoc;

 				if (scalarSize == 1)		gl.uniform1uiv(location, numValues, &values[0]);
 				else if (scalarSize == 2)	gl.uniform2uiv(location, numValues, &values[0]);
 				else if (scalarSize == 3)	gl.uniform3uiv(location, numValues, &values[0]);
 				else if (scalarSize == 4)	gl.uniform4uiv(location, numValues, &values[0]);
 			}
 		}
 		else if (isDataTypeBoolOrBVec(m_basicType))
 		{
 			de::Random		rnd				(0x324f);
 			vector<int>		values			(numValues*scalarSize);

 			for (int ndx = 0; ndx < (int)values.size(); ndx++)
 				values[ndx] = rnd.getBool() ? 1 : 0;

 			for (int uNdx = 0; uNdx < 2; uNdx++)
 			{
 				const int location = uNdx == 1 ? refLoc : valLoc;

 				if (scalarSize == 1)		gl.uniform1iv(location, numValues, &values[0]);
 				else if (scalarSize == 2)	gl.uniform2iv(location, numValues, &values[0]);
 				else if (scalarSize == 3)	gl.uniform3iv(location, numValues, &values[0]);
 				else if (scalarSize == 4)	gl.uniform4iv(location, numValues, &values[0]);
 			}
 		}
 		else if (isDataTypeMatrix(m_basicType))
 		{
 			const int		maxInt			= m_precision == glu::PRECISION_LOWP ? 2 : 1024;
 			const int		minInt			= -de::min(numValues/2, maxInt);
 			vector<float>	values			(numValues*scalarSize);

 			for (int ndx = 0; ndx < (int)values.size(); ndx++)
 				values[ndx] = float(minInt + (ndx % (maxInt-minInt+1)));

 			for (int uNdx = 0; uNdx < 2; uNdx++)
 			{
 				const int location = uNdx == 1 ? refLoc : valLoc;

 				switch (m_basicType)
 				{
 					case TYPE_FLOAT_MAT2:	gl.uniformMatrix2fv  (location, numValues, DE_FALSE, &values[0]);	break;
 					case TYPE_FLOAT_MAT2X3:	gl.uniformMatrix2x3fv(location, numValues, DE_FALSE, &values[0]);	break;
 					case TYPE_FLOAT_MAT2X4:	gl.uniformMatrix2x4fv(location, numValues, DE_FALSE, &values[0]);	break;
 					case TYPE_FLOAT_MAT3X2:	gl.uniformMatrix3x2fv(location, numValues, DE_FALSE, &values[0]);	break;
 					case TYPE_FLOAT_MAT3:	gl.uniformMatrix3fv  (location, numValues, DE_FALSE, &values[0]);	break;
 					case TYPE_FLOAT_MAT3X4:	gl.uniformMatrix3x4fv(location, numValues, DE_FALSE, &values[0]);	break;
 					case TYPE_FLOAT_MAT4X2:	gl.uniformMatrix4x2fv(location, numValues, DE_FALSE, &values[0]);	break;
 					case TYPE_FLOAT_MAT4X3:	gl.uniformMatrix4x3fv(location, numValues, DE_FALSE, &values[0]);	break;
 					case TYPE_FLOAT_MAT4:	gl.uniformMatrix4fv  (location, numValues, DE_FALSE, &values[0]);	break;
 					default:
 						DE_ASSERT(false);
 				}
 			}
 		}

 		gl.uniform1ui(iterCountLoc, product(m_workGroupSize));
 		GLU_EXPECT_NO_ERROR(gl.getError(), "Input value setup failed");
 	}

 	// Setup output buffer.
 	{
 		vector<deUint8> emptyData(outBlockInfo.dataSize);
 		std::fill(emptyData.begin(), emptyData.end(), 0);

 		gl.bindBuffer(GL_SHADER_STORAGE_BUFFER, *outputBuffer);
 		gl.bufferData(GL_SHADER_STORAGE_BUFFER, outBlockInfo.dataSize, &emptyData[0], GL_STATIC_READ);
 		gl.bindBufferBase(GL_SHADER_STORAGE_BUFFER, 0, *outputBuffer);
 		GLU_EXPECT_NO_ERROR(gl.getError(), "Output buffer setup failed");
 	}

 	gl.dispatchCompute(1, 1, 1);

 	// Read back and compare
 	{
 		const deUint32				numValues	= product(m_workGroupSize);
 		const InterfaceVariableInfo	outVarInfo	= getProgramInterfaceVariableInfo(gl, program, GL_BUFFER_VARIABLE, outBlockInfo.activeVariables[0]);
 		const void*					resPtr		= gl.mapBufferRange(GL_SHADER_STORAGE_BUFFER, 0, outBlockInfo.dataSize, GL_MAP_READ_BIT);
 		const int					maxErrMsg	= 10;
 		int							numFailed	= 0;

 		GLU_EXPECT_NO_ERROR(gl.getError(), "glMapBufferRange()");
 		TCU_CHECK(resPtr);

 		for (deUint32 ndx = 0; ndx < numValues; ndx++)
 		{
 			const int resVal = *((const int*)((const deUint8*)resPtr + outVarInfo.offset + outVarInfo.arrayStride*ndx));

 			if (resVal == 0)
 			{
 				if (numFailed < maxErrMsg)
 					m_testCtx.getLog() << TestLog::Message << "ERROR: isOk[" << ndx << "] = " << resVal << " != true" << TestLog::EndMessage;
 				else if (numFailed == maxErrMsg)
 					m_testCtx.getLog() << TestLog::Message << "..." << TestLog::EndMessage;

 				numFailed += 1;
 			}
 		}

 		gl.unmapBuffer(GL_SHADER_STORAGE_BUFFER);
 		GLU_EXPECT_NO_ERROR(gl.getError(), "glUnmapBuffer()");

 		m_testCtx.getLog() << TestLog::Message << (numValues-numFailed) << " / " << numValues << " values passed" << TestLog::EndMessage;

 		m_testCtx.setTestResult(numFailed == 0 ? QP_TEST_RESULT_PASS	: QP_TEST_RESULT_FAIL,
 								numFailed == 0 ? "Pass"					: "Comparison failed");
 	}

 	return STOP;
 }

 ShaderSharedVarTests::ShaderSharedVarTests (Context& context)
 	: TestCaseGroup(context, "shared_var", "Shared Variable Tests")
 {
 }

 ShaderSharedVarTests::~ShaderSharedVarTests (void)
 {
 }

 void ShaderSharedVarTests::init (void)
 {
 	// .basic_type
 	{
 		tcu::TestCaseGroup *const basicTypeGroup = new tcu::TestCaseGroup(m_testCtx, "basic_type", "Basic Types");
 		addChild(basicTypeGroup);

 		for (int basicType = TYPE_FLOAT; basicType <= TYPE_BOOL_VEC4; basicType++)
 		{
 			if (glu::getDataTypeScalarType(DataType(basicType)) == glu::TYPE_DOUBLE)
 				continue;

 			if (glu::isDataTypeBoolOrBVec(DataType(basicType)))
 			{
 				const tcu::UVec3	workGroupSize	(2,1,3);
 				basicTypeGroup->addChild(new SharedBasicVarCase(m_context, getDataTypeName(DataType(basicType)), DataType(basicType), PRECISION_LAST, workGroupSize));
 			}
 			else
 			{
 				for (int precision = 0; precision < PRECISION_LAST; precision++)
 				{
 					const tcu::UVec3	workGroupSize	(2,1,3);
 					const string		name			= string(getDataTypeName(DataType(basicType))) + "_" + getPrecisionName(Precision(precision));

 					basicTypeGroup->addChild(new SharedBasicVarCase(m_context, name.c_str(), DataType(basicType), Precision(precision), workGroupSize));
 				}
 			}
 		}
 	}

 	// .work_group_size
 	{
 		tcu::TestCaseGroup *const workGroupSizeGroup = new tcu::TestCaseGroup(m_testCtx, "work_group_size", "Shared Variables with Various Work Group Sizes");
 		addChild(workGroupSizeGroup);

 		workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "float_1_1_1",		TYPE_FLOAT,			PRECISION_HIGHP,	tcu::UVec3(1,1,1)));
 		workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "float_64_1_1",		TYPE_FLOAT,			PRECISION_HIGHP,	tcu::UVec3(64,1,1)));
 		workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "float_1_64_1",		TYPE_FLOAT,			PRECISION_HIGHP,	tcu::UVec3(1,64,1)));
 		workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "float_1_1_64",		TYPE_FLOAT,			PRECISION_HIGHP,	tcu::UVec3(1,1,64)));
 		workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "float_128_1_1",		TYPE_FLOAT,			PRECISION_HIGHP,	tcu::UVec3(128,1,1)));
 		workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "float_1_128_1",		TYPE_FLOAT,			PRECISION_HIGHP,	tcu::UVec3(1,128,1)));
 		workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "float_13_2_4",		TYPE_FLOAT,			PRECISION_HIGHP,	tcu::UVec3(13,2,4)));

 		workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "vec4_1_1_1",		TYPE_FLOAT_VEC4,	PRECISION_HIGHP,	tcu::UVec3(1,1,1)));
 		workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "vec4_64_1_1",		TYPE_FLOAT_VEC4,	PRECISION_HIGHP,	tcu::UVec3(64,1,1)));
 		workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "vec4_1_64_1",		TYPE_FLOAT_VEC4,	PRECISION_HIGHP,	tcu::UVec3(1,64,1)));
 		workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "vec4_1_1_64",		TYPE_FLOAT_VEC4,	PRECISION_HIGHP,	tcu::UVec3(1,1,64)));
 		workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "vec4_128_1_1",		TYPE_FLOAT_VEC4,	PRECISION_HIGHP,	tcu::UVec3(128,1,1)));
 		workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "vec4_1_128_1",		TYPE_FLOAT_VEC4,	PRECISION_HIGHP,	tcu::UVec3(1,128,1)));
 		workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "vec4_13_2_4",		TYPE_FLOAT_VEC4,	PRECISION_HIGHP,	tcu::UVec3(13,2,4)));

 		workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "mat4_1_1_1",		TYPE_FLOAT_MAT4,	PRECISION_HIGHP,	tcu::UVec3(1,1,1)));
 		workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "mat4_64_1_1",		TYPE_FLOAT_MAT4,	PRECISION_HIGHP,	tcu::UVec3(64,1,1)));
 		workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "mat4_1_64_1",		TYPE_FLOAT_MAT4,	PRECISION_HIGHP,	tcu::UVec3(1,64,1)));
 		workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "mat4_1_1_64",		TYPE_FLOAT_MAT4,	PRECISION_HIGHP,	tcu::UVec3(1,1,64)));
 		workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "mat4_128_1_1",		TYPE_FLOAT_MAT4,	PRECISION_HIGHP,	tcu::UVec3(128,1,1)));
 		workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "mat4_1_128_1",		TYPE_FLOAT_MAT4,	PRECISION_HIGHP,	tcu::UVec3(1,128,1)));
 		workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "mat4_13_2_4",		TYPE_FLOAT_MAT4,	PRECISION_HIGHP,	tcu::UVec3(13,2,4)));
 	}

 	// .atomic
 	addChild(new ShaderAtomicOpTests(m_context, "atomic", ATOMIC_OPERAND_SHARED_VARIABLE));
 }

 } // Functional
 } // gles31
 } // deqp
	/*-------------------------------------------------------------------------
	* drawElements Quality Program OpenGL ES 3.1 Module
	* -------------------------------------------------
	*
	* Copyright 2014 The Android Open Source Project
	*
	* Licensed under the Apache License, Version 2.0 (the "License");
	* you may not use this file except in compliance with the License.
	* You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*
	//!
	* \file
	* \brief GLSL Shared variable tests.
	//--------------------------------------------------------------------*/

	#include "es31fShaderSharedVarTests.hpp"
	#include "es31fShaderAtomicOpTests.hpp"
	#include "gluShaderProgram.hpp"
	#include "gluShaderUtil.hpp"
	#include "gluRenderContext.hpp"
	#include "gluObjectWrapper.hpp"
	#include "gluProgramInterfaceQuery.hpp"
	#include "tcuVector.hpp"
	#include "tcuTestLog.hpp"
	#include "tcuVectorUtil.hpp"
	#include "tcuFormatUtil.hpp"
	#include "deRandom.hpp"
	#include "deArrayUtil.hpp"
	#include "glwFunctions.hpp"
	#include "glwEnums.hpp"

	#include <algorithm>
	#include <set>

	namespace deqp
	{
	namespace gles31
	{
	namespace Functional
	{

	using std::string;
	using std::vector;
	using tcu::TestLog;
	using tcu::UVec3;
	using std::set;
	using namespace glu;

	enum
	{
	MAX_VALUE_ARRAY_LENGTH = 15 // * 2 * sizeof(mat4) + sizeof(int) = 481 uniform components (limit 512)
	};

	template<typename T, int Size>
	static inline T product (const tcu::Vector<T, Size>& v)
	{
	T res = v[0];
	for (int ndx = 1; ndx < Size; ndx++)
	res *= v[ndx];
	return res;
	}

	class SharedBasicVarCase : public TestCase
	{
	public:
	SharedBasicVarCase (Context& context, const char* name, DataType basicType, Precision precision, const tcu::UVec3& workGroupSize);
	~SharedBasicVarCase (void);

	void init (void);
	void deinit (void);
	IterateResult iterate (void);

	private:
	SharedBasicVarCase (const SharedBasicVarCase& other);
	SharedBasicVarCase& operator= (const SharedBasicVarCase& other);

	const DataType m_basicType;
	const Precision m_precision;
	const tcu::UVec3 m_workGroupSize;

	ShaderProgram* m_program;
	};

	static std::string getBasicCaseDescription (DataType basicType, Precision precision, const tcu::UVec3& workGroupSize)
	{
	std::ostringstream str;
	if (precision != PRECISION_LAST)
	str << getPrecisionName(precision) << " ";
	str << getDataTypeName(basicType) << ", work group size = " << workGroupSize;
	return str.str();
	}

	SharedBasicVarCase::SharedBasicVarCase (Context& context, const char* name, DataType basicType, Precision precision, const tcu::UVec3& workGroupSize)
	: TestCase (context, name, getBasicCaseDescription(basicType, precision, workGroupSize).c_str())
	, m_basicType (basicType)
	, m_precision (precision)
	, m_workGroupSize (workGroupSize)
	, m_program (DE_NULL)
	{
	}

	SharedBasicVarCase::~SharedBasicVarCase (void)
	{
	SharedBasicVarCase::deinit();
	}

	void SharedBasicVarCase::init (void)
	{
	const int valArrayLength = de::min<int>(MAX_VALUE_ARRAY_LENGTH, product(m_workGroupSize));
	const char* precName = m_precision != glu::PRECISION_LAST ? getPrecisionName(m_precision) : "";
	const char* typeName = getDataTypeName(m_basicType);
	std::ostringstream src;

	src << "#version 310 es\n"
	<< "layout (local_size_x = " << m_workGroupSize[0]
	<< ", local_size_y = " << m_workGroupSize[1]
	<< ", local_size_z = " << m_workGroupSize[2]
	<< ") in;\n"
	<< "const uint LOCAL_SIZE = gl_WorkGroupSize.xgl_WorkGroupSize.ygl_WorkGroupSize.z;\n"
	<< "shared " << precName << " " << typeName << " s_var;\n"
	<< "uniform " << precName << " " << typeName << " u_val[" << valArrayLength << "];\n"
	<< "uniform " << precName << " " << typeName << " u_ref[" << valArrayLength << "];\n"
	<< "uniform uint u_numIters;\n"
	<< "layout(binding = 0) buffer Result\n"
	<< "{\n"
	<< " bool isOk[LOCAL_SIZE];\n"
	<< "};\n"
	<< "\n"
	<< "void main (void)\n"
	<< "{\n"
	<< " bool allOk = true;\n"
	<< " for (uint ndx = 0u; ndx < u_numIters; ndx++)\n"
	<< " {\n"
	<< " if (ndx == gl_LocalInvocationIndex)\n"
	<< " s_var = u_val[ndx%uint(u_val.length())];\n"
	<< "\n"
	<< " barrier();\n"
	<< "\n"
	<< " if (s_var != u_ref[ndx%uint(u_ref.length())])\n"
	<< " allOk = false;\n"
	<< "\n"
	<< " barrier();\n"
	<< " }\n"
	<< "\n"
	<< " isOk[gl_LocalInvocationIndex] = allOk;\n"
	<< "}\n";

	DE_ASSERT(!m_program);
	m_program = new ShaderProgram(m_context.getRenderContext(), ProgramSources() << ComputeSource(src.str()));

	m_testCtx.getLog() << *m_program;

	if (!m_program->isOk())
	{
	delete m_program;
	m_program = DE_NULL;
	throw tcu::TestError("Compile failed");
	}
	}

	void SharedBasicVarCase::deinit (void)
	{
	delete m_program;
	m_program = DE_NULL;
	}

	SharedBasicVarCase::IterateResult SharedBasicVarCase::iterate (void)
	{
	const glw::Functions& gl = m_context.getRenderContext().getFunctions();
	const deUint32 program = m_program->getProgram();
	Buffer outputBuffer (m_context.getRenderContext());
	const deUint32 outBlockNdx = gl.getProgramResourceIndex(program, GL_SHADER_STORAGE_BLOCK, "Result");
	const InterfaceBlockInfo outBlockInfo = getProgramInterfaceBlockInfo(gl, program, GL_SHADER_STORAGE_BLOCK, outBlockNdx);

	gl.useProgram(program);

	// Setup input values.
	{
	const int numValues = (int)product(m_workGroupSize);
	const int valLoc = gl.getUniformLocation(program, "u_val[0]");
	const int refLoc = gl.getUniformLocation(program, "u_ref[0]");
	const int iterCountLoc = gl.getUniformLocation(program, "u_numIters");
	const int scalarSize = getDataTypeScalarSize(m_basicType);

	if (isDataTypeFloatOrVec(m_basicType))
	{
	const int maxInt = m_precision == glu::PRECISION_LOWP ? 2 : 1024;
	const int minInt = -de::min(numValues/2, maxInt);
	vector<float> values (numValues*scalarSize);

	for (int ndx = 0; ndx < (int)values.size(); ndx++)
	values[ndx] = float(minInt + (ndx % (maxInt-minInt+1)));

	for (int uNdx = 0; uNdx < 2; uNdx++)
	{
	const int location = uNdx == 1 ? refLoc : valLoc;

	if (scalarSize == 1) gl.uniform1fv(location, numValues, &values[0]);
	else if (scalarSize == 2) gl.uniform2fv(location, numValues, &values[0]);
	else if (scalarSize == 3) gl.uniform3fv(location, numValues, &values[0]);
	else if (scalarSize == 4) gl.uniform4fv(location, numValues, &values[0]);
	}
	}
	else if (isDataTypeIntOrIVec(m_basicType))
	{
	const int maxInt = m_precision == glu::PRECISION_LOWP ? 64 : 1024;
	const int minInt = -de::min(numValues/2, maxInt);
	vector<int> values (numValues*scalarSize);

	for (int ndx = 0; ndx < (int)values.size(); ndx++)
	values[ndx] = minInt + (ndx % (maxInt-minInt+1));

	for (int uNdx = 0; uNdx < 2; uNdx++)
	{
	const int location = uNdx == 1 ? refLoc : valLoc;

	if (scalarSize == 1) gl.uniform1iv(location, numValues, &values[0]);
	else if (scalarSize == 2) gl.uniform2iv(location, numValues, &values[0]);
	else if (scalarSize == 3) gl.uniform3iv(location, numValues, &values[0]);
	else if (scalarSize == 4) gl.uniform4iv(location, numValues, &values[0]);
	}
	}
	else if (isDataTypeUintOrUVec(m_basicType))
	{
	const deUint32 maxInt = m_precision == glu::PRECISION_LOWP ? 128 : 1024;
	vector<deUint32> values (numValues*scalarSize);

	for (int ndx = 0; ndx < (int)values.size(); ndx++)
	values[ndx] = ndx % (maxInt+1);

	for (int uNdx = 0; uNdx < 2; uNdx++)
	{
	const int location = uNdx == 1 ? refLoc : valLoc;

	if (scalarSize == 1) gl.uniform1uiv(location, numValues, &values[0]);
	else if (scalarSize == 2) gl.uniform2uiv(location, numValues, &values[0]);
	else if (scalarSize == 3) gl.uniform3uiv(location, numValues, &values[0]);
	else if (scalarSize == 4) gl.uniform4uiv(location, numValues, &values[0]);
	}
	}
	else if (isDataTypeBoolOrBVec(m_basicType))
	{
	de::Random rnd (0x324f);
	vector<int> values (numValues*scalarSize);

	for (int ndx = 0; ndx < (int)values.size(); ndx++)
	values[ndx] = rnd.getBool() ? 1 : 0;

	for (int uNdx = 0; uNdx < 2; uNdx++)
	{
	const int location = uNdx == 1 ? refLoc : valLoc;

	if (scalarSize == 1) gl.uniform1iv(location, numValues, &values[0]);
	else if (scalarSize == 2) gl.uniform2iv(location, numValues, &values[0]);
	else if (scalarSize == 3) gl.uniform3iv(location, numValues, &values[0]);
	else if (scalarSize == 4) gl.uniform4iv(location, numValues, &values[0]);
	}
	}
	else if (isDataTypeMatrix(m_basicType))
	{
	const int maxInt = m_precision == glu::PRECISION_LOWP ? 2 : 1024;
	const int minInt = -de::min(numValues/2, maxInt);
	vector<float> values (numValues*scalarSize);

	for (int ndx = 0; ndx < (int)values.size(); ndx++)
	values[ndx] = float(minInt + (ndx % (maxInt-minInt+1)));

	for (int uNdx = 0; uNdx < 2; uNdx++)
	{
	const int location = uNdx == 1 ? refLoc : valLoc;

	switch (m_basicType)
	{
	case TYPE_FLOAT_MAT2: gl.uniformMatrix2fv (location, numValues, DE_FALSE, &values[0]); break;
	case TYPE_FLOAT_MAT2X3: gl.uniformMatrix2x3fv(location, numValues, DE_FALSE, &values[0]); break;
	case TYPE_FLOAT_MAT2X4: gl.uniformMatrix2x4fv(location, numValues, DE_FALSE, &values[0]); break;
	case TYPE_FLOAT_MAT3X2: gl.uniformMatrix3x2fv(location, numValues, DE_FALSE, &values[0]); break;
	case TYPE_FLOAT_MAT3: gl.uniformMatrix3fv (location, numValues, DE_FALSE, &values[0]); break;
	case TYPE_FLOAT_MAT3X4: gl.uniformMatrix3x4fv(location, numValues, DE_FALSE, &values[0]); break;
	case TYPE_FLOAT_MAT4X2: gl.uniformMatrix4x2fv(location, numValues, DE_FALSE, &values[0]); break;
	case TYPE_FLOAT_MAT4X3: gl.uniformMatrix4x3fv(location, numValues, DE_FALSE, &values[0]); break;
	case TYPE_FLOAT_MAT4: gl.uniformMatrix4fv (location, numValues, DE_FALSE, &values[0]); break;
	default:
	DE_ASSERT(false);
	}
	}
	}

	gl.uniform1ui(iterCountLoc, product(m_workGroupSize));
	GLU_EXPECT_NO_ERROR(gl.getError(), "Input value setup failed");
	}

	// Setup output buffer.
	{
	vector<deUint8> emptyData(outBlockInfo.dataSize);
	std::fill(emptyData.begin(), emptyData.end(), 0);

	gl.bindBuffer(GL_SHADER_STORAGE_BUFFER, *outputBuffer);
	gl.bufferData(GL_SHADER_STORAGE_BUFFER, outBlockInfo.dataSize, &emptyData[0], GL_STATIC_READ);
	gl.bindBufferBase(GL_SHADER_STORAGE_BUFFER, 0, *outputBuffer);
	GLU_EXPECT_NO_ERROR(gl.getError(), "Output buffer setup failed");
	}

	gl.dispatchCompute(1, 1, 1);

	// Read back and compare
	{
	const deUint32 numValues = product(m_workGroupSize);
	const InterfaceVariableInfo outVarInfo = getProgramInterfaceVariableInfo(gl, program, GL_BUFFER_VARIABLE, outBlockInfo.activeVariables[0]);
	const void* resPtr = gl.mapBufferRange(GL_SHADER_STORAGE_BUFFER, 0, outBlockInfo.dataSize, GL_MAP_READ_BIT);
	const int maxErrMsg = 10;
	int numFailed = 0;

	GLU_EXPECT_NO_ERROR(gl.getError(), "glMapBufferRange()");
	TCU_CHECK(resPtr);

	for (deUint32 ndx = 0; ndx < numValues; ndx++)
	{
	const int resVal = ((const int)((const deUint8)resPtr + outVarInfo.offset + outVarInfo.arrayStridendx));

	if (resVal == 0)
	{
	if (numFailed < maxErrMsg)
	m_testCtx.getLog() << TestLog::Message << "ERROR: isOk[" << ndx << "] = " << resVal << " != true" << TestLog::EndMessage;
	else if (numFailed == maxErrMsg)
	m_testCtx.getLog() << TestLog::Message << "..." << TestLog::EndMessage;

	numFailed += 1;
	}
	}

	gl.unmapBuffer(GL_SHADER_STORAGE_BUFFER);
	GLU_EXPECT_NO_ERROR(gl.getError(), "glUnmapBuffer()");

	m_testCtx.getLog() << TestLog::Message << (numValues-numFailed) << " / " << numValues << " values passed" << TestLog::EndMessage;

	m_testCtx.setTestResult(numFailed == 0 ? QP_TEST_RESULT_PASS : QP_TEST_RESULT_FAIL,
	numFailed == 0 ? "Pass" : "Comparison failed");
	}

	return STOP;
	}

	ShaderSharedVarTests::ShaderSharedVarTests (Context& context)
	: TestCaseGroup(context, "shared_var", "Shared Variable Tests")
	{
	}

	ShaderSharedVarTests::~ShaderSharedVarTests (void)
	{
	}

	void ShaderSharedVarTests::init (void)
	{
	// .basic_type
	{
	tcu::TestCaseGroup *const basicTypeGroup = new tcu::TestCaseGroup(m_testCtx, "basic_type", "Basic Types");
	addChild(basicTypeGroup);

	for (int basicType = TYPE_FLOAT; basicType <= TYPE_BOOL_VEC4; basicType++)
	{
	if (glu::getDataTypeScalarType(DataType(basicType)) == glu::TYPE_DOUBLE)
	continue;

	if (glu::isDataTypeBoolOrBVec(DataType(basicType)))
	{
	const tcu::UVec3 workGroupSize (2,1,3);
	basicTypeGroup->addChild(new SharedBasicVarCase(m_context, getDataTypeName(DataType(basicType)), DataType(basicType), PRECISION_LAST, workGroupSize));
	}
	else
	{
	for (int precision = 0; precision < PRECISION_LAST; precision++)
	{
	const tcu::UVec3 workGroupSize (2,1,3);
	const string name = string(getDataTypeName(DataType(basicType))) + "_" + getPrecisionName(Precision(precision));

	basicTypeGroup->addChild(new SharedBasicVarCase(m_context, name.c_str(), DataType(basicType), Precision(precision), workGroupSize));
	}
	}
	}
	}

	// .work_group_size
	{
	tcu::TestCaseGroup *const workGroupSizeGroup = new tcu::TestCaseGroup(m_testCtx, "work_group_size", "Shared Variables with Various Work Group Sizes");
	addChild(workGroupSizeGroup);

	workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "float_1_1_1", TYPE_FLOAT, PRECISION_HIGHP, tcu::UVec3(1,1,1)));
	workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "float_64_1_1", TYPE_FLOAT, PRECISION_HIGHP, tcu::UVec3(64,1,1)));
	workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "float_1_64_1", TYPE_FLOAT, PRECISION_HIGHP, tcu::UVec3(1,64,1)));
	workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "float_1_1_64", TYPE_FLOAT, PRECISION_HIGHP, tcu::UVec3(1,1,64)));
	workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "float_128_1_1", TYPE_FLOAT, PRECISION_HIGHP, tcu::UVec3(128,1,1)));
	workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "float_1_128_1", TYPE_FLOAT, PRECISION_HIGHP, tcu::UVec3(1,128,1)));
	workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "float_13_2_4", TYPE_FLOAT, PRECISION_HIGHP, tcu::UVec3(13,2,4)));

	workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "vec4_1_1_1", TYPE_FLOAT_VEC4, PRECISION_HIGHP, tcu::UVec3(1,1,1)));
	workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "vec4_64_1_1", TYPE_FLOAT_VEC4, PRECISION_HIGHP, tcu::UVec3(64,1,1)));
	workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "vec4_1_64_1", TYPE_FLOAT_VEC4, PRECISION_HIGHP, tcu::UVec3(1,64,1)));
	workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "vec4_1_1_64", TYPE_FLOAT_VEC4, PRECISION_HIGHP, tcu::UVec3(1,1,64)));
	workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "vec4_128_1_1", TYPE_FLOAT_VEC4, PRECISION_HIGHP, tcu::UVec3(128,1,1)));
	workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "vec4_1_128_1", TYPE_FLOAT_VEC4, PRECISION_HIGHP, tcu::UVec3(1,128,1)));
	workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "vec4_13_2_4", TYPE_FLOAT_VEC4, PRECISION_HIGHP, tcu::UVec3(13,2,4)));

	workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "mat4_1_1_1", TYPE_FLOAT_MAT4, PRECISION_HIGHP, tcu::UVec3(1,1,1)));
	workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "mat4_64_1_1", TYPE_FLOAT_MAT4, PRECISION_HIGHP, tcu::UVec3(64,1,1)));
	workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "mat4_1_64_1", TYPE_FLOAT_MAT4, PRECISION_HIGHP, tcu::UVec3(1,64,1)));
	workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "mat4_1_1_64", TYPE_FLOAT_MAT4, PRECISION_HIGHP, tcu::UVec3(1,1,64)));
	workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "mat4_128_1_1", TYPE_FLOAT_MAT4, PRECISION_HIGHP, tcu::UVec3(128,1,1)));
	workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "mat4_1_128_1", TYPE_FLOAT_MAT4, PRECISION_HIGHP, tcu::UVec3(1,128,1)));
	workGroupSizeGroup->addChild(new SharedBasicVarCase(m_context, "mat4_13_2_4", TYPE_FLOAT_MAT4, PRECISION_HIGHP, tcu::UVec3(13,2,4)));
	}

	// .atomic
	addChild(new ShaderAtomicOpTests(m_context, "atomic", ATOMIC_OPERAND_SHARED_VARIABLE));
	}

	} // Functional
	} // gles31
	} // deqp