// framework/randomshaders/rsgProgramExecutor.cpp - third_party/vulkan-cts - Git at Google

 /*-------------------------------------------------------------------------
  * drawElements Quality Program Random Shader Generator
  * ----------------------------------------------------
  *
  * Copyright 2014 The Android Open Source Project
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
  * You may obtain a copy of the License at
  *
  *      http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  *
  *//*!
  * \file
  * \brief Program Executor.
  *//*--------------------------------------------------------------------*/

 #include "rsgProgramExecutor.hpp"
 #include "rsgExecutionContext.hpp"
 #include "rsgVariableValue.hpp"
 #include "rsgUtils.hpp"
 #include "tcuSurface.hpp"
 #include "deMath.h"
 #include "deString.h"

 #include <set>
 #include <string>
 #include <map>

 using std::set;
 using std::string;
 using std::vector;
 using std::map;

 namespace rsg
 {

 /*!
  * \brief Backing store for one varying: a flat array of scalars covering every vertex.
  *
  * The array holds type.getScalarSize() scalars per vertex, and the value of
  * vertex N begins at scalar index type.getScalarSize()*N.
  */
 class VaryingStorage
 {
 public:
 	VaryingStorage (const VariableType& type, int numVertices);
 	~VaryingStorage () {}

 	// Read-only and mutable views of the value belonging to vertex vtxNdx.
 	ConstValueAccess getValue (const VariableType& type, int vtxNdx) const;
 	ValueAccess getValue (const VariableType& type, int vtxNdx);

 private:
 	std::vector<Scalar> m_value;
 };

 // Allocates type.getScalarSize() scalars for each of the numVertices vertices.
 VaryingStorage::VaryingStorage (const VariableType& type, int numVertices)
 {
 	m_value.resize(type.getScalarSize()*numVertices);
 }

 // Mutable view of the value stored for vertex vtxNdx.
 ValueAccess VaryingStorage::getValue (const VariableType& type, int vtxNdx)
 {
 	const int firstScalarNdx = type.getScalarSize()*vtxNdx;
 	return ValueAccess(type, &m_value[firstScalarNdx]);
 }

 // Read-only view of the value stored for vertex vtxNdx.
 ConstValueAccess VaryingStorage::getValue (const VariableType& type, int vtxNdx) const
 {
 	const int firstScalarNdx = type.getScalarSize()*vtxNdx;
 	return ConstValueAccess(type, &m_value[firstScalarNdx]);
 }

 /*!
  * \brief Name-keyed collection of per-varying storage.
  *
  * Owns every VaryingStorage it hands out; the destructor deletes them.
  * Copying is disabled because a copy would share the raw pointers and both
  * destructors would delete the same objects.
  */
 class VaryingStore
 {
 public:
 							VaryingStore		(int numVertices);
 							~VaryingStore		(void);

 	// Returns the storage registered under name, creating it on first use.
 	VaryingStorage*			getStorage			(const VariableType& type, const char* name);

 private:
 	// Declared but intentionally not defined: copying would cause a double delete.
 							VaryingStore		(const VaryingStore&);
 	VaryingStore&			operator=			(const VaryingStore&);

 	int											m_numVertices;	// Vertex count used to size each new storage.
 	std::map<std::string, VaryingStorage*>		m_values;		// Owned storages, keyed by varying name.
 };

 // Records the vertex count used to size every storage created later.
 VaryingStore::VaryingStore (int numVertices)
 	: m_numVertices	(numVertices)
 	, m_values		()
 {
 }

 // Deletes every storage object held in the map, then empties the map.
 VaryingStore::~VaryingStore (void)
 {
 	typedef std::map<std::string, VaryingStorage*>::iterator StorageIter;

 	for (StorageIter cur = m_values.begin(), last = m_values.end(); cur != last; ++cur)
 		delete cur->second;

 	m_values.clear();
 }

 /*!
  * \brief Look up the storage for a varying, creating it on first request.
  *
  * \param type	Type used to size the storage if it has to be created.
  * \param name	Varying name used as the map key.
  * \return Storage registered under name; never null.
  */
 VaryingStorage* VaryingStore::getStorage (const VariableType& type, const char* name)
 {
 	// operator[] inserts a null entry for an unknown name. Holding a reference
 	// to that slot lets it be filled in without a second lookup.
 	VaryingStorage*& slot = m_values[name];

 	if (!slot)
 		slot = new VaryingStorage(type, m_numVertices);

 	return slot;
 }

 /*!
  * \brief Bilinear blend of four corner values.
  *
  * quad.x(), .y(), .z() and .w() are the values at (0,0), (1,0), (0,1) and
  * (1,1) respectively; (x, y) is the sample position.
  */
 inline float interpolateVertexQuad (const tcu::Vec4& quad, float x, float y)
 {
 	const float invX = 1.0f-x;
 	const float invY = 1.0f-y;

 	return quad.x()*(invX*invY) + quad.y()*(x*invY) + quad.z()*(invX*y) + quad.w()*(x*y);
 }

 inline float interpolateVertex (float x0y0, float x1y1, float x, float y)
 {
 	return interpolateVertexQuad(tcu::Vec4(x0y0, (x0y0+x1y1)*0.5f, (x0y0+x1y1)*0.5f, x1y1), x, y);
 }

 // Linear interpolation over a triangle: v0 is the value at the origin,
 // v1 the value one unit along x, and v2 the value one unit along y.
 inline float interpolateTri (float v0, float v1, float v2, float x, float y)
 {
 	const float alongX = (v1-v0)*x;
 	const float alongY = (v2-v0)*y;
 	return v0 + alongX + alongY;
 }

 /*!
  * \brief Interpolate a quad as two triangles split along the x+y=1 diagonal.
  *
  * Positions with x+y < 1 use the triangle (quad.x, quad.y, quad.z). All other
  * positions use the triangle (quad.w, quad.z, quad.y) with mirrored coordinates.
  */
 inline float interpolateFragment (const tcu::Vec4& quad, float x, float y)
 {
 	const bool inFirstTriangle = (x + y < 1.0f);

 	if (!inFirstTriangle)
 		return interpolateTri(quad.w(), quad.z(), quad.y(), 1.0f-x, 1.0f-y);

 	return interpolateTri(quad.x(), quad.y(), quad.z(), x, y);
 }

 /*!
  * \brief Fill lane dstComp of a vertex input from its value range.
  *
  * For every element, the interpolation coordinates are obtained from
  * getVertexInterpolationCoords() and the element's range minimum and maximum
  * are blended with interpolateVertex(). Only float base types pass the check.
  */
 template <int Stride>
 void interpolateVertexInput (StridedValueAccess<Stride> dst, int dstComp, const ConstValueRangeAccess valueRange, float x, float y)
 {
 	TCU_CHECK(valueRange.getType().getBaseType() == VariableType::TYPE_FLOAT);

 	const int elemCount = valueRange.getType().getNumElements();
 	for (int elemNdx = 0; elemNdx < elemCount; ++elemNdx)
 	{
 		float coordX, coordY;
 		getVertexInterpolationCoords(coordX, coordY, x, y, elemNdx);

 		const float rangeMin = valueRange.getMin().component(elemNdx).asFloat();
 		const float rangeMax = valueRange.getMax().component(elemNdx).asFloat();

 		dst.component(elemNdx).asFloat(dstComp) = interpolateVertex(rangeMin, rangeMax, coordX, coordY);
 	}
 }

 /*!
  * \brief Fill lane dstComp of a fragment input from four per-vertex values.
  *
  * Each element of dst is computed by interpolateFragment() from the matching
  * element of vtx0..vtx3 at position (x, y). Only float base types pass the check.
  */
 template <int Stride>
 void interpolateFragmentInput (StridedValueAccess<Stride> dst, int dstComp, ConstValueAccess vtx0, ConstValueAccess vtx1, ConstValueAccess vtx2, ConstValueAccess vtx3, float x, float y)
 {
 	TCU_CHECK(dst.getType().getBaseType() == VariableType::TYPE_FLOAT);

 	const int elemCount = dst.getType().getNumElements();
 	for (int elemNdx = 0; elemNdx < elemCount; ++elemNdx)
 	{
 		const tcu::Vec4 corners(vtx0.component(elemNdx).asFloat(),
 								vtx1.component(elemNdx).asFloat(),
 								vtx2.component(elemNdx).asFloat(),
 								vtx3.component(elemNdx).asFloat());

 		dst.component(elemNdx).asFloat(dstComp) = interpolateFragment(corners, x, y);
 	}
 }

 // Copies lane compNdx of every element of src into the matching element of
 // dst. Only float base types pass the check.
 template <int Stride>
 void copyVarying (ValueAccess dst, ConstStridedValueAccess<Stride> src, int compNdx)
 {
 	TCU_CHECK(dst.getType().getBaseType() == VariableType::TYPE_FLOAT);

 	const int elemCount = dst.getType().getNumElements();
 	for (int ndx = 0; ndx < elemCount; ++ndx)
 	{
 		dst.component(ndx).asFloat() = src.component(ndx).asFloat(compNdx);
 	}
 }

 // Stores the destination buffer access and the grid size; execute() uses a
 // vertex grid one larger than the grid size in each dimension.
 ProgramExecutor::ProgramExecutor (const tcu::PixelBufferAccess& dst, int gridWidth, int gridHeight)
 	: m_dst(dst), m_gridWidth(gridWidth), m_gridHeight(gridHeight)
 {
 }

 // The destructor body is empty; nothing is released explicitly here.
 ProgramExecutor::~ProgramExecutor ()
 {
 }

 // Binds a 2D texture and its sampler state to sampler index samplerNdx,
 // replacing any earlier binding for that index.
 void ProgramExecutor::setTexture (int samplerNdx, const tcu::Texture2D* texture, const tcu::Sampler& sampler)
 {
 	const Sampler2D binding(texture, sampler);
 	m_samplers2D[samplerNdx] = binding;
 }

 // Binds a cube texture and its sampler state to sampler index samplerNdx,
 // replacing any earlier binding for that index.
 void ProgramExecutor::setTexture (int samplerNdx, const tcu::TextureCube* texture, const tcu::Sampler& sampler)
 {
 	const SamplerCube binding(texture, sampler);
 	m_samplersCube[samplerNdx] = binding;
 }

 /*!
  * \brief Indices of the four grid vertices surrounding pixel (x, y).
  *
  * Vertices are numbered row by row with gridVtxWidth vertices per row. The
  * result is ordered (x0,y0), (x0+1,y0), (x0,y0+1), (x0+1,y0+1), where
  * (x0, y0) is the cell containing the pixel. gridVtxHeight is unused.
  *
  * NOTE(review): the cell is picked from the pixel's integer coordinate, while
  * computeGridCellWeights() uses the pixel center (+0.5). The two can disagree
  * when the cell size is not an integer - confirm this is intended.
  */
 inline tcu::IVec4 computeVertexIndices (float cellWidth, float cellHeight, int gridVtxWidth, int gridVtxHeight, int x, int y)
 {
 	DE_UNREF(gridVtxHeight);

 	const int cellX	= static_cast<int>(deFloatFloor(static_cast<float>(x) / cellWidth));
 	const int cellY	= static_cast<int>(deFloatFloor(static_cast<float>(y) / cellHeight));

 	// First vertex index of the cell on row y0 and on row y0+1.
 	const int row0	= cellY*gridVtxWidth + cellX;
 	const int row1	= (cellY+1)*gridVtxWidth + cellX;

 	return tcu::IVec4(row0, row0 + 1, row1, row1 + 1);
 }

 // Fractional position of the pixel center (x+0.5, y+0.5) measured in grid
 // cells of size cellWidth x cellHeight.
 inline tcu::Vec2 computeGridCellWeights (float cellWidth, float cellHeight, int x, int y)
 {
 	const float fracX = deFloatFrac(((float)x + 0.5f) / cellWidth);
 	const float fracY = deFloatFrac(((float)y + 0.5f) / cellHeight);
 	return tcu::Vec2(fracX, fracY);
 }

 // Converts a float color to tcu::RGBA: each channel is multiplied by 255,
 // rounded with deRoundFloatToInt32() and clamped to [0, 255].
 inline tcu::RGBA toColor (tcu::Vec4 rgba)
 {
 	const int red	= deClamp32(deRoundFloatToInt32(rgba.x()*255), 0, 255);
 	const int green	= deClamp32(deRoundFloatToInt32(rgba.y()*255), 0, 255);
 	const int blue	= deClamp32(deRoundFloatToInt32(rgba.z()*255), 0, 255);
 	const int alpha	= deClamp32(deRoundFloatToInt32(rgba.w()*255), 0, 255);

 	return tcu::RGBA(red, green, blue, alpha);
 }

 /*!
  * \brief Run both shader stages and write the fragment colors to the destination buffer.
  *
  * The vertex shader is evaluated on a (m_gridWidth+1) x (m_gridHeight+1)
  * vertex grid, EXEC_VEC_WIDTH vertices per packet. Every vertex output except
  * gl_Position is stored per vertex and then interpolated for each destination
  * pixel as fragment shader input. The fragment output with layout location 0
  * is written out as the pixel color; TCU_CHECK fails if there is no such output.
  *
  * \param vertexShader		Shader executed once per vertex packet.
  * \param fragmentShader	Shader executed once per fragment packet.
  * \param uniformValues		Values assigned to the uniforms in both stages.
  */
 void ProgramExecutor::execute (const Shader& vertexShader, const Shader& fragmentShader, const vector<VariableValue>& uniformValues)
 {
 	int	gridVtxWidth	= m_gridWidth+1;
 	int gridVtxHeight	= m_gridHeight+1;
 	int numVertices		= gridVtxWidth*gridVtxHeight;

 	VaryingStore varyingStore(numVertices);

 	// Execute vertex shader
 	{
 		ExecutionContext	execCtx(m_samplers2D, m_samplersCube);

 		// Number of EXEC_VEC_WIDTH-wide packets needed to cover all vertices,
 		// rounded up so that a trailing partial packet is included.
 		int					numPackets	= numVertices/EXEC_VEC_WIDTH + ((numVertices%EXEC_VEC_WIDTH) ? 1 : 0);

 		const vector<ShaderInput*>& inputs	= vertexShader.getInputs();
 		vector<const Variable*>		outputs;
 		vertexShader.getOutputs(outputs);

 		// Set uniform values
 		for (vector<VariableValue>::const_iterator uniformIter = uniformValues.begin(); uniformIter != uniformValues.end(); ++uniformIter)
 			execCtx.getValue(uniformIter->getVariable()) = uniformIter->getValue().value();

 		for (int packetNdx = 0; packetNdx < numPackets; packetNdx++)
 		{
 			// Vertex index range [packetStart, packetEnd) covered by this packet;
 			// the last packet may be shorter than EXEC_VEC_WIDTH.
 			int packetStart	= packetNdx*EXEC_VEC_WIDTH;
 			int packetEnd	= deMin32((packetNdx+1)*EXEC_VEC_WIDTH, numVertices);

 			// Compute values for vertex shader inputs
 			for (vector<ShaderInput*>::const_iterator i = inputs.begin(); i != inputs.end(); ++i)
 			{
 				const ShaderInput*	input	= *i;
 				ExecValueAccess		access	= execCtx.getValue(input->getVariable());

 				for (int vtxNdx = packetStart; vtxNdx < packetEnd; vtxNdx++)
 				{
 					// Grid position of the vertex, normalized by the number of cells.
 					int		y	= (vtxNdx/gridVtxWidth);
 					int		x	= vtxNdx - y*gridVtxWidth;
 					float	xf	= (float)x / (float)(gridVtxWidth-1);
 					float	yf	= (float)y / (float)(gridVtxHeight-1);

 					interpolateVertexInput(access, vtxNdx-packetStart, input->getValueRange(), xf, yf);
 				}
 			}

 			// Execute vertex shader for packet
 			vertexShader.execute(execCtx);

 			// Store output values
 			for (vector<const Variable*>::const_iterator i = outputs.begin(); i != outputs.end(); ++i)
 			{
 				const Variable*			output	= *i;

 				if (deStringEqual(output->getName(), "gl_Position"))
 					continue; // Do not store position

 				ExecConstValueAccess	access	= execCtx.getValue(output);
 				VaryingStorage*			dst		= varyingStore.getStorage(output->getType(), output->getName());

 				for (int vtxNdx = packetStart; vtxNdx < packetEnd; vtxNdx++)
 				{
 					ValueAccess varyingAccess = dst->getValue(output->getType(), vtxNdx);
 					copyVarying(varyingAccess, access, vtxNdx-packetStart);
 				}
 			}
 		}
 	}

 	// Execute fragment shader
 	{
 		ExecutionContext execCtx(m_samplers2D, m_samplersCube);

 		// Assign uniform values
 		for (vector<VariableValue>::const_iterator i = uniformValues.begin(); i != uniformValues.end(); ++i)
 			execCtx.getValue(i->getVariable()) = i->getValue().value();

 		const vector<ShaderInput*>& inputs			= fragmentShader.getInputs();
 		const Variable*				fragColorVar	= DE_NULL;
 		vector<const Variable*>		outputs;

 		// Find fragment shader output assigned to location 0. This is fragment color.
 		fragmentShader.getOutputs(outputs);
 		for (vector<const Variable*>::const_iterator i = outputs.begin(); i != outputs.end(); ++i)
 		{
 			if ((*i)->getLayoutLocation() == 0)
 			{
 				fragColorVar = *i;
 				break;
 			}
 		}
 		TCU_CHECK(fragColorVar);

 		int	width			= m_dst.getWidth();
 		int height			= m_dst.getHeight();
 		int numFragments	= width*height;
 		int numPackets		= numFragments/EXEC_VEC_WIDTH + ((numFragments%EXEC_VEC_WIDTH) ? 1 : 0);

 		// Size of one grid cell in pixels.
 		float cellWidth		= (float)width	/ (float)m_gridWidth;
 		float cellHeight	= (float)height	/ (float)m_gridHeight;

 		for (int packetNdx = 0; packetNdx < numPackets; packetNdx++)
 		{
 			int packetStart	= packetNdx*EXEC_VEC_WIDTH;
 			int packetEnd	= deMin32((packetNdx+1)*EXEC_VEC_WIDTH, numFragments);

 			// Interpolate varyings
 			for (vector<ShaderInput*>::const_iterator i = inputs.begin(); i != inputs.end(); ++i)
 			{
 				const ShaderInput*		input	= *i;
 				ExecValueAccess			access	= execCtx.getValue(input->getVariable());
 				const VariableType&		type	= input->getVariable()->getType();
 				const VaryingStorage*	src		= varyingStore.getStorage(type, input->getVariable()->getName());

 				// \todo [2011-03-08 pyry] Part of this could be pre-computed...
 				for (int fragNdx = packetStart; fragNdx < packetEnd; fragNdx++)
 				{
 					// Fragments are numbered row by row across the destination.
 					int y = fragNdx/width;
 					int x = fragNdx - y*width;
 					tcu::IVec4	vtxIndices	= computeVertexIndices(cellWidth, cellHeight, gridVtxWidth, gridVtxHeight, x, y);
 					tcu::Vec2	weights		= computeGridCellWeights(cellWidth, cellHeight, x, y);

 					interpolateFragmentInput(access, fragNdx-packetStart,
 											 src->getValue(type, vtxIndices.x()),
 											 src->getValue(type, vtxIndices.y()),
 											 src->getValue(type, vtxIndices.z()),
 											 src->getValue(type, vtxIndices.w()),
 											 weights.x(), weights.y());
 				}
 			}

 			// Execute fragment shader
 			fragmentShader.execute(execCtx);

 			// Write resulting color
 			ExecConstValueAccess colorValue = execCtx.getValue(fragColorVar);
 			for (int fragNdx = packetStart; fragNdx < packetEnd; fragNdx++)
 			{
 				int			y		= fragNdx/width;
 				int			x		= fragNdx - y*width;
 				int			cNdx	= fragNdx-packetStart;
 				tcu::Vec4	c		= tcu::Vec4(colorValue.component(0).asFloat(cNdx),
 												colorValue.component(1).asFloat(cNdx),
 												colorValue.component(2).asFloat(cNdx),
 												colorValue.component(3).asFloat(cNdx));

 				// Rows are written in reverse vertical order.
 				// \todo [2012-11-13 pyry] Reverse order.
 				m_dst.setPixel(c, x, m_dst.getHeight()-y-1);
 			}
 		}
 	}
 }

 } // rsg
	/*-------------------------------------------------------------------------
	* drawElements Quality Program Random Shader Generator
	* ----------------------------------------------------
	*
	* Copyright 2014 The Android Open Source Project
	*
	* Licensed under the Apache License, Version 2.0 (the "License");
	* you may not use this file except in compliance with the License.
	* You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*
	*//*!
	* \file
	* \brief Program Executor.
	*//*--------------------------------------------------------------------*/

	#include "rsgProgramExecutor.hpp"
	#include "rsgExecutionContext.hpp"
	#include "rsgVariableValue.hpp"
	#include "rsgUtils.hpp"
	#include "tcuSurface.hpp"
	#include "deMath.h"
	#include "deString.h"

	#include <set>
	#include <string>
	#include <map>

	using std::set;
	using std::string;
	using std::vector;
	using std::map;

	namespace rsg
	{

	/*!
	 * \brief Backing store for one varying: a flat array of scalars covering every vertex.
	 *
	 * The array holds type.getScalarSize() scalars per vertex, and the value of
	 * vertex N begins at scalar index type.getScalarSize()*N.
	 */
	class VaryingStorage
	{
	public:
		VaryingStorage (const VariableType& type, int numVertices);
		~VaryingStorage () {}

		// Read-only and mutable views of the value belonging to vertex vtxNdx.
		ConstValueAccess getValue (const VariableType& type, int vtxNdx) const;
		ValueAccess getValue (const VariableType& type, int vtxNdx);

	private:
		std::vector<Scalar> m_value;
	};

	// Allocates type.getScalarSize() scalars for each of the numVertices vertices.
	VaryingStorage::VaryingStorage (const VariableType& type, int numVertices)
	{
		m_value.resize(type.getScalarSize()*numVertices);
	}

	// Mutable view of the value stored for vertex vtxNdx.
	ValueAccess VaryingStorage::getValue (const VariableType& type, int vtxNdx)
	{
		const int firstScalarNdx = type.getScalarSize()*vtxNdx;
		return ValueAccess(type, &m_value[firstScalarNdx]);
	}

	// Read-only view of the value stored for vertex vtxNdx.
	ConstValueAccess VaryingStorage::getValue (const VariableType& type, int vtxNdx) const
	{
		const int firstScalarNdx = type.getScalarSize()*vtxNdx;
		return ConstValueAccess(type, &m_value[firstScalarNdx]);
	}

	/*!
	 * \brief Name-keyed collection of per-varying storage.
	 *
	 * Owns every VaryingStorage it hands out; the destructor deletes them.
	 * Copying is disabled because a copy would share the raw pointers and both
	 * destructors would delete the same objects.
	 */
	class VaryingStore
	{
	public:
		VaryingStore (int numVertices);
		~VaryingStore (void);

		// Returns the storage registered under name, creating it on first use.
		VaryingStorage* getStorage (const VariableType& type, const char* name);

	private:
		// Declared but intentionally not defined: copying would cause a double delete.
		VaryingStore (const VaryingStore&);
		VaryingStore& operator= (const VaryingStore&);

		int m_numVertices;									// Vertex count used to size each new storage.
		std::map<std::string, VaryingStorage*> m_values;	// Owned storages, keyed by varying name.
	};

	// Records the vertex count used to size every storage created later.
	VaryingStore::VaryingStore (int numVertices)
		: m_numVertices	(numVertices)
		, m_values		()
	{
	}

	// Deletes every storage object held in the map, then empties the map.
	VaryingStore::~VaryingStore (void)
	{
		typedef std::map<std::string, VaryingStorage*>::iterator StorageIter;

		for (StorageIter cur = m_values.begin(), last = m_values.end(); cur != last; ++cur)
			delete cur->second;

		m_values.clear();
	}

	/*!
	 * \brief Look up the storage for a varying, creating it on first request.
	 *
	 * \param type	Type used to size the storage if it has to be created.
	 * \param name	Varying name used as the map key.
	 * \return Storage registered under name; never null.
	 */
	VaryingStorage* VaryingStore::getStorage (const VariableType& type, const char* name)
	{
		// operator[] inserts a null entry for an unknown name. Holding a reference
		// to that slot lets it be filled in without a second lookup.
		VaryingStorage*& slot = m_values[name];

		if (!slot)
			slot = new VaryingStorage(type, m_numVertices);

		return slot;
	}

	/*!
	 * \brief Bilinear blend of four corner values.
	 *
	 * quad.x(), .y(), .z() and .w() are the values at (0,0), (1,0), (0,1) and
	 * (1,1) respectively; (x, y) is the sample position.
	 */
	inline float interpolateVertexQuad (const tcu::Vec4& quad, float x, float y)
	{
		float w00 = (1.0f-x)*(1.0f-y);
		float w01 = (1.0f-x)*y;
		float w10 = x*(1.0f-y);
		float w11 = x*y;
		// Each corner value is multiplied by its weight.
		return quad.x()*w00 + quad.y()*w10 + quad.z()*w01 + quad.w()*w11;
	}

	// Bilinear blend between x0y0 at (0,0) and x1y1 at (1,1); the two remaining
	// corners both take the average of the two values.
	inline float interpolateVertex (float x0y0, float x1y1, float x, float y)
	{
		return interpolateVertexQuad(tcu::Vec4(x0y0, (x0y0+x1y1)*0.5f, (x0y0+x1y1)*0.5f, x1y1), x, y);
	}

	// Linear interpolation over a triangle: v0 is the value at the origin,
	// v1 the value one unit along x, and v2 the value one unit along y.
	inline float interpolateTri (float v0, float v1, float v2, float x, float y)
	{
		return v0 + (v1-v0)*x + (v2-v0)*y;
	}

	/*!
	 * \brief Interpolate a quad as two triangles split along the x+y=1 diagonal.
	 *
	 * Positions with x+y < 1 use the triangle (quad.x, quad.y, quad.z). All other
	 * positions use the triangle (quad.w, quad.z, quad.y) with mirrored coordinates.
	 */
	inline float interpolateFragment (const tcu::Vec4& quad, float x, float y)
	{
		const bool inFirstTriangle = (x + y < 1.0f);

		if (!inFirstTriangle)
			return interpolateTri(quad.w(), quad.z(), quad.y(), 1.0f-x, 1.0f-y);

		return interpolateTri(quad.x(), quad.y(), quad.z(), x, y);
	}

	/*!
	 * \brief Fill lane dstComp of a vertex input from its value range.
	 *
	 * For every element, the interpolation coordinates are obtained from
	 * getVertexInterpolationCoords() and the element's range minimum and maximum
	 * are blended with interpolateVertex(). Only float base types pass the check.
	 */
	template <int Stride>
	void interpolateVertexInput (StridedValueAccess<Stride> dst, int dstComp, const ConstValueRangeAccess valueRange, float x, float y)
	{
		TCU_CHECK(valueRange.getType().getBaseType() == VariableType::TYPE_FLOAT);

		const int elemCount = valueRange.getType().getNumElements();
		for (int elemNdx = 0; elemNdx < elemCount; ++elemNdx)
		{
			float coordX, coordY;
			getVertexInterpolationCoords(coordX, coordY, x, y, elemNdx);

			const float rangeMin = valueRange.getMin().component(elemNdx).asFloat();
			const float rangeMax = valueRange.getMax().component(elemNdx).asFloat();

			dst.component(elemNdx).asFloat(dstComp) = interpolateVertex(rangeMin, rangeMax, coordX, coordY);
		}
	}

	/*!
	 * \brief Fill lane dstComp of a fragment input from four per-vertex values.
	 *
	 * Each element of dst is computed by interpolateFragment() from the matching
	 * element of vtx0..vtx3 at position (x, y). Only float base types pass the check.
	 */
	template <int Stride>
	void interpolateFragmentInput (StridedValueAccess<Stride> dst, int dstComp, ConstValueAccess vtx0, ConstValueAccess vtx1, ConstValueAccess vtx2, ConstValueAccess vtx3, float x, float y)
	{
		TCU_CHECK(dst.getType().getBaseType() == VariableType::TYPE_FLOAT);

		const int elemCount = dst.getType().getNumElements();
		for (int elemNdx = 0; elemNdx < elemCount; ++elemNdx)
		{
			const tcu::Vec4 corners(vtx0.component(elemNdx).asFloat(),
									vtx1.component(elemNdx).asFloat(),
									vtx2.component(elemNdx).asFloat(),
									vtx3.component(elemNdx).asFloat());

			dst.component(elemNdx).asFloat(dstComp) = interpolateFragment(corners, x, y);
		}
	}

	// Copies lane compNdx of every element of src into the matching element of
	// dst. Only float base types pass the check.
	template <int Stride>
	void copyVarying (ValueAccess dst, ConstStridedValueAccess<Stride> src, int compNdx)
	{
		TCU_CHECK(dst.getType().getBaseType() == VariableType::TYPE_FLOAT);

		const int elemCount = dst.getType().getNumElements();
		for (int ndx = 0; ndx < elemCount; ++ndx)
		{
			dst.component(ndx).asFloat() = src.component(ndx).asFloat(compNdx);
		}
	}

	// Stores the destination buffer access and the grid size; execute() uses a
	// vertex grid one larger than the grid size in each dimension.
	ProgramExecutor::ProgramExecutor (const tcu::PixelBufferAccess& dst, int gridWidth, int gridHeight)
		: m_dst(dst), m_gridWidth(gridWidth), m_gridHeight(gridHeight)
	{
	}

	// The destructor body is empty; nothing is released explicitly here.
	ProgramExecutor::~ProgramExecutor ()
	{
	}

	// Binds a 2D texture and its sampler state to sampler index samplerNdx,
	// replacing any earlier binding for that index.
	void ProgramExecutor::setTexture (int samplerNdx, const tcu::Texture2D* texture, const tcu::Sampler& sampler)
	{
		const Sampler2D binding(texture, sampler);
		m_samplers2D[samplerNdx] = binding;
	}

	// Binds a cube texture and its sampler state to sampler index samplerNdx,
	// replacing any earlier binding for that index.
	void ProgramExecutor::setTexture (int samplerNdx, const tcu::TextureCube* texture, const tcu::Sampler& sampler)
	{
		const SamplerCube binding(texture, sampler);
		m_samplersCube[samplerNdx] = binding;
	}

	/*!
	 * \brief Indices of the four grid vertices surrounding pixel (x, y).
	 *
	 * Vertices are numbered row by row with gridVtxWidth vertices per row. The
	 * result is ordered (x0,y0), (x0+1,y0), (x0,y0+1), (x0+1,y0+1), where
	 * (x0, y0) is the cell containing the pixel. gridVtxHeight is unused.
	 *
	 * NOTE(review): the cell is picked from the pixel's integer coordinate, while
	 * computeGridCellWeights() uses the pixel center (+0.5). The two can disagree
	 * when the cell size is not an integer - confirm this is intended.
	 */
	inline tcu::IVec4 computeVertexIndices (float cellWidth, float cellHeight, int gridVtxWidth, int gridVtxHeight, int x, int y)
	{
		DE_UNREF(gridVtxHeight);
		int x0 = (int)deFloatFloor((float)x / cellWidth);
		int y0 = (int)deFloatFloor((float)y / cellHeight);
		return tcu::IVec4(y0*gridVtxWidth + x0, y0*gridVtxWidth + x0 + 1, (y0+1)*gridVtxWidth + x0, (y0+1)*gridVtxWidth + x0 + 1);
	}

	// Fractional position of the pixel center (x+0.5, y+0.5) measured in grid
	// cells of size cellWidth x cellHeight.
	inline tcu::Vec2 computeGridCellWeights (float cellWidth, float cellHeight, int x, int y)
	{
		const float fracX = deFloatFrac(((float)x + 0.5f) / cellWidth);
		const float fracY = deFloatFrac(((float)y + 0.5f) / cellHeight);
		return tcu::Vec2(fracX, fracY);
	}

	// Converts a float color to tcu::RGBA: each channel is multiplied by 255,
	// rounded with deRoundFloatToInt32() and clamped to [0, 255].
	inline tcu::RGBA toColor (tcu::Vec4 rgba)
	{
		const int red	= deClamp32(deRoundFloatToInt32(rgba.x()*255), 0, 255);
		const int green	= deClamp32(deRoundFloatToInt32(rgba.y()*255), 0, 255);
		const int blue	= deClamp32(deRoundFloatToInt32(rgba.z()*255), 0, 255);
		const int alpha	= deClamp32(deRoundFloatToInt32(rgba.w()*255), 0, 255);

		return tcu::RGBA(red, green, blue, alpha);
	}

	/*!
	 * \brief Run both shader stages and write the fragment colors to the destination buffer.
	 *
	 * The vertex shader is evaluated on a (m_gridWidth+1) x (m_gridHeight+1)
	 * vertex grid, EXEC_VEC_WIDTH vertices per packet. Every vertex output except
	 * gl_Position is stored per vertex and then interpolated for each destination
	 * pixel as fragment shader input. The fragment output with layout location 0
	 * is written out as the pixel color; TCU_CHECK fails if there is no such output.
	 *
	 * \param vertexShader		Shader executed once per vertex packet.
	 * \param fragmentShader	Shader executed once per fragment packet.
	 * \param uniformValues		Values assigned to the uniforms in both stages.
	 */
	void ProgramExecutor::execute (const Shader& vertexShader, const Shader& fragmentShader, const vector<VariableValue>& uniformValues)
	{
		int gridVtxWidth	= m_gridWidth+1;
		int gridVtxHeight	= m_gridHeight+1;
		int numVertices		= gridVtxWidth*gridVtxHeight;

		VaryingStore varyingStore(numVertices);

		// Execute vertex shader
		{
			ExecutionContext	execCtx(m_samplers2D, m_samplersCube);

			// Number of EXEC_VEC_WIDTH-wide packets needed to cover all vertices,
			// rounded up so that a trailing partial packet is included.
			int					numPackets	= numVertices/EXEC_VEC_WIDTH + ((numVertices%EXEC_VEC_WIDTH) ? 1 : 0);

			const vector<ShaderInput*>& inputs	= vertexShader.getInputs();
			vector<const Variable*>		outputs;
			vertexShader.getOutputs(outputs);

			// Set uniform values
			for (vector<VariableValue>::const_iterator uniformIter = uniformValues.begin(); uniformIter != uniformValues.end(); ++uniformIter)
				execCtx.getValue(uniformIter->getVariable()) = uniformIter->getValue().value();

			for (int packetNdx = 0; packetNdx < numPackets; packetNdx++)
			{
				// Vertex index range [packetStart, packetEnd) covered by this packet;
				// the last packet may be shorter than EXEC_VEC_WIDTH.
				int packetStart	= packetNdx*EXEC_VEC_WIDTH;
				int packetEnd	= deMin32((packetNdx+1)*EXEC_VEC_WIDTH, numVertices);

				// Compute values for vertex shader inputs
				for (vector<ShaderInput*>::const_iterator i = inputs.begin(); i != inputs.end(); ++i)
				{
					const ShaderInput*	input	= *i;
					ExecValueAccess		access	= execCtx.getValue(input->getVariable());

					for (int vtxNdx = packetStart; vtxNdx < packetEnd; vtxNdx++)
					{
						// Grid position of the vertex, normalized by the number of cells.
						int		y	= (vtxNdx/gridVtxWidth);
						int		x	= vtxNdx - y*gridVtxWidth;
						float	xf	= (float)x / (float)(gridVtxWidth-1);
						float	yf	= (float)y / (float)(gridVtxHeight-1);

						interpolateVertexInput(access, vtxNdx-packetStart, input->getValueRange(), xf, yf);
					}
				}

				// Execute vertex shader for packet
				vertexShader.execute(execCtx);

				// Store output values
				for (vector<const Variable*>::const_iterator i = outputs.begin(); i != outputs.end(); ++i)
				{
					const Variable*			output	= *i;

					if (deStringEqual(output->getName(), "gl_Position"))
						continue; // Do not store position

					ExecConstValueAccess	access	= execCtx.getValue(output);
					VaryingStorage*			dst		= varyingStore.getStorage(output->getType(), output->getName());

					for (int vtxNdx = packetStart; vtxNdx < packetEnd; vtxNdx++)
					{
						ValueAccess varyingAccess = dst->getValue(output->getType(), vtxNdx);
						copyVarying(varyingAccess, access, vtxNdx-packetStart);
					}
				}
			}
		}

		// Execute fragment shader
		{
			ExecutionContext execCtx(m_samplers2D, m_samplersCube);

			// Assign uniform values
			for (vector<VariableValue>::const_iterator i = uniformValues.begin(); i != uniformValues.end(); ++i)
				execCtx.getValue(i->getVariable()) = i->getValue().value();

			const vector<ShaderInput*>& inputs			= fragmentShader.getInputs();
			const Variable*				fragColorVar	= DE_NULL;
			vector<const Variable*>		outputs;

			// Find fragment shader output assigned to location 0. This is fragment color.
			fragmentShader.getOutputs(outputs);
			for (vector<const Variable*>::const_iterator i = outputs.begin(); i != outputs.end(); ++i)
			{
				if ((*i)->getLayoutLocation() == 0)
				{
					fragColorVar = *i;
					break;
				}
			}
			TCU_CHECK(fragColorVar);

			int width			= m_dst.getWidth();
			int height			= m_dst.getHeight();
			int numFragments	= width*height;
			int numPackets		= numFragments/EXEC_VEC_WIDTH + ((numFragments%EXEC_VEC_WIDTH) ? 1 : 0);

			// Size of one grid cell in pixels.
			float cellWidth		= (float)width	/ (float)m_gridWidth;
			float cellHeight	= (float)height	/ (float)m_gridHeight;

			for (int packetNdx = 0; packetNdx < numPackets; packetNdx++)
			{
				int packetStart	= packetNdx*EXEC_VEC_WIDTH;
				int packetEnd	= deMin32((packetNdx+1)*EXEC_VEC_WIDTH, numFragments);

				// Interpolate varyings
				for (vector<ShaderInput*>::const_iterator i = inputs.begin(); i != inputs.end(); ++i)
				{
					const ShaderInput*		input	= *i;
					ExecValueAccess			access	= execCtx.getValue(input->getVariable());
					const VariableType&		type	= input->getVariable()->getType();
					const VaryingStorage*	src		= varyingStore.getStorage(type, input->getVariable()->getName());

					// \todo [2011-03-08 pyry] Part of this could be pre-computed...
					for (int fragNdx = packetStart; fragNdx < packetEnd; fragNdx++)
					{
						// Fragments are numbered row by row across the destination.
						int y = fragNdx/width;
						int x = fragNdx - y*width;
						tcu::IVec4	vtxIndices	= computeVertexIndices(cellWidth, cellHeight, gridVtxWidth, gridVtxHeight, x, y);
						tcu::Vec2	weights		= computeGridCellWeights(cellWidth, cellHeight, x, y);

						interpolateFragmentInput(access, fragNdx-packetStart,
												 src->getValue(type, vtxIndices.x()),
												 src->getValue(type, vtxIndices.y()),
												 src->getValue(type, vtxIndices.z()),
												 src->getValue(type, vtxIndices.w()),
												 weights.x(), weights.y());
					}
				}

				// Execute fragment shader
				fragmentShader.execute(execCtx);

				// Write resulting color
				ExecConstValueAccess colorValue = execCtx.getValue(fragColorVar);
				for (int fragNdx = packetStart; fragNdx < packetEnd; fragNdx++)
				{
					int			y		= fragNdx/width;
					int			x		= fragNdx - y*width;
					int			cNdx	= fragNdx-packetStart;
					tcu::Vec4	c		= tcu::Vec4(colorValue.component(0).asFloat(cNdx),
													colorValue.component(1).asFloat(cNdx),
													colorValue.component(2).asFloat(cNdx),
													colorValue.component(3).asFloat(cNdx));

					// Rows are written in reverse vertical order.
					// \todo [2012-11-13 pyry] Reverse order.
					m_dst.setPixel(c, x, m_dst.getHeight()-y-1);
				}
			}
		}
	}

	} // rsg