~lzh/A133.git

/*-------------------------------------------------------------------------
 * drawElements Quality Program Random Shader Generator
 * ----------------------------------------------------
 *
 * Copyright 2014 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 *//*!
 * \file
 * \brief Program Executor.
 *//*--------------------------------------------------------------------*/
 
#include "rsgProgramExecutor.hpp"
#include "rsgExecutionContext.hpp"
#include "rsgVariableValue.hpp"
#include "rsgUtils.hpp"
#include "tcuSurface.hpp"
#include "deMath.h"
#include "deString.h"
 
#include <set>
#include <string>
#include <map>
 
using std::set;
using std::string;
using std::vector;
using std::map;
 
namespace rsg
{
 
// Per-vertex scalar storage for one varying. Values are kept in a single flat
// array with type.getScalarSize() scalars per vertex, vertex after vertex.
class VaryingStorage
{
public:
                            VaryingStorage        (const VariableType& type, int numVertices);
                            ~VaryingStorage        (void) {}
 
    // Access the value of vertex vtxNdx; `type` determines the per-vertex stride
    // and must be the same type the storage was created with.
    ValueAccess                getValue            (const VariableType& type, int vtxNdx);
    ConstValueAccess        getValue            (const VariableType& type, int vtxNdx) const;
 
private:
    std::vector<Scalar>        m_value;    // getScalarSize()*numVertices scalars
};
 
// Allocates room for numVertices values of the given type
// (type.getScalarSize() scalars per vertex).
VaryingStorage::VaryingStorage (const VariableType& type, int numVertices)
    : m_value(type.getScalarSize()*numVertices)
{
}
 
ValueAccess VaryingStorage::getValue (const VariableType& type, int vtxNdx)
{
    return ValueAccess(type, &m_value[type.getScalarSize()*vtxNdx]);
}
 
ConstValueAccess VaryingStorage::getValue (const VariableType& type, int vtxNdx) const
{
    return ConstValueAccess(type, &m_value[type.getScalarSize()*vtxNdx]);
}
 
class VaryingStore
{
public:
                            VaryingStore        (int numVertices);
                            ~VaryingStore        (void);
 
    VaryingStorage*            getStorage            (const VariableType& type, const char* name);
 
private:
    int                                            m_numVertices;
    std::map<std::string, VaryingStorage*>        m_values;
};
 
// Creates an empty store; numVertices is the vertex count used to size every
// storage created later by getStorage().
VaryingStore::VaryingStore (int numVertices)
    : m_numVertices(numVertices)
{
}
 
// Releases every storage owned by the store and empties the map.
VaryingStore::~VaryingStore (void)
{
    typedef map<string, VaryingStorage*>::iterator StorageIter;

    for (StorageIter entry = m_values.begin(); entry != m_values.end(); ++entry)
    {
        VaryingStorage* const owned = entry->second;
        delete owned;
    }

    m_values.clear();
}
 
// Returns the storage registered under `name`, creating it on first use.
//
// type  Type of the varying; only used when a new storage has to be allocated.
// name  Varying name used as the map key.
//
// The returned pointer stays owned by the store. A newly created storage is
// sized for m_numVertices values of `type`.
VaryingStorage* VaryingStore::getStorage (const VariableType& type, const char* name)
{
    // operator[] value-initializes a missing entry to a null pointer. Binding a
    // reference to the slot lets us fill it in without a second lookup (and
    // without building the std::string key a second time).
    VaryingStorage*& slot = m_values[name];

    if (!slot)
        slot = new VaryingStorage(type, m_numVertices);

    return slot;
}
 
inline float interpolateVertexQuad (const tcu::Vec4& quad, float x, float y)
{
    float w00 = (1.0f-x)*(1.0f-y);
    float w01 = (1.0f-x)*y;
    float w10 = x*(1.0f-y);
    float w11 = x*y;
    return quad.x()*w00 + quad.y()*w10 + quad.z()*w01 + quad.w()*w11;
}
 
inline float interpolateVertex (float x0y0, float x1y1, float x, float y)
{
    return interpolateVertexQuad(tcu::Vec4(x0y0, (x0y0+x1y1)*0.5f, (x0y0+x1y1)*0.5f, x1y1), x, y);
}
 
// Linear interpolation over a triangle: starts from v0 and adds the v0->v1
// difference scaled by x and the v0->v2 difference scaled by y.
inline float interpolateTri (float v0, float v1, float v2, float x, float y)
{
    const float alongX = (v1-v0)*x;
    const float alongY = (v2-v0)*y;

    return (v0 + alongX) + alongY;
}
 
inline float interpolateFragment (const tcu::Vec4& quad, float x, float y)
{
    if (x + y < 1.0f)
        return interpolateTri(quad.x(), quad.y(), quad.z(), x, y);
    else
        return interpolateTri(quad.w(), quad.z(), quad.y(), 1.0f-x, 1.0f-y);
}
 
template <int Stride>
void interpolateVertexInput (StridedValueAccess<Stride> dst, int dstComp, const ConstValueRangeAccess valueRange, float x, float y)
{
    TCU_CHECK(valueRange.getType().getBaseType() == VariableType::TYPE_FLOAT);
    int numElements = valueRange.getType().getNumElements();
    for (int elementNdx = 0; elementNdx < numElements; elementNdx++)
    {
        float xd, yd;
        getVertexInterpolationCoords(xd, yd, x, y, elementNdx);
        dst.component(elementNdx).asFloat(dstComp) = interpolateVertex(valueRange.getMin().component(elementNdx).asFloat(), valueRange.getMax().component(elementNdx).asFloat(), xd, yd);
    }
}
 
template <int Stride>
void interpolateFragmentInput (StridedValueAccess<Stride> dst, int dstComp, ConstValueAccess vtx0, ConstValueAccess vtx1, ConstValueAccess vtx2, ConstValueAccess vtx3, float x, float y)
{
    TCU_CHECK(dst.getType().getBaseType() == VariableType::TYPE_FLOAT);
    int numElements = dst.getType().getNumElements();
    for (int ndx = 0; ndx < numElements; ndx++)
        dst.component(ndx).asFloat(dstComp) = interpolateFragment(tcu::Vec4(vtx0.component(ndx).asFloat(), vtx1.component(ndx).asFloat(), vtx2.component(ndx).asFloat(), vtx3.component(ndx).asFloat()), x, y);
}
 
template <int Stride>
void copyVarying (ValueAccess dst, ConstStridedValueAccess<Stride> src, int compNdx)
{
    TCU_CHECK(dst.getType().getBaseType() == VariableType::TYPE_FLOAT);
    for (int elemNdx = 0; elemNdx < dst.getType().getNumElements(); elemNdx++)
        dst.component(elemNdx).asFloat() = src.component(elemNdx).asFloat(compNdx);
}
 
// Stores the destination pixel buffer and the grid dimensions. execute()
// runs the vertex shader on a (gridWidth+1) x (gridHeight+1) vertex grid and
// writes one pixel of dst per fragment.
ProgramExecutor::ProgramExecutor (const tcu::PixelBufferAccess& dst, int gridWidth, int gridHeight)
    : m_dst            (dst)
    , m_gridWidth    (gridWidth)
    , m_gridHeight    (gridHeight)
{
}
 
// Nothing to release explicitly here.
ProgramExecutor::~ProgramExecutor (void)
{
}
 
void ProgramExecutor::setTexture (int samplerNdx, const tcu::Texture2D* texture, const tcu::Sampler& sampler)
{
    m_samplers2D[samplerNdx] = Sampler2D(texture, sampler);
}
 
void ProgramExecutor::setTexture (int samplerNdx, const tcu::TextureCube* texture, const tcu::Sampler& sampler)
{
    m_samplersCube[samplerNdx] = SamplerCube(texture, sampler);
}
 
inline tcu::IVec4 computeVertexIndices (float cellWidth, float cellHeight, int gridVtxWidth, int gridVtxHeight, int x, int y)
{
    DE_UNREF(gridVtxHeight);
    int x0 = (int)deFloatFloor((float)x / cellWidth);
    int y0 = (int)deFloatFloor((float)y / cellHeight);
    return tcu::IVec4(y0*gridVtxWidth + x0, y0*gridVtxWidth + x0 + 1, (y0+1)*gridVtxWidth + x0, (y0+1)*gridVtxWidth + x0 + 1);
}
 
inline tcu::Vec2 computeGridCellWeights (float cellWidth, float cellHeight, int x, int y)
{
    float gx = ((float)x + 0.5f) / cellWidth;
    float gy = ((float)y + 0.5f) / cellHeight;
    return tcu::Vec2(deFloatFrac(gx), deFloatFrac(gy));
}
 
inline tcu::RGBA toColor (tcu::Vec4 rgba)
{
    return tcu::RGBA(deClamp32(deRoundFloatToInt32(rgba.x()*255), 0, 255),
                     deClamp32(deRoundFloatToInt32(rgba.y()*255), 0, 255),
                     deClamp32(deRoundFloatToInt32(rgba.z()*255), 0, 255),
                     deClamp32(deRoundFloatToInt32(rgba.w()*255), 0, 255));
}
 
void ProgramExecutor::execute (const Shader& vertexShader, const Shader& fragmentShader, const vector<VariableValue>& uniformValues)
{
    int    gridVtxWidth    = m_gridWidth+1;
    int gridVtxHeight    = m_gridHeight+1;
    int numVertices        = gridVtxWidth*gridVtxHeight;
 
    VaryingStore varyingStore(numVertices);
 
    // Execute vertex shader
    {
        ExecutionContext    execCtx(m_samplers2D, m_samplersCube);
        int                    numPackets    = numVertices + ((numVertices%EXEC_VEC_WIDTH) ? 1 : 0);
 
        const vector<ShaderInput*>& inputs    = vertexShader.getInputs();
        vector<const Variable*>        outputs;
        vertexShader.getOutputs(outputs);
 
        // Set uniform values
        for (vector<VariableValue>::const_iterator uniformIter = uniformValues.begin(); uniformIter != uniformValues.end(); uniformIter++)
            execCtx.getValue(uniformIter->getVariable()) = uniformIter->getValue().value();
 
        for (int packetNdx = 0; packetNdx < numPackets; packetNdx++)
        {
            int packetStart    = packetNdx*EXEC_VEC_WIDTH;
            int packetEnd    = deMin32((packetNdx+1)*EXEC_VEC_WIDTH, numVertices);
 
            // Compute values for vertex shader inputs
            for (vector<ShaderInput*>::const_iterator i = inputs.begin(); i != inputs.end(); i++)
            {
                const ShaderInput*    input    = *i;
                ExecValueAccess        access    = execCtx.getValue(input->getVariable());
 
                for (int vtxNdx = packetStart; vtxNdx < packetEnd; vtxNdx++)
                {
                    int        y    = (vtxNdx/gridVtxWidth);
                    int        x    = vtxNdx - y*gridVtxWidth;
                    float    xf    = (float)x / (float)(gridVtxWidth-1);
                    float    yf    = (float)y / (float)(gridVtxHeight-1);
 
                    interpolateVertexInput(access, vtxNdx-packetStart, input->getValueRange(), xf, yf);
                }
            }
 
            // Execute vertex shader for packet
            vertexShader.execute(execCtx);
 
            // Store output values
            for (vector<const Variable*>::const_iterator i = outputs.begin(); i != outputs.end(); i++)
            {
                const Variable*            output    = *i;
 
                if (deStringEqual(output->getName(), "gl_Position"))
                    continue; // Do not store position
 
                ExecConstValueAccess    access    = execCtx.getValue(output);
                VaryingStorage*            dst        = varyingStore.getStorage(output->getType(), output->getName());
 
                for (int vtxNdx = packetStart; vtxNdx < packetEnd; vtxNdx++)
                {
                    ValueAccess varyingAccess = dst->getValue(output->getType(), vtxNdx);
                    copyVarying(varyingAccess, access, vtxNdx-packetStart);
                }
            }
        }
    }
 
    // Execute fragment shader
    {
        ExecutionContext execCtx(m_samplers2D, m_samplersCube);
 
        // Assign uniform values
        for (vector<VariableValue>::const_iterator i = uniformValues.begin(); i != uniformValues.end(); i++)
            execCtx.getValue(i->getVariable()) = i->getValue().value();
 
        const vector<ShaderInput*>& inputs            = fragmentShader.getInputs();
        const Variable*                fragColorVar    = DE_NULL;
        vector<const Variable*>        outputs;
 
        // Find fragment shader output assigned to location 0. This is fragment color.
        fragmentShader.getOutputs(outputs);
        for (vector<const Variable*>::const_iterator i = outputs.begin(); i != outputs.end(); i++)
        {
            if ((*i)->getLayoutLocation() == 0)
            {
                fragColorVar = *i;
                break;
            }
        }
        TCU_CHECK(fragColorVar);
 
        int    width        = m_dst.getWidth();
        int height        = m_dst.getHeight();
        int numPackets    = (width*height)/EXEC_VEC_WIDTH + (((width*height)%EXEC_VEC_WIDTH) ? 1 : 0);
 
        float cellWidth        = (float)width    / (float)m_gridWidth;
        float cellHeight    = (float)height    / (float)m_gridHeight;
 
        for (int packetNdx = 0; packetNdx < numPackets; packetNdx++)
        {
            int packetStart    = packetNdx*EXEC_VEC_WIDTH;
            int packetEnd    = deMin32((packetNdx+1)*EXEC_VEC_WIDTH, width*height);
 
            // Interpolate varyings
            for (vector<ShaderInput*>::const_iterator i = inputs.begin(); i != inputs.end(); i++)
            {
                const ShaderInput*        input    = *i;
                ExecValueAccess            access    = execCtx.getValue(input->getVariable());
                const VariableType&        type    = input->getVariable()->getType();
                const VaryingStorage*    src        = varyingStore.getStorage(type, input->getVariable()->getName());
 
                // \todo [2011-03-08 pyry] Part of this could be pre-computed...
                for (int fragNdx = packetStart; fragNdx < packetEnd; fragNdx++)
                {
                    int y = fragNdx/width;
                    int x = fragNdx - y*width;
                    tcu::IVec4    vtxIndices    = computeVertexIndices(cellWidth, cellHeight, gridVtxWidth, gridVtxHeight, x, y);
                    tcu::Vec2    weights        = computeGridCellWeights(cellWidth, cellHeight, x, y);
 
                    interpolateFragmentInput(access, fragNdx-packetStart,
                                             src->getValue(type, vtxIndices.x()),
                                             src->getValue(type, vtxIndices.y()),
                                             src->getValue(type, vtxIndices.z()),
                                             src->getValue(type, vtxIndices.w()),
                                             weights.x(), weights.y());
                }
            }
 
            // Execute fragment shader
            fragmentShader.execute(execCtx);
 
            // Write resulting color
            ExecConstValueAccess colorValue = execCtx.getValue(fragColorVar);
            for (int fragNdx = packetStart; fragNdx < packetEnd; fragNdx++)
            {
                int            y        = fragNdx/width;
                int            x        = fragNdx - y*width;
                int            cNdx    = fragNdx-packetStart;
                tcu::Vec4    c        = tcu::Vec4(colorValue.component(0).asFloat(cNdx),
                                                colorValue.component(1).asFloat(cNdx),
                                                colorValue.component(2).asFloat(cNdx),
                                                colorValue.component(3).asFloat(cNdx));
 
                // \todo [2012-11-13 pyry] Reverse order.
                m_dst.setPixel(c, x, m_dst.getHeight()-y-1);
            }
        }
    }
}
 
} // rsg