~lzh/A133.git

/*-------------------------------------------------------------------------
 * drawElements Quality Program OpenGL (ES) Module
 * -----------------------------------------------
 *
 * Copyright 2014 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 *//*!
 * \file
 * \brief Calibration tools.
 *//*--------------------------------------------------------------------*/
 
#include "glsCalibration.hpp"
#include "tcuTestLog.hpp"
#include "tcuVectorUtil.hpp"
#include "deStringUtil.hpp"
#include "deMath.h"
#include "deClock.h"
 
#include <algorithm>
#include <limits>
 
using std::string;
using std::vector;
using tcu::Vec2;
using tcu::TestLog;
using tcu::TestNode;
using namespace glu;
 
namespace deqp
{
namespace gls
{
 
// Reorders input arbitrarily, linear complexity and no allocations
template<typename T>
float destructiveMedian (vector<T>& data)
{
    const typename vector<T>::iterator mid = data.begin()+data.size()/2;
 
    std::nth_element(data.begin(), mid, data.end());
 
    if (data.size()%2 == 0) // Even number of elements, need average of two centermost elements
        return (*mid + *std::max_element(data.begin(), mid))*0.5f; // Data is partially sorted around mid, mid is half an item after center
    else
        return *mid;
}
 
LineParameters theilSenLinearRegression (const std::vector<tcu::Vec2>& dataPoints)
{
    const float        epsilon                    = 1e-6f;
 
    const int        numDataPoints            = (int)dataPoints.size();
    vector<float>    pairwiseCoefficients;
    vector<float>    pointwiseOffsets;
    LineParameters    result                    (0.0f, 0.0f);
 
    // Compute the pairwise coefficients.
    for (int i = 0; i < numDataPoints; i++)
    {
        const Vec2& ptA = dataPoints[i];
 
        for (int j = 0; j < i; j++)
        {
            const Vec2& ptB = dataPoints[j];
 
            if (de::abs(ptA.x() - ptB.x()) > epsilon)
                pairwiseCoefficients.push_back((ptA.y() - ptB.y()) / (ptA.x() - ptB.x()));
        }
    }
 
    // Find the median of the pairwise coefficients.
    // \note If there are no data point pairs with differing x values, the coefficient variable will stay zero as initialized.
    if (!pairwiseCoefficients.empty())
        result.coefficient = destructiveMedian(pairwiseCoefficients);
 
    // Compute the offsets corresponding to the median coefficient, for all data points.
    for (int i = 0; i < numDataPoints; i++)
        pointwiseOffsets.push_back(dataPoints[i].y() - result.coefficient*dataPoints[i].x());
 
    // Find the median of the offsets.
    // \note If there are no data points, the offset variable will stay zero as initialized.
    if (!pointwiseOffsets.empty())
        result.offset = destructiveMedian(pointwiseOffsets);
 
    return result;
}
 
// Sample from given values using linear interpolation at a given position as if values were laid to range [0, 1]
template <typename T>
static float linearSample (const std::vector<T>& values, float position)
{
    DE_ASSERT(position >= 0.0f);
    DE_ASSERT(position <= 1.0f);
 
    const int    maxNdx                = (int)values.size() - 1;
    const float    floatNdx            = (float)maxNdx * position;
    const int    lowerNdx            = (int)deFloatFloor(floatNdx);
    const int    higherNdx            = lowerNdx + (lowerNdx == maxNdx ? 0 : 1); // Use only last element if position is 1.0
    const float    interpolationFactor = floatNdx - (float)lowerNdx;
 
    DE_ASSERT(lowerNdx >= 0 && lowerNdx < (int)values.size());
    DE_ASSERT(higherNdx >= 0 && higherNdx < (int)values.size());
    DE_ASSERT(interpolationFactor >= 0 && interpolationFactor < 1.0f);
 
    return tcu::mix((float)values[lowerNdx], (float)values[higherNdx], interpolationFactor);
}
 
LineParametersWithConfidence theilSenSiegelLinearRegression (const std::vector<tcu::Vec2>& dataPoints, float reportedConfidence)
{
    DE_ASSERT(!dataPoints.empty());
 
    // Siegel's variation
 
    const float                        epsilon                = 1e-6f;
    const int                        numDataPoints        = (int)dataPoints.size();
    std::vector<float>                medianSlopes;
    std::vector<float>                pointwiseOffsets;
    LineParametersWithConfidence    result;
 
    // Compute the median slope via each element
    for (int i = 0; i < numDataPoints; i++)
    {
        const tcu::Vec2&    ptA        = dataPoints[i];
        std::vector<float>    slopes;
 
        slopes.reserve(numDataPoints);
 
        for (int j = 0; j < numDataPoints; j++)
        {
            const tcu::Vec2& ptB = dataPoints[j];
 
            if (de::abs(ptA.x() - ptB.x()) > epsilon)
                slopes.push_back((ptA.y() - ptB.y()) / (ptA.x() - ptB.x()));
        }
 
        // Add median of slopes through point i
        medianSlopes.push_back(destructiveMedian(slopes));
    }
 
    DE_ASSERT(!medianSlopes.empty());
 
    // Find the median of the pairwise coefficients.
    std::sort(medianSlopes.begin(), medianSlopes.end());
    result.coefficient = linearSample(medianSlopes, 0.5f);
 
    // Compute the offsets corresponding to the median coefficient, for all data points.
    for (int i = 0; i < numDataPoints; i++)
        pointwiseOffsets.push_back(dataPoints[i].y() - result.coefficient*dataPoints[i].x());
 
    // Find the median of the offsets.
    std::sort(pointwiseOffsets.begin(), pointwiseOffsets.end());
    result.offset = linearSample(pointwiseOffsets, 0.5f);
 
    // calculate confidence intervals
    result.coefficientConfidenceLower = linearSample(medianSlopes, 0.5f - reportedConfidence*0.5f);
    result.coefficientConfidenceUpper = linearSample(medianSlopes, 0.5f + reportedConfidence*0.5f);
 
    result.offsetConfidenceLower = linearSample(pointwiseOffsets, 0.5f - reportedConfidence*0.5f);
    result.offsetConfidenceUpper = linearSample(pointwiseOffsets, 0.5f + reportedConfidence*0.5f);
 
    result.confidence = reportedConfidence;
 
    return result;
}
 
bool MeasureState::isDone (void) const
{
    return (int)frameTimes.size() >= maxNumFrames || (frameTimes.size() >= 2 &&
                                                      frameTimes[frameTimes.size()-2] >= (deUint64)frameShortcutTime &&
                                                      frameTimes[frameTimes.size()-1] >= (deUint64)frameShortcutTime);
}
 
deUint64 MeasureState::getTotalTime (void) const
{
    deUint64 time = 0;
    for (int i = 0; i < (int)frameTimes.size(); i++)
        time += frameTimes[i];
    return time;
}
 
void MeasureState::clear (void)
{
    maxNumFrames        = 0;
    frameShortcutTime    = std::numeric_limits<float>::infinity();
    numDrawCalls        = 0;
    frameTimes.clear();
}
 
void MeasureState::start (int maxNumFrames_, float frameShortcutTime_, int numDrawCalls_)
{
    frameTimes.clear();
    frameTimes.reserve(maxNumFrames_);
    maxNumFrames        = maxNumFrames_;
    frameShortcutTime    = frameShortcutTime_;
    numDrawCalls        = numDrawCalls_;
}
 
TheilSenCalibrator::TheilSenCalibrator (void)
    : m_params    (1 /* initial calls */, 10 /* calibrate iter frames */, 2000.0f /* calibrate iter shortcut threshold */, 31 /* max calibration iterations */,
                 1000.0f/30.0f /* target frame time */, 1000.0f/60.0f /* frame time cap */, 1000.0f /* target measure duration */)
    , m_state    (INTERNALSTATE_LAST)
{
    clear();
}
 
TheilSenCalibrator::TheilSenCalibrator (const CalibratorParameters& params)
    : m_params    (params)
    , m_state    (INTERNALSTATE_LAST)
{
    clear();
}
 
TheilSenCalibrator::~TheilSenCalibrator()
{
}
 
void TheilSenCalibrator::clear (void)
{
    m_measureState.clear();
    m_calibrateIterations.clear();
    m_state = INTERNALSTATE_CALIBRATING;
}
 
void TheilSenCalibrator::clear (const CalibratorParameters& params)
{
    m_params = params;
    clear();
}
 
TheilSenCalibrator::State TheilSenCalibrator::getState (void) const
{
    if (m_state == INTERNALSTATE_FINISHED)
        return STATE_FINISHED;
    else
    {
        DE_ASSERT(m_state == INTERNALSTATE_CALIBRATING || !m_measureState.isDone());
        return m_measureState.isDone() ? STATE_RECOMPUTE_PARAMS : STATE_MEASURE;
    }
}
 
void TheilSenCalibrator::recordIteration (deUint64 iterationTime)
{
    DE_ASSERT((m_state == INTERNALSTATE_CALIBRATING || m_state == INTERNALSTATE_RUNNING) && !m_measureState.isDone());
    m_measureState.frameTimes.push_back(iterationTime);
 
    if (m_state == INTERNALSTATE_RUNNING && m_measureState.isDone())
        m_state = INTERNALSTATE_FINISHED;
}
 
void TheilSenCalibrator::recomputeParameters (void)
{
    DE_ASSERT(m_state == INTERNALSTATE_CALIBRATING);
    DE_ASSERT(m_measureState.isDone());
 
    // Minimum and maximum acceptable frame times.
    const float        minGoodFrameTimeUs    = m_params.targetFrameTimeUs * 0.95f;
    const float        maxGoodFrameTimeUs    = m_params.targetFrameTimeUs * 1.15f;
 
    const int        numIterations        = (int)m_calibrateIterations.size();
 
    // Record frame time.
    if (numIterations > 0)
    {
        m_calibrateIterations.back().frameTime = (float)((double)m_measureState.getTotalTime() / (double)m_measureState.frameTimes.size());
 
        // Check if we're good enough to stop calibrating.
        {
            bool endCalibration = false;
 
            // Is the maximum calibration iteration limit reached?
            endCalibration = endCalibration || (int)m_calibrateIterations.size() >= m_params.maxCalibrateIterations;
 
            // Do a few past iterations have frame time in acceptable range?
            {
                const int numRelevantPastIterations = 2;
 
                if (!endCalibration && (int)m_calibrateIterations.size() >= numRelevantPastIterations)
                {
                    const CalibrateIteration* const        past            = &m_calibrateIterations[m_calibrateIterations.size() - numRelevantPastIterations];
                    bool                                allInGoodRange    = true;
 
                    for (int i = 0; i < numRelevantPastIterations && allInGoodRange; i++)
                    {
                        const float frameTimeUs = past[i].frameTime;
                        if (!de::inRange(frameTimeUs, minGoodFrameTimeUs, maxGoodFrameTimeUs))
                            allInGoodRange = false;
                    }
 
                    endCalibration = endCalibration || allInGoodRange;
                }
            }
 
            // Do a few past iterations have similar-enough call counts?
            {
                const int numRelevantPastIterations = 3;
                if (!endCalibration && (int)m_calibrateIterations.size() >= numRelevantPastIterations)
                {
                    const CalibrateIteration* const        past            = &m_calibrateIterations[m_calibrateIterations.size() - numRelevantPastIterations];
                    int                                    minCallCount    = std::numeric_limits<int>::max();
                    int                                    maxCallCount    = std::numeric_limits<int>::min();
 
                    for (int i = 0; i < numRelevantPastIterations; i++)
                    {
                        minCallCount = de::min(minCallCount, past[i].numDrawCalls);
                        maxCallCount = de::max(maxCallCount, past[i].numDrawCalls);
                    }
 
                    if ((float)(maxCallCount - minCallCount) <= (float)minCallCount * 0.1f)
                        endCalibration = true;
                }
            }
 
            // Is call count just 1, and frame time still way too high?
            endCalibration = endCalibration || (m_calibrateIterations.back().numDrawCalls == 1 && m_calibrateIterations.back().frameTime > m_params.targetFrameTimeUs*2.0f);
 
            if (endCalibration)
            {
                const int    minFrames            = 10;
                const int    maxFrames            = 60;
                int            numMeasureFrames    = deClamp32(deRoundFloatToInt32(m_params.targetMeasureDurationUs / m_calibrateIterations.back().frameTime), minFrames, maxFrames);
 
                m_state = INTERNALSTATE_RUNNING;
                m_measureState.start(numMeasureFrames, m_params.calibrateIterationShortcutThreshold, m_calibrateIterations.back().numDrawCalls);
                return;
            }
        }
    }
 
    DE_ASSERT(m_state == INTERNALSTATE_CALIBRATING);
 
    // Estimate new call count.
    {
        int newCallCount;
 
        if (numIterations == 0)
            newCallCount = m_params.numInitialCalls;
        else
        {
            vector<Vec2> dataPoints;
            for (int i = 0; i < numIterations; i++)
            {
                if (m_calibrateIterations[i].numDrawCalls == 1 || m_calibrateIterations[i].frameTime > m_params.frameTimeCapUs*1.05f) // Only account for measurements not too near the cap.
                    dataPoints.push_back(Vec2((float)m_calibrateIterations[i].numDrawCalls, m_calibrateIterations[i].frameTime));
            }
 
            if (numIterations == 1)
                dataPoints.push_back(Vec2(0.0f, 0.0f)); // If there's just one measurement so far, this will help in getting the next estimate.
 
            {
                const float                targetFrameTimeUs    = m_params.targetFrameTimeUs;
                const float                coeffEpsilon        = 0.001f; // Coefficient must be large enough (and positive) to be considered sensible.
 
                const LineParameters    estimatorLine        = theilSenLinearRegression(dataPoints);
 
                int                        prevMaxCalls        = 0;
 
                // Find the maximum of the past call counts.
                for (int i = 0; i < numIterations; i++)
                    prevMaxCalls = de::max(prevMaxCalls, m_calibrateIterations[i].numDrawCalls);
 
                if (estimatorLine.coefficient < coeffEpsilon) // Coefficient not good for sensible estimation; increase call count enough to get a reasonably different value.
                    newCallCount = 2*prevMaxCalls;
                else
                {
                    // Solve newCallCount such that approximately targetFrameTime = offset + coefficient*newCallCount.
                    newCallCount = (int)((targetFrameTimeUs - estimatorLine.offset) / estimatorLine.coefficient + 0.5f);
 
                    // We should generally prefer FPS counts below the target rather than above (i.e. higher frame times rather than lower).
                    if (estimatorLine.offset + estimatorLine.coefficient*(float)newCallCount < minGoodFrameTimeUs)
                        newCallCount++;
                }
 
                // Make sure we have at least minimum amount of calls, and don't allow increasing call count too much in one iteration.
                newCallCount = de::clamp(newCallCount, 1, prevMaxCalls*10);
            }
        }
 
        m_measureState.start(m_params.maxCalibrateIterationFrames, m_params.calibrateIterationShortcutThreshold, newCallCount);
        m_calibrateIterations.push_back(CalibrateIteration(newCallCount, 0.0f));
    }
}
 
void logCalibrationInfo (tcu::TestLog& log, const TheilSenCalibrator& calibrator)
{
    const CalibratorParameters&                params                = calibrator.getParameters();
    const std::vector<CalibrateIteration>&    calibrateIterations    = calibrator.getCalibrationInfo();
 
    // Write out default calibration info.
 
    log << TestLog::Section("CalibrationInfo", "Calibration Info")
        << TestLog::Message  << "Target frame time: " << params.targetFrameTimeUs << " us (" << 1000000 / params.targetFrameTimeUs << " fps)" << TestLog::EndMessage;
 
    for (int iterNdx = 0; iterNdx < (int)calibrateIterations.size(); iterNdx++)
    {
        log << TestLog::Message << "  iteration " << iterNdx << ": " << calibrateIterations[iterNdx].numDrawCalls << " calls => "
                                << de::floatToString(calibrateIterations[iterNdx].frameTime, 2) << " us ("
                                << de::floatToString(1000000.0f / calibrateIterations[iterNdx].frameTime, 2) << " fps)" << TestLog::EndMessage;
    }
    log << TestLog::Integer("CallCount",    "Calibrated call count",    "",    QP_KEY_TAG_NONE, calibrator.getMeasureState().numDrawCalls)
        << TestLog::Integer("FrameCount",    "Calibrated frame count",    "", QP_KEY_TAG_NONE, (int)calibrator.getMeasureState().frameTimes.size());
    log << TestLog::EndSection;
}
 
} // gls
} // deqp