/*-------------------------------------------------------------------------
 * drawElements Quality Program OpenGL (ES) Module
 * -----------------------------------------------
 *
 * Copyright 2014 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 *//*!
 * \file
 * \brief Calibration tools.
 *//*--------------------------------------------------------------------*/

#include "glsCalibration.hpp"
#include "tcuTestLog.hpp"
#include "tcuVectorUtil.hpp"
#include "deStringUtil.hpp"
#include "deMath.h"
#include "deClock.h"

#include <algorithm>
#include <limits>

using std::string;
using std::vector;
using tcu::Vec2;
using tcu::TestLog;
using tcu::TestNode;
using namespace glu;

namespace deqp
{
namespace gls
{

// Returns the median of data as a float.
//
// Reorders input arbitrarily (std::nth_element is applied in place), so the
// caller must not rely on the element order afterwards. No extra storage is
// allocated by this function itself.
//
// For an even number of elements the result is the average of the two
// centermost elements.
//
// \note data must not be empty: the median is read through an iterator that
//       would be end() for an empty vector.
template<typename T>
float destructiveMedian (vector<T>& data)
{
    DE_ASSERT(!data.empty());

    const typename vector<T>::iterator mid = data.begin()+data.size()/2;

    std::nth_element(data.begin(), mid, data.end());

    if (data.size()%2 == 0) // Even number of elements, need average of two centermost elements
        return (*mid + *std::max_element(data.begin(), mid))*0.5f; // Data is partially sorted around mid, mid is half an item after center
    else
        return *mid;
}

// Fits a line y = offset + coefficient*x to dataPoints using the median of
// pairwise slopes and the median of the resulting per-point offsets.
//
// Pairs whose x values differ by at most epsilon are ignored. With no usable
// pair the coefficient is 0; with no data points the offset is 0 as well.
LineParameters theilSenLinearRegression (const std::vector<tcu::Vec2>& dataPoints)
{
    const float     epsilon         = 1e-6f;

    const int       numDataPoints   = (int)dataPoints.size();
    vector<float>   pairwiseCoefficients;
    vector<float>   pointwiseOffsets;
    LineParameters  result          (0.0f, 0.0f);

    // Compute the pairwise coefficients.
    for (int i = 0; i < numDataPoints; i++)
    {
        const Vec2& ptA = dataPoints[i];

        for (int j = 0; j < i; j++)
        {
            const Vec2& ptB = dataPoints[j];

            if (de::abs(ptA.x() - ptB.x()) > epsilon)
                pairwiseCoefficients.push_back((ptA.y() - ptB.y()) / (ptA.x() - ptB.x()));
        }
    }

    // Find the median of the pairwise coefficients.
    // \note If there are no data point pairs with differing x values, the coefficient variable will stay zero as initialized.
    if (!pairwiseCoefficients.empty())
        result.coefficient = destructiveMedian(pairwiseCoefficients);

    // Compute the offsets corresponding to the median coefficient, for all data points.
    for (int i = 0; i < numDataPoints; i++)
        pointwiseOffsets.push_back(dataPoints[i].y() - result.coefficient*dataPoints[i].x());

    // Find the median of the offsets.
    // \note If there are no data points, the offset variable will stay zero as initialized.
    if (!pointwiseOffsets.empty())
        result.offset = destructiveMedian(pointwiseOffsets);

    return result;
}

// Sample from given values using linear interpolation at a given position as if values were laid to range [0, 1]
//
// \note values must be non-empty and position must be within [0, 1]; both are
//       only checked with DE_ASSERT.
template <typename T>
static float linearSample (const std::vector<T>& values, float position)
{
    DE_ASSERT(position >= 0.0f);
    DE_ASSERT(position <= 1.0f);

    const int   maxNdx              = (int)values.size() - 1;
    const float floatNdx            = (float)maxNdx * position;
    const int   lowerNdx            = (int)deFloatFloor(floatNdx);
    const int   higherNdx           = lowerNdx + (lowerNdx == maxNdx ? 0 : 1); // Use only last element if position is 1.0
    const float interpolationFactor = floatNdx - (float)lowerNdx;

    DE_ASSERT(lowerNdx >= 0 && lowerNdx < (int)values.size());
    DE_ASSERT(higherNdx >= 0 && higherNdx < (int)values.size());
    DE_ASSERT(interpolationFactor >= 0 && interpolationFactor < 1.0f);

    return tcu::mix((float)values[lowerNdx], (float)values[higherNdx], interpolationFactor);
}

// Fits a line to dataPoints using Siegel's variation: for every point the
// median of the slopes to all other points is taken, and the final
// coefficient is the median of those per-point medians. The offset is the
// median of the per-point offsets for that coefficient.
//
// The confidence bounds are sampled from the sorted per-point slopes and
// offsets at positions 0.5 -/+ reportedConfidence*0.5, so
// reportedConfidence is expected to lie within [0, 1].
//
// \note dataPoints must not be empty.
// \note Points that have no partner with a differing x value (beyond epsilon)
//       contribute no slope. If no point has a usable slope, e.g. with a
//       single data point, the coefficient and its confidence bounds are
//       zero instead of taking the median of an empty set.
LineParametersWithConfidence theilSenSiegelLinearRegression (const std::vector<tcu::Vec2>& dataPoints, float reportedConfidence)
{
    DE_ASSERT(!dataPoints.empty());

    // Siegel's variation

    const float                     epsilon         = 1e-6f;
    const int                       numDataPoints   = (int)dataPoints.size();
    std::vector<float>              medianSlopes;
    std::vector<float>              pointwiseOffsets;
    LineParametersWithConfidence    result;

    // Compute the median slope via each element
    for (int i = 0; i < numDataPoints; i++)
    {
        const tcu::Vec2&    ptA     = dataPoints[i];
        std::vector<float>  slopes;

        slopes.reserve(numDataPoints);

        for (int j = 0; j < numDataPoints; j++)
        {
            const tcu::Vec2& ptB = dataPoints[j];

            if (de::abs(ptA.x() - ptB.x()) > epsilon)
                slopes.push_back((ptA.y() - ptB.y()) / (ptA.x() - ptB.x()));
        }

        // Add median of slopes through point i.
        // \note The median of an empty set is undefined, so points without any usable slope are skipped.
        if (!slopes.empty())
            medianSlopes.push_back(destructiveMedian(slopes));
    }

    if (medianSlopes.empty())
    {
        // No pair of points with differing x values: fall back to a zero coefficient.
        result.coefficient                  = 0.0f;
        result.coefficientConfidenceLower   = 0.0f;
        result.coefficientConfidenceUpper   = 0.0f;
    }
    else
    {
        // Find the median of the pairwise coefficients.
        std::sort(medianSlopes.begin(), medianSlopes.end());
        result.coefficient                  = linearSample(medianSlopes, 0.5f);

        // calculate confidence intervals
        result.coefficientConfidenceLower   = linearSample(medianSlopes, 0.5f - reportedConfidence*0.5f);
        result.coefficientConfidenceUpper   = linearSample(medianSlopes, 0.5f + reportedConfidence*0.5f);
    }

    // Compute the offsets corresponding to the median coefficient, for all data points.
    for (int i = 0; i < numDataPoints; i++)
        pointwiseOffsets.push_back(dataPoints[i].y() - result.coefficient*dataPoints[i].x());

    // Find the median of the offsets.
    std::sort(pointwiseOffsets.begin(), pointwiseOffsets.end());
    result.offset = linearSample(pointwiseOffsets, 0.5f);

    // calculate confidence intervals
    result.offsetConfidenceLower = linearSample(pointwiseOffsets, 0.5f - reportedConfidence*0.5f);
    result.offsetConfidenceUpper = linearSample(pointwiseOffsets, 0.5f + reportedConfidence*0.5f);

    result.confidence = reportedConfidence;

    return result;
}

// Returns true once maxNumFrames frame times have been recorded, or when the
// two most recent frame times both reached frameShortcutTime.
bool MeasureState::isDone (void) const
{
    return (int)frameTimes.size() >= maxNumFrames || (frameTimes.size() >= 2 &&
                                                      frameTimes[frameTimes.size()-2] >= (deUint64)frameShortcutTime &&
                                                      frameTimes[frameTimes.size()-1] >= (deUint64)frameShortcutTime);
}

// Returns the sum of all recorded frame times.
deUint64 MeasureState::getTotalTime (void) const
{
    deUint64 time = 0;
    for (int i = 0; i < (int)frameTimes.size(); i++)
        time += frameTimes[i];
    return time;
}

// Resets the state: no frames allowed, no draw calls, no recorded frame times.
// \note With maxNumFrames at zero, isDone() returns true before it ever reads frameShortcutTime.
void MeasureState::clear (void)
{
    maxNumFrames        = 0;
    frameShortcutTime   = std::numeric_limits<float>::infinity();
    numDrawCalls        = 0;
    frameTimes.clear();
}

// Begins a new measurement with the given limits and draw call count,
// discarding previously recorded frame times.
void MeasureState::start (int maxNumFrames_, float frameShortcutTime_, int numDrawCalls_)
{
    frameTimes.clear();
    frameTimes.reserve(maxNumFrames_);
    maxNumFrames        = maxNumFrames_;
    frameShortcutTime   = frameShortcutTime_;
    numDrawCalls        = numDrawCalls_;
}

// Constructs a calibrator with built-in default parameters.
// NOTE(review): the target frame time and frame time cap defaults are 1000/30 and 1000/60,
// while the corresponding fields read elsewhere in this file carry a "Us" suffix -
// confirm the intended units against CalibratorParameters.
TheilSenCalibrator::TheilSenCalibrator (void)
    : m_params  (1 /* initial calls */, 10 /* calibrate iter frames */, 2000.0f /* calibrate iter shortcut threshold */, 31 /* max calibration iterations */,
                 1000.0f/30.0f /* target frame time */, 1000.0f/60.0f /* frame time cap */, 1000.0f /* target measure duration */)
    , m_state   (INTERNALSTATE_LAST)
{
    clear();
}

// Constructs a calibrator with caller-provided parameters.
TheilSenCalibrator::TheilSenCalibrator (const CalibratorParameters& params)
    : m_params  (params)
    , m_state   (INTERNALSTATE_LAST)
{
    clear();
}

TheilSenCalibrator::~TheilSenCalibrator()
{
}

// Drops all measurement and calibration history and returns to the calibrating state.
void TheilSenCalibrator::clear (void)
{
    m_measureState.clear();
    m_calibrateIterations.clear();
    m_state = INTERNALSTATE_CALIBRATING;
}

// Replaces the parameters and then resets the calibrator.
void TheilSenCalibrator::clear (const CalibratorParameters& params)
{
    m_params = params;
    clear();
}

// Maps the internal state to the public state: finished, or - depending on
// whether the current measurement is done - recompute-params or measure.
TheilSenCalibrator::State TheilSenCalibrator::getState (void) const
{
    if (m_state == INTERNALSTATE_FINISHED)
        return STATE_FINISHED;
    else
    {
        DE_ASSERT(m_state == INTERNALSTATE_CALIBRATING || !m_measureState.isDone());
        return m_measureState.isDone() ? STATE_RECOMPUTE_PARAMS : STATE_MEASURE;
    }
}

// Records one frame time for the current measurement. When the final
// (running) measurement becomes done, the calibrator moves to the finished state.
void TheilSenCalibrator::recordIteration (deUint64 iterationTime)
{
    DE_ASSERT((m_state == INTERNALSTATE_CALIBRATING || m_state == INTERNALSTATE_RUNNING) && !m_measureState.isDone());
    m_measureState.frameTimes.push_back(iterationTime);

    if (m_state == INTERNALSTATE_RUNNING && m_measureState.isDone())
        m_state = INTERNALSTATE_FINISHED;
}

// Called after a calibration measurement is done. Stores the average frame
// time of the latest iteration, then either ends calibration (switching to
// the running state and starting the final measurement) or estimates a new
// draw call count and starts the next calibration measurement.
void TheilSenCalibrator::recomputeParameters (void)
{
    DE_ASSERT(m_state == INTERNALSTATE_CALIBRATING);
    DE_ASSERT(m_measureState.isDone());

    // Minimum and maximum acceptable frame times.
    const float     minGoodFrameTimeUs  = m_params.targetFrameTimeUs * 0.95f;
    const float     maxGoodFrameTimeUs  = m_params.targetFrameTimeUs * 1.15f;

    const int       numIterations       = (int)m_calibrateIterations.size();

    // Record frame time.
    if (numIterations > 0)
    {
        m_calibrateIterations.back().frameTime = (float)((double)m_measureState.getTotalTime() / (double)m_measureState.frameTimes.size());

        // Check if we're good enough to stop calibrating.
        {
            bool endCalibration = false;

            // Is the maximum calibration iteration limit reached?
            endCalibration = endCalibration || (int)m_calibrateIterations.size() >= m_params.maxCalibrateIterations;

            // Do a few past iterations have frame time in acceptable range?
            {
                const int numRelevantPastIterations = 2;

                if (!endCalibration && (int)m_calibrateIterations.size() >= numRelevantPastIterations)
                {
                    const CalibrateIteration* const past            = &m_calibrateIterations[m_calibrateIterations.size() - numRelevantPastIterations];
                    bool                            allInGoodRange  = true;

                    for (int i = 0; i < numRelevantPastIterations && allInGoodRange; i++)
                    {
                        const float frameTimeUs = past[i].frameTime;
                        if (!de::inRange(frameTimeUs, minGoodFrameTimeUs, maxGoodFrameTimeUs))
                            allInGoodRange = false;
                    }

                    endCalibration = endCalibration || allInGoodRange;
                }
            }

            // Do a few past iterations have similar-enough call counts?
            {
                const int numRelevantPastIterations = 3;

                if (!endCalibration && (int)m_calibrateIterations.size() >= numRelevantPastIterations)
                {
                    const CalibrateIteration* const past            = &m_calibrateIterations[m_calibrateIterations.size() - numRelevantPastIterations];
                    int                             minCallCount    = std::numeric_limits<int>::max();
                    int                             maxCallCount    = std::numeric_limits<int>::min();

                    for (int i = 0; i < numRelevantPastIterations; i++)
                    {
                        minCallCount = de::min(minCallCount, past[i].numDrawCalls);
                        maxCallCount = de::max(maxCallCount, past[i].numDrawCalls);
                    }

                    if ((float)(maxCallCount - minCallCount) <= (float)minCallCount * 0.1f)
                        endCalibration = true;
                }
            }

            // Is call count just 1, and frame time still way too high?
            endCalibration = endCalibration || (m_calibrateIterations.back().numDrawCalls == 1 && m_calibrateIterations.back().frameTime > m_params.targetFrameTimeUs*2.0f);

            if (endCalibration)
            {
                const int   minFrames           = 10;
                const int   maxFrames           = 60;
                int         numMeasureFrames    = deClamp32(deRoundFloatToInt32(m_params.targetMeasureDurationUs / m_calibrateIterations.back().frameTime), minFrames, maxFrames);

                m_state = INTERNALSTATE_RUNNING;
                m_measureState.start(numMeasureFrames, m_params.calibrateIterationShortcutThreshold, m_calibrateIterations.back().numDrawCalls);
                return;
            }
        }
    }

    DE_ASSERT(m_state == INTERNALSTATE_CALIBRATING);

    // Estimate new call count.
    {
        int newCallCount;

        if (numIterations == 0)
            newCallCount = m_params.numInitialCalls;
        else
        {
            vector<Vec2> dataPoints;
            for (int i = 0; i < numIterations; i++)
            {
                if (m_calibrateIterations[i].numDrawCalls == 1 || m_calibrateIterations[i].frameTime > m_params.frameTimeCapUs*1.05f) // Only account for measurements not too near the cap.
                    dataPoints.push_back(Vec2((float)m_calibrateIterations[i].numDrawCalls, m_calibrateIterations[i].frameTime));
            }

            if (numIterations == 1)
                dataPoints.push_back(Vec2(0.0f, 0.0f)); // If there's just one measurement so far, this will help in getting the next estimate.

            {
                const float             targetFrameTimeUs   = m_params.targetFrameTimeUs;
                const float             coeffEpsilon        = 0.001f; // Coefficient must be large enough (and positive) to be considered sensible.

                const LineParameters    estimatorLine       = theilSenLinearRegression(dataPoints);

                int                     prevMaxCalls        = 0;

                // Find the maximum of the past call counts.
                for (int i = 0; i < numIterations; i++)
                    prevMaxCalls = de::max(prevMaxCalls, m_calibrateIterations[i].numDrawCalls);

                if (estimatorLine.coefficient < coeffEpsilon) // Coefficient not good for sensible estimation; increase call count enough to get a reasonably different value.
                    newCallCount = 2*prevMaxCalls;
                else
                {
                    // Solve newCallCount such that approximately targetFrameTime = offset + coefficient*newCallCount.
                    newCallCount = (int)((targetFrameTimeUs - estimatorLine.offset) / estimatorLine.coefficient + 0.5f);

                    // We should generally prefer FPS counts below the target rather than above (i.e. higher frame times rather than lower).
                    if (estimatorLine.offset + estimatorLine.coefficient*(float)newCallCount < minGoodFrameTimeUs)
                        newCallCount++;
                }

                // Make sure we have at least minimum amount of calls, and don't allow increasing call count too much in one iteration.
                newCallCount = de::clamp(newCallCount, 1, prevMaxCalls*10);
            }
        }

        m_measureState.start(m_params.maxCalibrateIterationFrames, m_params.calibrateIterationShortcutThreshold, newCallCount);
        m_calibrateIterations.push_back(CalibrateIteration(newCallCount, 0.0f));
    }
}

// Writes a "CalibrationInfo" log section: the target frame time, one message
// per calibration iteration (call count and frame time), and the calibrated
// call and frame counts taken from the calibrator's measure state.
void logCalibrationInfo (tcu::TestLog& log, const TheilSenCalibrator& calibrator)
{
    const CalibratorParameters&             params              = calibrator.getParameters();
    const std::vector<CalibrateIteration>&  calibrateIterations = calibrator.getCalibrationInfo();

    // Write out default calibration info.

    log << TestLog::Section("CalibrationInfo", "Calibration Info")
        << TestLog::Message << "Target frame time: " << params.targetFrameTimeUs << " us (" << 1000000 / params.targetFrameTimeUs << " fps)" << TestLog::EndMessage;

    for (int iterNdx = 0; iterNdx < (int)calibrateIterations.size(); iterNdx++)
    {
        log << TestLog::Message << " iteration " << iterNdx << ": " << calibrateIterations[iterNdx].numDrawCalls << " calls => "
                                << de::floatToString(calibrateIterations[iterNdx].frameTime, 2) << " us ("
                                << de::floatToString(1000000.0f / calibrateIterations[iterNdx].frameTime, 2) << " fps)" << TestLog::EndMessage;
    }
    log << TestLog::Integer("CallCount",    "Calibrated call count",    "", QP_KEY_TAG_NONE, calibrator.getMeasureState().numDrawCalls)
        << TestLog::Integer("FrameCount",   "Calibrated frame count",   "", QP_KEY_TAG_NONE, (int)calibrator.getMeasureState().frameTimes.size());
    log << TestLog::EndSection;
}

} // gls
} // deqp