1 /****************************************************************************
2 * Copyright (C) 2014-2015 Intel Corporation.   All Rights Reserved.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 *
23 * @file state.h
24 *
25 * @brief Definitions for API state - complex function implementation.
26 *
27 ******************************************************************************/
28 #pragma once
29 
30 #include "core/state.h"
31 #include "common/simdintrin.h"
32 
33 
34 template <typename MaskT>
expandThenBlend4(uint32_t * min,uint32_t * max)35 INLINE __m128i SWR_MULTISAMPLE_POS::expandThenBlend4(uint32_t* min, uint32_t* max)
36 {
37     __m128i vMin = _mm_set1_epi32(*min);
38     __m128i vMax = _mm_set1_epi32(*max);
39     return _simd_blend4_epi32<MaskT::value>(vMin, vMax);
40 }
41 
PrecalcSampleData(int numSamples)42 INLINE void SWR_MULTISAMPLE_POS::PrecalcSampleData(int numSamples)
43 {
44     for(int i = 0; i < numSamples; i++)
45     {
46         _vXi[i] = _mm_set1_epi32(_xi[i]);
47         _vYi[i] = _mm_set1_epi32(_yi[i]);
48         _vX[i] = _simd_set1_ps(_x[i]);
49         _vY[i] = _simd_set1_ps(_y[i]);
50     }
51     // precalculate the raster tile BB for the rasterizer.
52     CalcTileSampleOffsets(numSamples);
53 }
54 
CalcTileSampleOffsets(int numSamples)55 INLINE void SWR_MULTISAMPLE_POS::CalcTileSampleOffsets(int numSamples)
56 {
57     auto minXi = std::min_element(std::begin(_xi), &_xi[numSamples]);
58     auto maxXi = std::max_element(std::begin(_xi), &_xi[numSamples]);
59     using xMask = std::integral_constant<int, 0xA>;
60     // BR(max),    BL(min),    UR(max),    UL(min)
61     tileSampleOffsetsX = expandThenBlend4<xMask>(minXi, maxXi);
62 
63     auto minYi = std::min_element(std::begin(_yi), &_yi[numSamples]);
64     auto maxYi = std::max_element(std::begin(_yi), &_yi[numSamples]);
65     using yMask = std::integral_constant<int, 0xC>;
66     // BR(max),    BL(min),    UR(max),    UL(min)
67     tileSampleOffsetsY = expandThenBlend4<yMask>(minYi, maxYi);
68 };
69