1 /*-------------------------------------------------------------------------
2 * drawElements Quality Program OpenGL ES 3.1 Module
3 * -------------------------------------------------
4 *
5 * Copyright 2014 The Android Open Source Project
6 *
7 * Licensed under the Apache License, Version 2.0 (the "License");
8 * you may not use this file except in compliance with the License.
9 * You may obtain a copy of the License at
10 *
11 * http://www.apache.org/licenses/LICENSE-2.0
12 *
13 * Unless required by applicable law or agreed to in writing, software
14 * distributed under the License is distributed on an "AS IS" BASIS,
15 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
16 * See the License for the specific language governing permissions and
17 * limitations under the License.
18 *
19 *//*!
20 * \file
21 * \brief Floating-point packing and unpacking function tests.
22 *//*--------------------------------------------------------------------*/
23
24 #include "es31fShaderPackingFunctionTests.hpp"
25 #include "glsShaderExecUtil.hpp"
26 #include "tcuTestLog.hpp"
27 #include "tcuFormatUtil.hpp"
28 #include "tcuFloat.hpp"
29 #include "deRandom.hpp"
30 #include "deMath.h"
31 #include "deString.h"
32
33 namespace deqp
34 {
35 namespace gles31
36 {
37 namespace Functional
38 {
39
40 using std::string;
41 using tcu::TestLog;
42 using namespace gls::ShaderExecUtil;
43
44 namespace
45 {
46
getUlpDiff(float a,float b)47 inline deUint32 getUlpDiff (float a, float b)
48 {
49 const deUint32 aBits = tcu::Float32(a).bits();
50 const deUint32 bBits = tcu::Float32(b).bits();
51 return aBits > bBits ? aBits - bBits : bBits - aBits;
52 }
53
54 struct HexFloat
55 {
56 const float value;
HexFloatdeqp::gles31::Functional::__anon20eac2120111::HexFloat57 HexFloat (const float value_) : value(value_) {}
58 };
59
operator <<(std::ostream & str,const HexFloat & v)60 std::ostream& operator<< (std::ostream& str, const HexFloat& v)
61 {
62 return str << v.value << " / " << tcu::toHex(tcu::Float32(v.value).bits());
63 }
64
65 } // anonymous
66
67 // ShaderPackingFunctionCase
68
69 class ShaderPackingFunctionCase : public TestCase
70 {
71 public:
72 ShaderPackingFunctionCase (Context& context, const char* name, const char* description, glu::ShaderType shaderType);
73 ~ShaderPackingFunctionCase (void);
74
75 void init (void);
76 void deinit (void);
77
78 protected:
79 glu::ShaderType m_shaderType;
80 ShaderSpec m_spec;
81 ShaderExecutor* m_executor;
82
83 private:
84 ShaderPackingFunctionCase (const ShaderPackingFunctionCase& other);
85 ShaderPackingFunctionCase& operator= (const ShaderPackingFunctionCase& other);
86 };
87
ShaderPackingFunctionCase(Context & context,const char * name,const char * description,glu::ShaderType shaderType)88 ShaderPackingFunctionCase::ShaderPackingFunctionCase (Context& context, const char* name, const char* description, glu::ShaderType shaderType)
89 : TestCase (context, name, description)
90 , m_shaderType (shaderType)
91 , m_executor (DE_NULL)
92 {
93 m_spec.version = glu::GLSL_VERSION_310_ES;
94 }
95
~ShaderPackingFunctionCase(void)96 ShaderPackingFunctionCase::~ShaderPackingFunctionCase (void)
97 {
98 ShaderPackingFunctionCase::deinit();
99 }
100
init(void)101 void ShaderPackingFunctionCase::init (void)
102 {
103 DE_ASSERT(!m_executor);
104
105 m_executor = createExecutor(m_context.getRenderContext(), m_shaderType, m_spec);
106 m_testCtx.getLog() << m_executor;
107
108 if (!m_executor->isOk())
109 throw tcu::TestError("Compile failed");
110 }
111
deinit(void)112 void ShaderPackingFunctionCase::deinit (void)
113 {
114 delete m_executor;
115 m_executor = DE_NULL;
116 }
117
118 // Test cases
119
getPrecisionPostfix(glu::Precision precision)120 static const char* getPrecisionPostfix (glu::Precision precision)
121 {
122 static const char* s_postfix[] =
123 {
124 "_lowp",
125 "_mediump",
126 "_highp"
127 };
128 DE_STATIC_ASSERT(DE_LENGTH_OF_ARRAY(s_postfix) == glu::PRECISION_LAST);
129 DE_ASSERT(de::inBounds<int>(precision, 0, DE_LENGTH_OF_ARRAY(s_postfix)));
130 return s_postfix[precision];
131 }
132
getShaderTypePostfix(glu::ShaderType shaderType)133 static const char* getShaderTypePostfix (glu::ShaderType shaderType)
134 {
135 static const char* s_postfix[] =
136 {
137 "_vertex",
138 "_fragment",
139 "_geometry",
140 "_tess_control",
141 "_tess_eval",
142 "_compute"
143 };
144 DE_ASSERT(de::inBounds<int>(shaderType, 0, DE_LENGTH_OF_ARRAY(s_postfix)));
145 return s_postfix[shaderType];
146 }
147
148 class PackSnorm2x16Case : public ShaderPackingFunctionCase
149 {
150 public:
PackSnorm2x16Case(Context & context,glu::ShaderType shaderType,glu::Precision precision)151 PackSnorm2x16Case (Context& context, glu::ShaderType shaderType, glu::Precision precision)
152 : ShaderPackingFunctionCase (context, (string("packsnorm2x16") + getPrecisionPostfix(precision) + getShaderTypePostfix(shaderType)).c_str(), "packSnorm2x16", shaderType)
153 , m_precision (precision)
154 {
155 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_FLOAT_VEC2, precision)));
156 m_spec.outputs.push_back(Symbol("out0", glu::VarType(glu::TYPE_UINT, glu::PRECISION_HIGHP)));
157
158 m_spec.source = "out0 = packSnorm2x16(in0);";
159 }
160
iterate(void)161 IterateResult iterate (void)
162 {
163 de::Random rnd (deStringHash(getName()) ^ 0x776002);
164 std::vector<tcu::Vec2> inputs;
165 std::vector<deUint32> outputs;
166 const int maxDiff = m_precision == glu::PRECISION_HIGHP ? 1 : // Rounding only.
167 m_precision == glu::PRECISION_MEDIUMP ? 33 : // (2^-10) * (2^15) + 1
168 m_precision == glu::PRECISION_LOWP ? 129 : 0; // (2^-8) * (2^15) + 1
169
170 // Special values to check.
171 inputs.push_back(tcu::Vec2(0.0f, 0.0f));
172 inputs.push_back(tcu::Vec2(-1.0f, 1.0f));
173 inputs.push_back(tcu::Vec2(0.5f, -0.5f));
174 inputs.push_back(tcu::Vec2(-1.5f, 1.5f));
175 inputs.push_back(tcu::Vec2(0.25f, -0.75f));
176
177 // Random values, mostly in range.
178 for (int ndx = 0; ndx < 15; ndx++)
179 {
180 const float x = rnd.getFloat()*2.5f - 1.25f;
181 const float y = rnd.getFloat()*2.5f - 1.25f;
182 inputs.push_back(tcu::Vec2(x, y));
183 }
184
185 // Large random values.
186 for (int ndx = 0; ndx < 80; ndx++)
187 {
188 const float x = rnd.getFloat()*1e6f - 0.5e6f;
189 const float y = rnd.getFloat()*1e6f - 0.5e6f;
190 inputs.push_back(tcu::Vec2(x, y));
191 }
192
193 outputs.resize(inputs.size());
194
195 m_testCtx.getLog() << TestLog::Message << "Executing shader for " << inputs.size() << " input values" << tcu::TestLog::EndMessage;
196
197 {
198 const void* in = &inputs[0];
199 void* out = &outputs[0];
200
201 m_executor->useProgram();
202 m_executor->execute((int)inputs.size(), &in, &out);
203 }
204
205 // Verify
206 {
207 const int numValues = (int)inputs.size();
208 const int maxPrints = 10;
209 int numFailed = 0;
210
211 for (int valNdx = 0; valNdx < numValues; valNdx++)
212 {
213 const deUint16 ref0 = (deUint16)de::clamp(deRoundFloatToInt32(de::clamp(inputs[valNdx].x(), -1.0f, 1.0f) * 32767.0f), -(1<<15), (1<<15)-1);
214 const deUint16 ref1 = (deUint16)de::clamp(deRoundFloatToInt32(de::clamp(inputs[valNdx].y(), -1.0f, 1.0f) * 32767.0f), -(1<<15), (1<<15)-1);
215 const deUint32 ref = (ref1 << 16) | ref0;
216 const deUint32 res = outputs[valNdx];
217 const deUint16 res0 = (deUint16)(res & 0xffff);
218 const deUint16 res1 = (deUint16)(res >> 16);
219 const int diff0 = de::abs((int)ref0 - (int)res0);
220 const int diff1 = de::abs((int)ref1 - (int)res1);
221
222 if (diff0 > maxDiff || diff1 > maxDiff)
223 {
224 if (numFailed < maxPrints)
225 {
226 m_testCtx.getLog() << TestLog::Message << "ERROR: Mismatch in value " << valNdx
227 << ", expected packSnorm2x16(" << inputs[valNdx] << ") = " << tcu::toHex(ref)
228 << ", got " << tcu::toHex(res)
229 << "\n diffs = (" << diff0 << ", " << diff1 << "), max diff = " << maxDiff
230 << TestLog::EndMessage;
231 }
232 else if (numFailed == maxPrints)
233 m_testCtx.getLog() << TestLog::Message << "..." << TestLog::EndMessage;
234
235 numFailed += 1;
236 }
237 }
238
239 m_testCtx.getLog() << TestLog::Message << (numValues - numFailed) << " / " << numValues << " values passed" << TestLog::EndMessage;
240
241 m_testCtx.setTestResult(numFailed == 0 ? QP_TEST_RESULT_PASS : QP_TEST_RESULT_FAIL,
242 numFailed == 0 ? "Pass" : "Result comparison failed");
243 }
244
245 return STOP;
246 }
247
248 private:
249 glu::Precision m_precision;
250 };
251
252 class UnpackSnorm2x16Case : public ShaderPackingFunctionCase
253 {
254 public:
UnpackSnorm2x16Case(Context & context,glu::ShaderType shaderType)255 UnpackSnorm2x16Case (Context& context, glu::ShaderType shaderType)
256 : ShaderPackingFunctionCase(context, (string("unpacksnorm2x16") + getShaderTypePostfix(shaderType)).c_str(), "unpackSnorm2x16", shaderType)
257 {
258 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_UINT, glu::PRECISION_HIGHP)));
259 m_spec.outputs.push_back(Symbol("out0", glu::VarType(glu::TYPE_FLOAT_VEC2, glu::PRECISION_HIGHP)));
260
261 m_spec.source = "out0 = unpackSnorm2x16(in0);";
262 }
263
iterate(void)264 IterateResult iterate (void)
265 {
266 const deUint32 maxDiff = 1; // Rounding error.
267 de::Random rnd (deStringHash(getName()) ^ 0x776002);
268 std::vector<deUint32> inputs;
269 std::vector<tcu::Vec2> outputs;
270
271 inputs.push_back(0x00000000u);
272 inputs.push_back(0x7fff8000u);
273 inputs.push_back(0x80007fffu);
274 inputs.push_back(0xffffffffu);
275 inputs.push_back(0x0001fffeu);
276
277 // Random values.
278 for (int ndx = 0; ndx < 95; ndx++)
279 inputs.push_back(rnd.getUint32());
280
281 outputs.resize(inputs.size());
282
283 m_testCtx.getLog() << TestLog::Message << "Executing shader for " << inputs.size() << " input values" << tcu::TestLog::EndMessage;
284
285 {
286 const void* in = &inputs[0];
287 void* out = &outputs[0];
288
289 m_executor->useProgram();
290 m_executor->execute((int)inputs.size(), &in, &out);
291 }
292
293 // Verify
294 {
295 const int numValues = (int)inputs.size();
296 const int maxPrints = 10;
297 int numFailed = 0;
298
299 for (int valNdx = 0; valNdx < (int)inputs.size(); valNdx++)
300 {
301 const deInt16 in0 = (deInt16)(deUint16)(inputs[valNdx] & 0xffff);
302 const deInt16 in1 = (deInt16)(deUint16)(inputs[valNdx] >> 16);
303 const float ref0 = de::clamp(float(in0) / 32767.f, -1.0f, 1.0f);
304 const float ref1 = de::clamp(float(in1) / 32767.f, -1.0f, 1.0f);
305 const float res0 = outputs[valNdx].x();
306 const float res1 = outputs[valNdx].y();
307
308 const deUint32 diff0 = getUlpDiff(ref0, res0);
309 const deUint32 diff1 = getUlpDiff(ref1, res1);
310
311 if (diff0 > maxDiff || diff1 > maxDiff)
312 {
313 if (numFailed < maxPrints)
314 {
315 m_testCtx.getLog() << TestLog::Message << "ERROR: Mismatch in value " << valNdx << ",\n"
316 << " expected unpackSnorm2x16(" << tcu::toHex(inputs[valNdx]) << ") = "
317 << "vec2(" << HexFloat(ref0) << ", " << HexFloat(ref1) << ")"
318 << ", got vec2(" << HexFloat(res0) << ", " << HexFloat(res1) << ")"
319 << "\n ULP diffs = (" << diff0 << ", " << diff1 << "), max diff = " << maxDiff
320 << TestLog::EndMessage;
321 }
322 else if (numFailed == maxPrints)
323 m_testCtx.getLog() << TestLog::Message << "..." << TestLog::EndMessage;
324
325 numFailed += 1;
326 }
327 }
328
329 m_testCtx.getLog() << TestLog::Message << (numValues - numFailed) << " / " << numValues << " values passed" << TestLog::EndMessage;
330
331 m_testCtx.setTestResult(numFailed == 0 ? QP_TEST_RESULT_PASS : QP_TEST_RESULT_FAIL,
332 numFailed == 0 ? "Pass" : "Result comparison failed");
333 }
334
335 return STOP;
336 }
337 };
338
339 class PackUnorm2x16Case : public ShaderPackingFunctionCase
340 {
341 public:
PackUnorm2x16Case(Context & context,glu::ShaderType shaderType,glu::Precision precision)342 PackUnorm2x16Case (Context& context, glu::ShaderType shaderType, glu::Precision precision)
343 : ShaderPackingFunctionCase (context, (string("packunorm2x16") + getPrecisionPostfix(precision) + getShaderTypePostfix(shaderType)).c_str(), "packUnorm2x16", shaderType)
344 , m_precision (precision)
345 {
346 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_FLOAT_VEC2, precision)));
347 m_spec.outputs.push_back(Symbol("out0", glu::VarType(glu::TYPE_UINT, glu::PRECISION_HIGHP)));
348
349 m_spec.source = "out0 = packUnorm2x16(in0);";
350 }
351
iterate(void)352 IterateResult iterate (void)
353 {
354 de::Random rnd (deStringHash(getName()) ^ 0x776002);
355 std::vector<tcu::Vec2> inputs;
356 std::vector<deUint32> outputs;
357 const int maxDiff = m_precision == glu::PRECISION_HIGHP ? 1 : // Rounding only.
358 m_precision == glu::PRECISION_MEDIUMP ? 65 : // (2^-10) * (2^16) + 1
359 m_precision == glu::PRECISION_LOWP ? 257 : 0; // (2^-8) * (2^16) + 1
360
361 // Special values to check.
362 inputs.push_back(tcu::Vec2(0.0f, 0.0f));
363 inputs.push_back(tcu::Vec2(0.5f, 1.0f));
364 inputs.push_back(tcu::Vec2(1.0f, 0.5f));
365 inputs.push_back(tcu::Vec2(-0.5f, 1.5f));
366 inputs.push_back(tcu::Vec2(0.25f, 0.75f));
367
368 // Random values, mostly in range.
369 for (int ndx = 0; ndx < 15; ndx++)
370 {
371 const float x = rnd.getFloat()*1.25f;
372 const float y = rnd.getFloat()*1.25f;
373 inputs.push_back(tcu::Vec2(x, y));
374 }
375
376 // Large random values.
377 for (int ndx = 0; ndx < 80; ndx++)
378 {
379 const float x = rnd.getFloat()*1e6f - 1e5f;
380 const float y = rnd.getFloat()*1e6f - 1e5f;
381 inputs.push_back(tcu::Vec2(x, y));
382 }
383
384 outputs.resize(inputs.size());
385
386 m_testCtx.getLog() << TestLog::Message << "Executing shader for " << inputs.size() << " input values" << tcu::TestLog::EndMessage;
387
388 {
389 const void* in = &inputs[0];
390 void* out = &outputs[0];
391
392 m_executor->useProgram();
393 m_executor->execute((int)inputs.size(), &in, &out);
394 }
395
396 // Verify
397 {
398 const int numValues = (int)inputs.size();
399 const int maxPrints = 10;
400 int numFailed = 0;
401
402 for (int valNdx = 0; valNdx < (int)inputs.size(); valNdx++)
403 {
404 const deUint16 ref0 = (deUint16)de::clamp(deRoundFloatToInt32(de::clamp(inputs[valNdx].x(), 0.0f, 1.0f) * 65535.0f), 0, (1<<16)-1);
405 const deUint16 ref1 = (deUint16)de::clamp(deRoundFloatToInt32(de::clamp(inputs[valNdx].y(), 0.0f, 1.0f) * 65535.0f), 0, (1<<16)-1);
406 const deUint32 ref = (ref1 << 16) | ref0;
407 const deUint32 res = outputs[valNdx];
408 const deUint16 res0 = (deUint16)(res & 0xffff);
409 const deUint16 res1 = (deUint16)(res >> 16);
410 const int diff0 = de::abs((int)ref0 - (int)res0);
411 const int diff1 = de::abs((int)ref1 - (int)res1);
412
413 if (diff0 > maxDiff || diff1 > maxDiff)
414 {
415 if (numFailed < maxPrints)
416 {
417 m_testCtx.getLog() << TestLog::Message << "ERROR: Mismatch in value " << valNdx
418 << ", expected packUnorm2x16(" << inputs[valNdx] << ") = " << tcu::toHex(ref)
419 << ", got " << tcu::toHex(res)
420 << "\n diffs = (" << diff0 << ", " << diff1 << "), max diff = " << maxDiff
421 << TestLog::EndMessage;
422 }
423 else if (numFailed == maxPrints)
424 m_testCtx.getLog() << TestLog::Message << "..." << TestLog::EndMessage;
425
426 numFailed += 1;
427 }
428 }
429
430 m_testCtx.getLog() << TestLog::Message << (numValues - numFailed) << " / " << numValues << " values passed" << TestLog::EndMessage;
431
432 m_testCtx.setTestResult(numFailed == 0 ? QP_TEST_RESULT_PASS : QP_TEST_RESULT_FAIL,
433 numFailed == 0 ? "Pass" : "Result comparison failed");
434 }
435
436 return STOP;
437 }
438
439 private:
440 glu::Precision m_precision;
441 };
442
443 class UnpackUnorm2x16Case : public ShaderPackingFunctionCase
444 {
445 public:
UnpackUnorm2x16Case(Context & context,glu::ShaderType shaderType)446 UnpackUnorm2x16Case (Context& context, glu::ShaderType shaderType)
447 : ShaderPackingFunctionCase(context, (string("unpackunorm2x16") + getShaderTypePostfix(shaderType)).c_str(), "unpackUnorm2x16", shaderType)
448 {
449 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_UINT, glu::PRECISION_HIGHP)));
450 m_spec.outputs.push_back(Symbol("out0", glu::VarType(glu::TYPE_FLOAT_VEC2, glu::PRECISION_HIGHP)));
451
452 m_spec.source = "out0 = unpackUnorm2x16(in0);";
453 }
454
iterate(void)455 IterateResult iterate (void)
456 {
457 const deUint32 maxDiff = 1; // Rounding error.
458 de::Random rnd (deStringHash(getName()) ^ 0x776002);
459 std::vector<deUint32> inputs;
460 std::vector<tcu::Vec2> outputs;
461
462 inputs.push_back(0x00000000u);
463 inputs.push_back(0x7fff8000u);
464 inputs.push_back(0x80007fffu);
465 inputs.push_back(0xffffffffu);
466 inputs.push_back(0x0001fffeu);
467
468 // Random values.
469 for (int ndx = 0; ndx < 95; ndx++)
470 inputs.push_back(rnd.getUint32());
471
472 outputs.resize(inputs.size());
473
474 m_testCtx.getLog() << TestLog::Message << "Executing shader for " << inputs.size() << " input values" << tcu::TestLog::EndMessage;
475
476 {
477 const void* in = &inputs[0];
478 void* out = &outputs[0];
479
480 m_executor->useProgram();
481 m_executor->execute((int)inputs.size(), &in, &out);
482 }
483
484 // Verify
485 {
486 const int numValues = (int)inputs.size();
487 const int maxPrints = 10;
488 int numFailed = 0;
489
490 for (int valNdx = 0; valNdx < (int)inputs.size(); valNdx++)
491 {
492 const deUint16 in0 = (deUint16)(inputs[valNdx] & 0xffff);
493 const deUint16 in1 = (deUint16)(inputs[valNdx] >> 16);
494 const float ref0 = float(in0) / 65535.0f;
495 const float ref1 = float(in1) / 65535.0f;
496 const float res0 = outputs[valNdx].x();
497 const float res1 = outputs[valNdx].y();
498
499 const deUint32 diff0 = getUlpDiff(ref0, res0);
500 const deUint32 diff1 = getUlpDiff(ref1, res1);
501
502 if (diff0 > maxDiff || diff1 > maxDiff)
503 {
504 if (numFailed < maxPrints)
505 {
506 m_testCtx.getLog() << TestLog::Message << "ERROR: Mismatch in value " << valNdx << ",\n"
507 << " expected unpackUnorm2x16(" << tcu::toHex(inputs[valNdx]) << ") = "
508 << "vec2(" << HexFloat(ref0) << ", " << HexFloat(ref1) << ")"
509 << ", got vec2(" << HexFloat(res0) << ", " << HexFloat(res1) << ")"
510 << "\n ULP diffs = (" << diff0 << ", " << diff1 << "), max diff = " << maxDiff
511 << TestLog::EndMessage;
512 }
513 else if (numFailed == maxPrints)
514 m_testCtx.getLog() << TestLog::Message << "..." << TestLog::EndMessage;
515
516 numFailed += 1;
517 }
518 }
519
520 m_testCtx.getLog() << TestLog::Message << (numValues - numFailed) << " / " << numValues << " values passed" << TestLog::EndMessage;
521
522 m_testCtx.setTestResult(numFailed == 0 ? QP_TEST_RESULT_PASS : QP_TEST_RESULT_FAIL,
523 numFailed == 0 ? "Pass" : "Result comparison failed");
524 }
525
526 return STOP;
527 }
528 };
529
530 class PackHalf2x16Case : public ShaderPackingFunctionCase
531 {
532 public:
PackHalf2x16Case(Context & context,glu::ShaderType shaderType)533 PackHalf2x16Case (Context& context, glu::ShaderType shaderType)
534 : ShaderPackingFunctionCase(context, (string("packhalf2x16") + getShaderTypePostfix(shaderType)).c_str(), "packHalf2x16", shaderType)
535 {
536 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_FLOAT_VEC2, glu::PRECISION_HIGHP)));
537 m_spec.outputs.push_back(Symbol("out0", glu::VarType(glu::TYPE_UINT, glu::PRECISION_HIGHP)));
538
539 m_spec.source = "out0 = packHalf2x16(in0);";
540 }
541
iterate(void)542 IterateResult iterate (void)
543 {
544 const int maxDiff = 0; // Values can be represented exactly in mediump.
545 de::Random rnd (deStringHash(getName()) ^ 0x776002);
546 std::vector<tcu::Vec2> inputs;
547 std::vector<deUint32> outputs;
548
549 // Special values to check.
550 inputs.push_back(tcu::Vec2(0.0f, 0.0f));
551 inputs.push_back(tcu::Vec2(0.5f, 1.0f));
552 inputs.push_back(tcu::Vec2(1.0f, 0.5f));
553 inputs.push_back(tcu::Vec2(-0.5f, 1.5f));
554 inputs.push_back(tcu::Vec2(0.25f, 0.75f));
555
556 // Random values.
557 {
558 const int minExp = -14;
559 const int maxExp = 15;
560
561 for (int ndx = 0; ndx < 95; ndx++)
562 {
563 tcu::Vec2 v;
564 for (int c = 0; c < 2; c++)
565 {
566 const int s = rnd.getBool() ? 1 : -1;
567 const int exp = rnd.getInt(minExp, maxExp);
568 const deUint32 mantissa = rnd.getUint32() & ((1<<23)-1);
569
570 v[c] = tcu::Float32::construct(s, exp ? exp : 1 /* avoid denormals */, (1u<<23) | mantissa).asFloat();
571 }
572 inputs.push_back(v);
573 }
574 }
575
576 // Convert input values to fp16 and back to make sure they can be represented exactly in mediump.
577 for (std::vector<tcu::Vec2>::iterator inVal = inputs.begin(); inVal != inputs.end(); ++inVal)
578 *inVal = tcu::Vec2(tcu::Float16(inVal->x()).asFloat(), tcu::Float16(inVal->y()).asFloat());
579
580 outputs.resize(inputs.size());
581
582 m_testCtx.getLog() << TestLog::Message << "Executing shader for " << inputs.size() << " input values" << tcu::TestLog::EndMessage;
583
584 {
585 const void* in = &inputs[0];
586 void* out = &outputs[0];
587
588 m_executor->useProgram();
589 m_executor->execute((int)inputs.size(), &in, &out);
590 }
591
592 // Verify
593 {
594 const int numValues = (int)inputs.size();
595 const int maxPrints = 10;
596 int numFailed = 0;
597
598 for (int valNdx = 0; valNdx < (int)inputs.size(); valNdx++)
599 {
600 const deUint16 ref0 = (deUint16)tcu::Float16(inputs[valNdx].x()).bits();
601 const deUint16 ref1 = (deUint16)tcu::Float16(inputs[valNdx].y()).bits();
602 const deUint32 ref = (ref1 << 16) | ref0;
603 const deUint32 res = outputs[valNdx];
604 const deUint16 res0 = (deUint16)(res & 0xffff);
605 const deUint16 res1 = (deUint16)(res >> 16);
606 const int diff0 = de::abs((int)ref0 - (int)res0);
607 const int diff1 = de::abs((int)ref1 - (int)res1);
608
609 if (diff0 > maxDiff || diff1 > maxDiff)
610 {
611 if (numFailed < maxPrints)
612 {
613 m_testCtx.getLog() << TestLog::Message << "ERROR: Mismatch in value " << valNdx
614 << ", expected packHalf2x16(" << inputs[valNdx] << ") = " << tcu::toHex(ref)
615 << ", got " << tcu::toHex(res)
616 << "\n diffs = (" << diff0 << ", " << diff1 << "), max diff = " << maxDiff
617 << TestLog::EndMessage;
618 }
619 else if (numFailed == maxPrints)
620 m_testCtx.getLog() << TestLog::Message << "..." << TestLog::EndMessage;
621
622 numFailed += 1;
623 }
624 }
625
626 m_testCtx.getLog() << TestLog::Message << (numValues - numFailed) << " / " << numValues << " values passed" << TestLog::EndMessage;
627
628 m_testCtx.setTestResult(numFailed == 0 ? QP_TEST_RESULT_PASS : QP_TEST_RESULT_FAIL,
629 numFailed == 0 ? "Pass" : "Result comparison failed");
630 }
631
632 return STOP;
633 }
634 };
635
636 class UnpackHalf2x16Case : public ShaderPackingFunctionCase
637 {
638 public:
UnpackHalf2x16Case(Context & context,glu::ShaderType shaderType)639 UnpackHalf2x16Case (Context& context, glu::ShaderType shaderType)
640 : ShaderPackingFunctionCase(context, (string("unpackhalf2x16") + getShaderTypePostfix(shaderType)).c_str(), "unpackHalf2x16", shaderType)
641 {
642 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_UINT, glu::PRECISION_HIGHP)));
643 m_spec.outputs.push_back(Symbol("out0", glu::VarType(glu::TYPE_FLOAT_VEC2, glu::PRECISION_MEDIUMP)));
644
645 m_spec.source = "out0 = unpackHalf2x16(in0);";
646 }
647
iterate(void)648 IterateResult iterate (void)
649 {
650 const int maxDiff = 0; // All bits must be accurate.
651 de::Random rnd (deStringHash(getName()) ^ 0x776002);
652 std::vector<deUint32> inputs;
653 std::vector<tcu::Vec2> outputs;
654
655 // Special values.
656 inputs.push_back((tcu::Float16( 0.0f).bits() << 16) | tcu::Float16( 1.0f).bits());
657 inputs.push_back((tcu::Float16( 1.0f).bits() << 16) | tcu::Float16( 0.0f).bits());
658 inputs.push_back((tcu::Float16(-1.0f).bits() << 16) | tcu::Float16( 0.5f).bits());
659 inputs.push_back((tcu::Float16( 0.5f).bits() << 16) | tcu::Float16(-0.5f).bits());
660
661 // Construct random values.
662 {
663 const int minExp = -14;
664 const int maxExp = 15;
665 const int mantBits = 10;
666
667 for (int ndx = 0; ndx < 96; ndx++)
668 {
669 deUint32 inVal = 0;
670 for (int c = 0; c < 2; c++)
671 {
672 const int s = rnd.getBool() ? 1 : -1;
673 const int exp = rnd.getInt(minExp, maxExp);
674 const deUint32 mantissa = rnd.getUint32() & ((1<<mantBits)-1);
675 const deUint16 value = tcu::Float16::construct(s, exp ? exp : 1 /* avoid denorm */, (1u<<10) | mantissa).bits();
676
677 inVal |= value << (16*c);
678 }
679 inputs.push_back(inVal);
680 }
681 }
682
683 outputs.resize(inputs.size());
684
685 m_testCtx.getLog() << TestLog::Message << "Executing shader for " << inputs.size() << " input values" << tcu::TestLog::EndMessage;
686
687 {
688 const void* in = &inputs[0];
689 void* out = &outputs[0];
690
691 m_executor->useProgram();
692 m_executor->execute((int)inputs.size(), &in, &out);
693 }
694
695 // Verify
696 {
697 const int numValues = (int)inputs.size();
698 const int maxPrints = 10;
699 int numFailed = 0;
700
701 for (int valNdx = 0; valNdx < (int)inputs.size(); valNdx++)
702 {
703 const deUint16 in0 = (deUint16)(inputs[valNdx] & 0xffff);
704 const deUint16 in1 = (deUint16)(inputs[valNdx] >> 16);
705 const float ref0 = tcu::Float16(in0).asFloat();
706 const float ref1 = tcu::Float16(in1).asFloat();
707 const float res0 = outputs[valNdx].x();
708 const float res1 = outputs[valNdx].y();
709
710 const deUint32 refBits0 = tcu::Float32(ref0).bits();
711 const deUint32 refBits1 = tcu::Float32(ref1).bits();
712 const deUint32 resBits0 = tcu::Float32(res0).bits();
713 const deUint32 resBits1 = tcu::Float32(res1).bits();
714
715 const int diff0 = de::abs((int)refBits0 - (int)resBits0);
716 const int diff1 = de::abs((int)refBits1 - (int)resBits1);
717
718 if (diff0 > maxDiff || diff1 > maxDiff)
719 {
720 if (numFailed < maxPrints)
721 {
722 m_testCtx.getLog() << TestLog::Message << "ERROR: Mismatch in value " << valNdx << ",\n"
723 << " expected unpackHalf2x16(" << tcu::toHex(inputs[valNdx]) << ") = "
724 << "vec2(" << ref0 << " / " << tcu::toHex(refBits0) << ", " << ref1 << " / " << tcu::toHex(refBits1) << ")"
725 << ", got vec2(" << res0 << " / " << tcu::toHex(resBits0) << ", " << res1 << " / " << tcu::toHex(resBits1) << ")"
726 << "\n ULP diffs = (" << diff0 << ", " << diff1 << "), max diff = " << maxDiff
727 << TestLog::EndMessage;
728 }
729 else if (numFailed == maxPrints)
730 m_testCtx.getLog() << TestLog::Message << "..." << TestLog::EndMessage;
731
732 numFailed += 1;
733 }
734 }
735
736 m_testCtx.getLog() << TestLog::Message << (numValues - numFailed) << " / " << numValues << " values passed" << TestLog::EndMessage;
737
738 m_testCtx.setTestResult(numFailed == 0 ? QP_TEST_RESULT_PASS : QP_TEST_RESULT_FAIL,
739 numFailed == 0 ? "Pass" : "Result comparison failed");
740 }
741
742 return STOP;
743 }
744 };
745
746 class PackSnorm4x8Case : public ShaderPackingFunctionCase
747 {
748 public:
PackSnorm4x8Case(Context & context,glu::ShaderType shaderType,glu::Precision precision)749 PackSnorm4x8Case (Context& context, glu::ShaderType shaderType, glu::Precision precision)
750 : ShaderPackingFunctionCase (context, (string("packsnorm4x8") + getPrecisionPostfix(precision) + getShaderTypePostfix(shaderType)).c_str(), "packSnorm4x8", shaderType)
751 , m_precision (precision)
752 {
753 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_FLOAT_VEC4, precision)));
754 m_spec.outputs.push_back(Symbol("out0", glu::VarType(glu::TYPE_UINT, glu::PRECISION_HIGHP)));
755
756 m_spec.source = "out0 = packSnorm4x8(in0);";
757 }
758
iterate(void)759 IterateResult iterate (void)
760 {
761 de::Random rnd (deStringHash(getName()) ^ 0x42f2c0);
762 std::vector<tcu::Vec4> inputs;
763 std::vector<deUint32> outputs;
764 const int maxDiff = m_precision == glu::PRECISION_HIGHP ? 1 : // Rounding only.
765 m_precision == glu::PRECISION_MEDIUMP ? 1 : // (2^-10) * (2^7) + 1
766 m_precision == glu::PRECISION_LOWP ? 2 : 0; // (2^-8) * (2^7) + 1
767
768 // Special values to check.
769 inputs.push_back(tcu::Vec4(0.0f, 0.0f, 0.0f, 0.0f));
770 inputs.push_back(tcu::Vec4(-1.0f, 1.0f, -1.0f, 1.0f));
771 inputs.push_back(tcu::Vec4(0.5f, -0.5f, -0.5f, 0.5f));
772 inputs.push_back(tcu::Vec4(-1.5f, 1.5f, -1.5f, 1.5f));
773 inputs.push_back(tcu::Vec4(0.25f, -0.75f, -0.25f, 0.75f));
774
775 // Random values, mostly in range.
776 for (int ndx = 0; ndx < 15; ndx++)
777 {
778 const float x = rnd.getFloat()*2.5f - 1.25f;
779 const float y = rnd.getFloat()*2.5f - 1.25f;
780 const float z = rnd.getFloat()*2.5f - 1.25f;
781 const float w = rnd.getFloat()*2.5f - 1.25f;
782 inputs.push_back(tcu::Vec4(x, y, z, w));
783 }
784
785 // Large random values.
786 for (int ndx = 0; ndx < 80; ndx++)
787 {
788 const float x = rnd.getFloat()*1e6f - 0.5e6f;
789 const float y = rnd.getFloat()*1e6f - 0.5e6f;
790 const float z = rnd.getFloat()*1e6f - 0.5e6f;
791 const float w = rnd.getFloat()*1e6f - 0.5e6f;
792 inputs.push_back(tcu::Vec4(x, y, z, w));
793 }
794
795 outputs.resize(inputs.size());
796
797 m_testCtx.getLog() << TestLog::Message << "Executing shader for " << inputs.size() << " input values" << tcu::TestLog::EndMessage;
798
799 {
800 const void* in = &inputs[0];
801 void* out = &outputs[0];
802
803 m_executor->useProgram();
804 m_executor->execute((int)inputs.size(), &in, &out);
805 }
806
807 // Verify
808 {
809 const int numValues = (int)inputs.size();
810 const int maxPrints = 10;
811 int numFailed = 0;
812
813 for (int valNdx = 0; valNdx < numValues; valNdx++)
814 {
815 const deUint16 ref0 = (deUint8)de::clamp(deRoundFloatToInt32(de::clamp(inputs[valNdx].x(), -1.0f, 1.0f) * 127.0f), -(1<<7), (1<<7)-1);
816 const deUint16 ref1 = (deUint8)de::clamp(deRoundFloatToInt32(de::clamp(inputs[valNdx].y(), -1.0f, 1.0f) * 127.0f), -(1<<7), (1<<7)-1);
817 const deUint16 ref2 = (deUint8)de::clamp(deRoundFloatToInt32(de::clamp(inputs[valNdx].z(), -1.0f, 1.0f) * 127.0f), -(1<<7), (1<<7)-1);
818 const deUint16 ref3 = (deUint8)de::clamp(deRoundFloatToInt32(de::clamp(inputs[valNdx].w(), -1.0f, 1.0f) * 127.0f), -(1<<7), (1<<7)-1);
819 const deUint32 ref = (deUint32(ref3) << 24) | (deUint32(ref2) << 16) | (deUint32(ref1) << 8) | deUint32(ref0);
820 const deUint32 res = outputs[valNdx];
821 const deUint16 res0 = (deUint8)(res & 0xff);
822 const deUint16 res1 = (deUint8)((res >> 8) & 0xff);
823 const deUint16 res2 = (deUint8)((res >> 16) & 0xff);
824 const deUint16 res3 = (deUint8)((res >> 24) & 0xff);
825 const int diff0 = de::abs((int)ref0 - (int)res0);
826 const int diff1 = de::abs((int)ref1 - (int)res1);
827 const int diff2 = de::abs((int)ref2 - (int)res2);
828 const int diff3 = de::abs((int)ref3 - (int)res3);
829
830 if (diff0 > maxDiff || diff1 > maxDiff || diff2 > maxDiff || diff3 > maxDiff)
831 {
832 if (numFailed < maxPrints)
833 {
834 m_testCtx.getLog() << TestLog::Message << "ERROR: Mismatch in value " << valNdx
835 << ", expected packSnorm4x8(" << inputs[valNdx] << ") = " << tcu::toHex(ref)
836 << ", got " << tcu::toHex(res)
837 << "\n diffs = " << tcu::IVec4(diff0, diff1, diff2, diff3) << ", max diff = " << maxDiff
838 << TestLog::EndMessage;
839 }
840 else if (numFailed == maxPrints)
841 m_testCtx.getLog() << TestLog::Message << "..." << TestLog::EndMessage;
842
843 numFailed += 1;
844 }
845 }
846
847 m_testCtx.getLog() << TestLog::Message << (numValues - numFailed) << " / " << numValues << " values passed" << TestLog::EndMessage;
848
849 m_testCtx.setTestResult(numFailed == 0 ? QP_TEST_RESULT_PASS : QP_TEST_RESULT_FAIL,
850 numFailed == 0 ? "Pass" : "Result comparison failed");
851 }
852
853 return STOP;
854 }
855
856 private:
857 glu::Precision m_precision;
858 };
859
860 class UnpackSnorm4x8Case : public ShaderPackingFunctionCase
861 {
862 public:
UnpackSnorm4x8Case(Context & context,glu::ShaderType shaderType)863 UnpackSnorm4x8Case (Context& context, glu::ShaderType shaderType)
864 : ShaderPackingFunctionCase(context, (string("unpacksnorm4x8") + getShaderTypePostfix(shaderType)).c_str(), "unpackSnorm4x8", shaderType)
865 {
866 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_UINT, glu::PRECISION_HIGHP)));
867 m_spec.outputs.push_back(Symbol("out0", glu::VarType(glu::TYPE_FLOAT_VEC4, glu::PRECISION_HIGHP)));
868
869 m_spec.source = "out0 = unpackSnorm4x8(in0);";
870 }
871
iterate(void)872 IterateResult iterate (void)
873 {
874 const deUint32 maxDiff = 1; // Rounding error.
875 de::Random rnd (deStringHash(getName()) ^ 0x776002);
876 std::vector<deUint32> inputs;
877 std::vector<tcu::Vec4> outputs;
878
879 inputs.push_back(0x00000000u);
880 inputs.push_back(0x7fff8000u);
881 inputs.push_back(0x80007fffu);
882 inputs.push_back(0xffffffffu);
883 inputs.push_back(0x0001fffeu);
884
885 // Random values.
886 for (int ndx = 0; ndx < 95; ndx++)
887 inputs.push_back(rnd.getUint32());
888
889 outputs.resize(inputs.size());
890
891 m_testCtx.getLog() << TestLog::Message << "Executing shader for " << inputs.size() << " input values" << tcu::TestLog::EndMessage;
892
893 {
894 const void* in = &inputs[0];
895 void* out = &outputs[0];
896
897 m_executor->useProgram();
898 m_executor->execute((int)inputs.size(), &in, &out);
899 }
900
901 // Verify
902 {
903 const int numValues = (int)inputs.size();
904 const int maxPrints = 10;
905 int numFailed = 0;
906
907 for (int valNdx = 0; valNdx < (int)inputs.size(); valNdx++)
908 {
909 const deInt8 in0 = (deInt8)(deUint8)(inputs[valNdx] & 0xff);
910 const deInt8 in1 = (deInt8)(deUint8)((inputs[valNdx] >> 8) & 0xff);
911 const deInt8 in2 = (deInt8)(deUint8)((inputs[valNdx] >> 16) & 0xff);
912 const deInt8 in3 = (deInt8)(deUint8)(inputs[valNdx] >> 24);
913 const float ref0 = de::clamp(float(in0) / 127.f, -1.0f, 1.0f);
914 const float ref1 = de::clamp(float(in1) / 127.f, -1.0f, 1.0f);
915 const float ref2 = de::clamp(float(in2) / 127.f, -1.0f, 1.0f);
916 const float ref3 = de::clamp(float(in3) / 127.f, -1.0f, 1.0f);
917 const float res0 = outputs[valNdx].x();
918 const float res1 = outputs[valNdx].y();
919 const float res2 = outputs[valNdx].z();
920 const float res3 = outputs[valNdx].w();
921
922 const deUint32 diff0 = getUlpDiff(ref0, res0);
923 const deUint32 diff1 = getUlpDiff(ref1, res1);
924 const deUint32 diff2 = getUlpDiff(ref2, res2);
925 const deUint32 diff3 = getUlpDiff(ref3, res3);
926
927 if (diff0 > maxDiff || diff1 > maxDiff || diff2 > maxDiff || diff3 > maxDiff)
928 {
929 if (numFailed < maxPrints)
930 {
931 m_testCtx.getLog() << TestLog::Message << "ERROR: Mismatch in value " << valNdx << ",\n"
932 << " expected unpackSnorm4x8(" << tcu::toHex(inputs[valNdx]) << ") = "
933 << "vec4(" << HexFloat(ref0) << ", " << HexFloat(ref1) << ", " << HexFloat(ref2) << ", " << HexFloat(ref3) << ")"
934 << ", got vec4(" << HexFloat(res0) << ", " << HexFloat(res1) << ", " << HexFloat(res2) << ", " << HexFloat(res3) << ")"
935 << "\n ULP diffs = (" << diff0 << ", " << diff1 << ", " << diff2 << ", " << diff3 << "), max diff = " << maxDiff
936 << TestLog::EndMessage;
937 }
938 else if (numFailed == maxPrints)
939 m_testCtx.getLog() << TestLog::Message << "..." << TestLog::EndMessage;
940
941 numFailed += 1;
942 }
943 }
944
945 m_testCtx.getLog() << TestLog::Message << (numValues - numFailed) << " / " << numValues << " values passed" << TestLog::EndMessage;
946
947 m_testCtx.setTestResult(numFailed == 0 ? QP_TEST_RESULT_PASS : QP_TEST_RESULT_FAIL,
948 numFailed == 0 ? "Pass" : "Result comparison failed");
949 }
950
951 return STOP;
952 }
953 };
954
955 class PackUnorm4x8Case : public ShaderPackingFunctionCase
956 {
957 public:
PackUnorm4x8Case(Context & context,glu::ShaderType shaderType,glu::Precision precision)958 PackUnorm4x8Case (Context& context, glu::ShaderType shaderType, glu::Precision precision)
959 : ShaderPackingFunctionCase (context, (string("packunorm4x8") + getPrecisionPostfix(precision) + getShaderTypePostfix(shaderType)).c_str(), "packUnorm4x8", shaderType)
960 , m_precision (precision)
961 {
962 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_FLOAT_VEC4, precision)));
963 m_spec.outputs.push_back(Symbol("out0", glu::VarType(glu::TYPE_UINT, glu::PRECISION_HIGHP)));
964
965 m_spec.source = "out0 = packUnorm4x8(in0);";
966 }
967
iterate(void)968 IterateResult iterate (void)
969 {
970 de::Random rnd (deStringHash(getName()) ^ 0x776002);
971 std::vector<tcu::Vec4> inputs;
972 std::vector<deUint32> outputs;
973 const int maxDiff = m_precision == glu::PRECISION_HIGHP ? 1 : // Rounding only.
974 m_precision == glu::PRECISION_MEDIUMP ? 1 : // (2^-10) * (2^8) + 1
975 m_precision == glu::PRECISION_LOWP ? 2 : 0; // (2^-8) * (2^8) + 1
976
977 // Special values to check.
978 inputs.push_back(tcu::Vec4(0.0f, 0.0f, 0.0f, 0.0f));
979 inputs.push_back(tcu::Vec4(-1.0f, 1.0f, -1.0f, 1.0f));
980 inputs.push_back(tcu::Vec4(0.5f, -0.5f, -0.5f, 0.5f));
981 inputs.push_back(tcu::Vec4(-1.5f, 1.5f, -1.5f, 1.5f));
982 inputs.push_back(tcu::Vec4(0.25f, -0.75f, -0.25f, 0.75f));
983
984 // Random values, mostly in range.
985 for (int ndx = 0; ndx < 15; ndx++)
986 {
987 const float x = rnd.getFloat()*1.25f - 0.125f;
988 const float y = rnd.getFloat()*1.25f - 0.125f;
989 const float z = rnd.getFloat()*1.25f - 0.125f;
990 const float w = rnd.getFloat()*1.25f - 0.125f;
991 inputs.push_back(tcu::Vec4(x, y, z, w));
992 }
993
994 // Large random values.
995 for (int ndx = 0; ndx < 80; ndx++)
996 {
997 const float x = rnd.getFloat()*1e6f - 1e5f;
998 const float y = rnd.getFloat()*1e6f - 1e5f;
999 const float z = rnd.getFloat()*1e6f - 1e5f;
1000 const float w = rnd.getFloat()*1e6f - 1e5f;
1001 inputs.push_back(tcu::Vec4(x, y, z, w));
1002 }
1003
1004 outputs.resize(inputs.size());
1005
1006 m_testCtx.getLog() << TestLog::Message << "Executing shader for " << inputs.size() << " input values" << tcu::TestLog::EndMessage;
1007
1008 {
1009 const void* in = &inputs[0];
1010 void* out = &outputs[0];
1011
1012 m_executor->useProgram();
1013 m_executor->execute((int)inputs.size(), &in, &out);
1014 }
1015
1016 // Verify
1017 {
1018 const int numValues = (int)inputs.size();
1019 const int maxPrints = 10;
1020 int numFailed = 0;
1021
1022 for (int valNdx = 0; valNdx < (int)inputs.size(); valNdx++)
1023 {
1024 const deUint16 ref0 = (deUint8)de::clamp(deRoundFloatToInt32(de::clamp(inputs[valNdx].x(), 0.0f, 1.0f) * 255.0f), 0, (1<<8)-1);
1025 const deUint16 ref1 = (deUint8)de::clamp(deRoundFloatToInt32(de::clamp(inputs[valNdx].y(), 0.0f, 1.0f) * 255.0f), 0, (1<<8)-1);
1026 const deUint16 ref2 = (deUint8)de::clamp(deRoundFloatToInt32(de::clamp(inputs[valNdx].z(), 0.0f, 1.0f) * 255.0f), 0, (1<<8)-1);
1027 const deUint16 ref3 = (deUint8)de::clamp(deRoundFloatToInt32(de::clamp(inputs[valNdx].w(), 0.0f, 1.0f) * 255.0f), 0, (1<<8)-1);
1028 const deUint32 ref = (deUint32(ref3) << 24) | (deUint32(ref2) << 16) | (deUint32(ref1) << 8) | deUint32(ref0);
1029 const deUint32 res = outputs[valNdx];
1030 const deUint16 res0 = (deUint8)(res & 0xff);
1031 const deUint16 res1 = (deUint8)((res >> 8) & 0xff);
1032 const deUint16 res2 = (deUint8)((res >> 16) & 0xff);
1033 const deUint16 res3 = (deUint8)((res >> 24) & 0xff);
1034 const int diff0 = de::abs((int)ref0 - (int)res0);
1035 const int diff1 = de::abs((int)ref1 - (int)res1);
1036 const int diff2 = de::abs((int)ref2 - (int)res2);
1037 const int diff3 = de::abs((int)ref3 - (int)res3);
1038
1039 if (diff0 > maxDiff || diff1 > maxDiff || diff2 > maxDiff || diff3 > maxDiff)
1040 {
1041 if (numFailed < maxPrints)
1042 {
1043 m_testCtx.getLog() << TestLog::Message << "ERROR: Mismatch in value " << valNdx
1044 << ", expected packUnorm4x8(" << inputs[valNdx] << ") = " << tcu::toHex(ref)
1045 << ", got " << tcu::toHex(res)
1046 << "\n diffs = " << tcu::IVec4(diff0, diff1, diff2, diff3) << ", max diff = " << maxDiff
1047 << TestLog::EndMessage;
1048 }
1049 else if (numFailed == maxPrints)
1050 m_testCtx.getLog() << TestLog::Message << "..." << TestLog::EndMessage;
1051
1052 numFailed += 1;
1053 }
1054 }
1055
1056 m_testCtx.getLog() << TestLog::Message << (numValues - numFailed) << " / " << numValues << " values passed" << TestLog::EndMessage;
1057
1058 m_testCtx.setTestResult(numFailed == 0 ? QP_TEST_RESULT_PASS : QP_TEST_RESULT_FAIL,
1059 numFailed == 0 ? "Pass" : "Result comparison failed");
1060 }
1061
1062 return STOP;
1063 }
1064
1065 private:
1066 glu::Precision m_precision;
1067 };
1068
1069 class UnpackUnorm4x8Case : public ShaderPackingFunctionCase
1070 {
1071 public:
UnpackUnorm4x8Case(Context & context,glu::ShaderType shaderType)1072 UnpackUnorm4x8Case (Context& context, glu::ShaderType shaderType)
1073 : ShaderPackingFunctionCase(context, (string("unpackunorm4x8") + getShaderTypePostfix(shaderType)).c_str(), "unpackUnorm4x8", shaderType)
1074 {
1075 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_UINT, glu::PRECISION_HIGHP)));
1076 m_spec.outputs.push_back(Symbol("out0", glu::VarType(glu::TYPE_FLOAT_VEC4, glu::PRECISION_HIGHP)));
1077
1078 m_spec.source = "out0 = unpackUnorm4x8(in0);";
1079 }
1080
iterate(void)1081 IterateResult iterate (void)
1082 {
1083 const deUint32 maxDiff = 1; // Rounding error.
1084 de::Random rnd (deStringHash(getName()) ^ 0x776002);
1085 std::vector<deUint32> inputs;
1086 std::vector<tcu::Vec4> outputs;
1087
1088 inputs.push_back(0x00000000u);
1089 inputs.push_back(0x7fff8000u);
1090 inputs.push_back(0x80007fffu);
1091 inputs.push_back(0xffffffffu);
1092 inputs.push_back(0x0001fffeu);
1093
1094 // Random values.
1095 for (int ndx = 0; ndx < 95; ndx++)
1096 inputs.push_back(rnd.getUint32());
1097
1098 outputs.resize(inputs.size());
1099
1100 m_testCtx.getLog() << TestLog::Message << "Executing shader for " << inputs.size() << " input values" << tcu::TestLog::EndMessage;
1101
1102 {
1103 const void* in = &inputs[0];
1104 void* out = &outputs[0];
1105
1106 m_executor->useProgram();
1107 m_executor->execute((int)inputs.size(), &in, &out);
1108 }
1109
1110 // Verify
1111 {
1112 const int numValues = (int)inputs.size();
1113 const int maxPrints = 10;
1114 int numFailed = 0;
1115
1116 for (int valNdx = 0; valNdx < (int)inputs.size(); valNdx++)
1117 {
1118 const deUint8 in0 = (deUint8)(inputs[valNdx] & 0xff);
1119 const deUint8 in1 = (deUint8)((inputs[valNdx] >> 8) & 0xff);
1120 const deUint8 in2 = (deUint8)((inputs[valNdx] >> 16) & 0xff);
1121 const deUint8 in3 = (deUint8)(inputs[valNdx] >> 24);
1122 const float ref0 = de::clamp(float(in0) / 255.f, 0.0f, 1.0f);
1123 const float ref1 = de::clamp(float(in1) / 255.f, 0.0f, 1.0f);
1124 const float ref2 = de::clamp(float(in2) / 255.f, 0.0f, 1.0f);
1125 const float ref3 = de::clamp(float(in3) / 255.f, 0.0f, 1.0f);
1126 const float res0 = outputs[valNdx].x();
1127 const float res1 = outputs[valNdx].y();
1128 const float res2 = outputs[valNdx].z();
1129 const float res3 = outputs[valNdx].w();
1130
1131 const deUint32 diff0 = getUlpDiff(ref0, res0);
1132 const deUint32 diff1 = getUlpDiff(ref1, res1);
1133 const deUint32 diff2 = getUlpDiff(ref2, res2);
1134 const deUint32 diff3 = getUlpDiff(ref3, res3);
1135
1136 if (diff0 > maxDiff || diff1 > maxDiff || diff2 > maxDiff || diff3 > maxDiff)
1137 {
1138 if (numFailed < maxPrints)
1139 {
1140 m_testCtx.getLog() << TestLog::Message << "ERROR: Mismatch in value " << valNdx << ",\n"
1141 << " expected unpackUnorm4x8(" << tcu::toHex(inputs[valNdx]) << ") = "
1142 << "vec4(" << HexFloat(ref0) << ", " << HexFloat(ref1) << ", " << HexFloat(ref2) << ", " << HexFloat(ref3) << ")"
1143 << ", got vec4(" << HexFloat(res0) << ", " << HexFloat(res1) << ", " << HexFloat(res2) << ", " << HexFloat(res3) << ")"
1144 << "\n ULP diffs = (" << diff0 << ", " << diff1 << ", " << diff2 << ", " << diff3 << "), max diff = " << maxDiff
1145 << TestLog::EndMessage;
1146 }
1147 else if (numFailed == maxPrints)
1148 m_testCtx.getLog() << TestLog::Message << "..." << TestLog::EndMessage;
1149
1150 numFailed += 1;
1151 }
1152 }
1153
1154 m_testCtx.getLog() << TestLog::Message << (numValues - numFailed) << " / " << numValues << " values passed" << TestLog::EndMessage;
1155
1156 m_testCtx.setTestResult(numFailed == 0 ? QP_TEST_RESULT_PASS : QP_TEST_RESULT_FAIL,
1157 numFailed == 0 ? "Pass" : "Result comparison failed");
1158 }
1159
1160 return STOP;
1161 }
1162 };
1163
ShaderPackingFunctionTests(Context & context)1164 ShaderPackingFunctionTests::ShaderPackingFunctionTests (Context& context)
1165 : TestCaseGroup(context, "pack_unpack", "Floating-point pack and unpack function tests")
1166 {
1167 }
1168
~ShaderPackingFunctionTests(void)1169 ShaderPackingFunctionTests::~ShaderPackingFunctionTests (void)
1170 {
1171 }
1172
init(void)1173 void ShaderPackingFunctionTests::init (void)
1174 {
1175 // New built-in functions in GLES 3.1
1176 {
1177 const glu::ShaderType allShaderTypes[] =
1178 {
1179 glu::SHADERTYPE_VERTEX,
1180 glu::SHADERTYPE_TESSELLATION_CONTROL,
1181 glu::SHADERTYPE_TESSELLATION_EVALUATION,
1182 glu::SHADERTYPE_GEOMETRY,
1183 glu::SHADERTYPE_FRAGMENT,
1184 glu::SHADERTYPE_COMPUTE
1185 };
1186
1187 // packSnorm4x8
1188 for (int prec = 0; prec < glu::PRECISION_LAST; prec++)
1189 {
1190 for (int shaderTypeNdx = 0; shaderTypeNdx < DE_LENGTH_OF_ARRAY(allShaderTypes); shaderTypeNdx++)
1191 addChild(new PackSnorm4x8Case(m_context, allShaderTypes[shaderTypeNdx], glu::Precision(prec)));
1192 }
1193
1194 // unpackSnorm4x8
1195 for (int shaderTypeNdx = 0; shaderTypeNdx < DE_LENGTH_OF_ARRAY(allShaderTypes); shaderTypeNdx++)
1196 addChild(new UnpackSnorm4x8Case(m_context, allShaderTypes[shaderTypeNdx]));
1197
1198 // packUnorm4x8
1199 for (int prec = 0; prec < glu::PRECISION_LAST; prec++)
1200 {
1201 for (int shaderTypeNdx = 0; shaderTypeNdx < DE_LENGTH_OF_ARRAY(allShaderTypes); shaderTypeNdx++)
1202 addChild(new PackUnorm4x8Case(m_context, allShaderTypes[shaderTypeNdx], glu::Precision(prec)));
1203 }
1204
1205 // unpackUnorm4x8
1206 for (int shaderTypeNdx = 0; shaderTypeNdx < DE_LENGTH_OF_ARRAY(allShaderTypes); shaderTypeNdx++)
1207 addChild(new UnpackUnorm4x8Case(m_context, allShaderTypes[shaderTypeNdx]));
1208 }
1209
1210 // GLES 3 functions in new shader types.
1211 {
1212 const glu::ShaderType newShaderTypes[] =
1213 {
1214 glu::SHADERTYPE_GEOMETRY,
1215 glu::SHADERTYPE_COMPUTE
1216 };
1217
1218 // packSnorm2x16
1219 for (int prec = 0; prec < glu::PRECISION_LAST; prec++)
1220 {
1221 for (int shaderTypeNdx = 0; shaderTypeNdx < DE_LENGTH_OF_ARRAY(newShaderTypes); shaderTypeNdx++)
1222 addChild(new PackSnorm2x16Case(m_context, newShaderTypes[shaderTypeNdx], glu::Precision(prec)));
1223 }
1224
1225 // unpackSnorm2x16
1226 for (int shaderTypeNdx = 0; shaderTypeNdx < DE_LENGTH_OF_ARRAY(newShaderTypes); shaderTypeNdx++)
1227 addChild(new UnpackSnorm2x16Case(m_context, newShaderTypes[shaderTypeNdx]));
1228
1229 // packUnorm2x16
1230 for (int prec = 0; prec < glu::PRECISION_LAST; prec++)
1231 {
1232 for (int shaderTypeNdx = 0; shaderTypeNdx < DE_LENGTH_OF_ARRAY(newShaderTypes); shaderTypeNdx++)
1233 addChild(new PackUnorm2x16Case(m_context, newShaderTypes[shaderTypeNdx], glu::Precision(prec)));
1234 }
1235
1236 // unpackUnorm2x16
1237 for (int shaderTypeNdx = 0; shaderTypeNdx < DE_LENGTH_OF_ARRAY(newShaderTypes); shaderTypeNdx++)
1238 addChild(new UnpackUnorm2x16Case(m_context, newShaderTypes[shaderTypeNdx]));
1239
1240 // packHalf2x16
1241 for (int shaderTypeNdx = 0; shaderTypeNdx < DE_LENGTH_OF_ARRAY(newShaderTypes); shaderTypeNdx++)
1242 addChild(new PackHalf2x16Case(m_context, newShaderTypes[shaderTypeNdx]));
1243
1244 // unpackHalf2x16
1245 for (int shaderTypeNdx = 0; shaderTypeNdx < DE_LENGTH_OF_ARRAY(newShaderTypes); shaderTypeNdx++)
1246 addChild(new UnpackHalf2x16Case(m_context, newShaderTypes[shaderTypeNdx]));
1247 }
1248 }
1249
1250 } // Functional
1251 } // gles31
1252 } // deqp
1253