1 /*-------------------------------------------------------------------------
2 * Vulkan Conformance Tests
3 * ------------------------
4 *
5 * Copyright (c) 2015 Google Inc.
6 *
7 * Licensed under the Apache License, Version 2.0 (the "License");
8 * you may not use this file except in compliance with the License.
9 * You may obtain a copy of the License at
10 *
11 * http://www.apache.org/licenses/LICENSE-2.0
12 *
13 * Unless required by applicable law or agreed to in writing, software
14 * distributed under the License is distributed on an "AS IS" BASIS,
15 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
16 * See the License for the specific language governing permissions and
17 * limitations under the License.
18 *
19 *//*!
20 * \file
21 * \brief ShaderLibrary Vulkan implementation
22 *//*--------------------------------------------------------------------*/
23
24 #include "vktShaderLibrary.hpp"
25 #include "vktTestCase.hpp"
26
27 #include "vkPrograms.hpp"
28 #include "vkRef.hpp"
29 #include "vkRefUtil.hpp"
30 #include "vkMemUtil.hpp"
31 #include "vkQueryUtil.hpp"
32 #include "vkBuilderUtil.hpp"
33 #include "vkTypeUtil.hpp"
34 #include "vkImageUtil.hpp"
35 #include "vkCmdUtil.hpp"
36 #include "vkObjUtil.hpp"
37
38 #include "gluShaderLibrary.hpp"
39 #include "gluShaderUtil.hpp"
40
41 #include "tcuStringTemplate.hpp"
42 #include "tcuTexture.hpp"
43 #include "tcuTestLog.hpp"
44 #include "tcuVector.hpp"
45 #include "tcuVectorUtil.hpp"
46
47 #include "deStringUtil.hpp"
48 #include "deArrayUtil.hpp"
49 #include "deMemory.h"
50
51 #include <sstream>
52 #include <map>
53
54 namespace vkt
55 {
56
57 using std::string;
58 using std::vector;
59 using std::map;
60 using std::pair;
61 using std::ostringstream;
62
63 using de::MovePtr;
64 using de::UniquePtr;
65
66 using glu::ShaderType;
67 using glu::ProgramSources;
68 using glu::DataType;
69
70 using glu::sl::ShaderCaseSpecification;
71 using glu::sl::ProgramSpecializationParams;
72 using glu::sl::RequiredExtension;
73 using glu::sl::Value;
74 using glu::sl::ValueBlock;
75
76 using tcu::TestStatus;
77 using tcu::StringTemplate;
78 using tcu::Vec2;
79 using tcu::ConstPixelBufferAccess;
80 using tcu::TextureFormat;
81 using tcu::TestLog;
82
83 using vk::SourceCollections;
84 using vk::Move;
85 using vk::Unique;
86
87 namespace
88 {
89
90 enum
91 {
92 REFERENCE_UNIFORM_BINDING = 0,
93 USER_UNIFORM_BINDING = 1
94 };
95
getShaderName(ShaderType shaderType,size_t progNdx)96 string getShaderName (ShaderType shaderType, size_t progNdx)
97 {
98 ostringstream str;
99 str << glu::getShaderTypeName(shaderType);
100 if (progNdx > 0)
101 str << "_" << progNdx;
102 return str.str();
103 }
104
genUniformBlock(ostringstream & out,const string & blockName,const string & instanceName,int setNdx,int bindingNdx,const vector<Value> & uniforms)105 void genUniformBlock (ostringstream& out, const string& blockName, const string& instanceName, int setNdx, int bindingNdx, const vector<Value>& uniforms)
106 {
107 out << "layout(";
108
109 if (setNdx != 0)
110 out << "set = " << setNdx << ", ";
111
112 out << "binding = " << bindingNdx << ", std140) uniform " << blockName << "\n"
113 << "{\n";
114
115 for (vector<Value>::const_iterator val = uniforms.begin(); val != uniforms.end(); ++val)
116 out << "\t" << glu::declare(val->type, val->name, 1) << ";\n";
117
118 out << "}";
119
120 if (!instanceName.empty())
121 out << " " << instanceName;
122
123 out << ";\n";
124 }
125
declareReferenceBlock(ostringstream & out,const ValueBlock & valueBlock)126 void declareReferenceBlock (ostringstream& out, const ValueBlock& valueBlock)
127 {
128 if (!valueBlock.outputs.empty())
129 genUniformBlock(out, "Reference", "ref", 0, REFERENCE_UNIFORM_BINDING, valueBlock.outputs);
130 }
131
declareUniforms(ostringstream & out,const ValueBlock & valueBlock)132 void declareUniforms (ostringstream& out, const ValueBlock& valueBlock)
133 {
134 if (!valueBlock.uniforms.empty())
135 genUniformBlock(out, "Uniforms", "", 0, USER_UNIFORM_BINDING, valueBlock.uniforms);
136 }
137
getTransportType(DataType valueType)138 DataType getTransportType (DataType valueType)
139 {
140 if (isDataTypeBoolOrBVec(valueType))
141 return glu::getDataTypeUintVec(getDataTypeScalarSize(valueType));
142 else
143 return valueType;
144 }
145
getNumTransportLocations(DataType valueType)146 int getNumTransportLocations (DataType valueType)
147 {
148 return isDataTypeMatrix(valueType) ? getDataTypeMatrixNumColumns(valueType) : 1;
149 }
150
151 // This functions builds a matching vertex shader for a 'both' case, when
152 // the fragment shader is being tested.
153 // We need to build attributes and varyings for each 'input'.
genVertexShader(const ShaderCaseSpecification & spec)154 string genVertexShader (const ShaderCaseSpecification& spec)
155 {
156 ostringstream res;
157 int curInputLoc = 0;
158 int curOutputLoc = 0;
159
160 res << glu::getGLSLVersionDeclaration(spec.targetVersion) << "\n";
161
162 // Declarations (position + attribute/varying for each input).
163 res << "precision highp float;\n";
164 res << "precision highp int;\n";
165 res << "\n";
166 res << "layout(location = 0) in highp vec4 dEQP_Position;\n";
167 curInputLoc += 1;
168
169 for (size_t ndx = 0; ndx < spec.values.inputs.size(); ndx++)
170 {
171 const Value& val = spec.values.inputs[ndx];
172 const DataType valueType = val.type.getBasicType();
173 const DataType transportType = getTransportType(valueType);
174 const char* const transportTypeStr = getDataTypeName(transportType);
175 const int numLocs = getNumTransportLocations(valueType);
176
177 res << "layout(location = " << curInputLoc << ") in " << transportTypeStr << " a_" << val.name << ";\n";
178 res << "layout(location = " << curOutputLoc << ") flat out " << transportTypeStr << " " << (transportType != valueType ? "v_" : "") << val.name << ";\n";
179
180 curInputLoc += numLocs;
181 curOutputLoc += numLocs;
182 }
183 res << "\n";
184
185 // Main function.
186 // - gl_Position = dEQP_Position;
187 // - for each input: write attribute directly to varying
188 res << "void main()\n";
189 res << "{\n";
190 res << " gl_Position = dEQP_Position;\n";
191 for (size_t ndx = 0; ndx < spec.values.inputs.size(); ndx++)
192 {
193 const Value& val = spec.values.inputs[ndx];
194 const string& name = val.name;
195
196 res << " " << (getTransportType(val.type.getBasicType()) != val.type.getBasicType() ? "v_" : "")
197 << name << " = a_" << name << ";\n";
198 }
199
200 res << "}\n";
201 return res.str();
202 }
203
genCompareOp(ostringstream & output,const char * dstVec4Var,const ValueBlock & valueBlock,const char * checkVarName)204 void genCompareOp (ostringstream& output, const char* dstVec4Var, const ValueBlock& valueBlock, const char* checkVarName)
205 {
206 bool isFirstOutput = true;
207
208 for (size_t ndx = 0; ndx < valueBlock.outputs.size(); ndx++)
209 {
210 const Value& val = valueBlock.outputs[ndx];
211
212 // Check if we're only interested in one variable (then skip if not the right one).
213 if (checkVarName && val.name != checkVarName)
214 continue;
215
216 // Prefix.
217 if (isFirstOutput)
218 {
219 output << "bool RES = ";
220 isFirstOutput = false;
221 }
222 else
223 output << "RES = RES && ";
224
225 // Generate actual comparison.
226 if (getDataTypeScalarType(val.type.getBasicType()) == glu::TYPE_FLOAT)
227 output << "isOk(" << val.name << ", ref." << val.name << ", 0.05);\n";
228 else
229 output << "isOk(" << val.name << ", ref." << val.name << ");\n";
230 }
231
232 if (isFirstOutput)
233 output << dstVec4Var << " = vec4(1.0);\n";
234 else
235 output << dstVec4Var << " = vec4(RES, RES, RES, 1.0);\n";
236 }
237
genFragmentShader(const ShaderCaseSpecification & spec)238 string genFragmentShader (const ShaderCaseSpecification& spec)
239 {
240 ostringstream shader;
241 ostringstream setup;
242 int curInLoc = 0;
243
244 shader << glu::getGLSLVersionDeclaration(spec.targetVersion) << "\n";
245
246 shader << "precision highp float;\n";
247 shader << "precision highp int;\n";
248 shader << "\n";
249
250 shader << "layout(location = 0) out mediump vec4 dEQP_FragColor;\n";
251 shader << "\n";
252
253 genCompareFunctions(shader, spec.values, false);
254 shader << "\n";
255
256 // Declarations (varying, reference for each output).
257 for (size_t ndx = 0; ndx < spec.values.outputs.size(); ndx++)
258 {
259 const Value& val = spec.values.outputs[ndx];
260 const DataType valueType = val.type.getBasicType();
261 const char* const valueTypeStr = getDataTypeName(valueType);
262 const DataType transportType = getTransportType(valueType);
263 const char* const transportTypeStr = getDataTypeName(transportType);
264 const int numLocs = getNumTransportLocations(valueType);
265
266 shader << "layout(location = " << curInLoc << ") flat in " << transportTypeStr << " " << (valueType != transportType ? "v_" : "") << val.name << ";\n";
267
268 if (valueType != transportType)
269 setup << " " << valueTypeStr << " " << val.name << " = " << valueTypeStr << "(v_" << val.name << ");\n";
270
271 curInLoc += numLocs;
272 }
273
274 declareReferenceBlock(shader, spec.values);
275
276 shader << "\n";
277 shader << "void main()\n";
278 shader << "{\n";
279
280 shader << setup.str();
281
282 shader << " ";
283 genCompareOp(shader, "dEQP_FragColor", spec.values, DE_NULL);
284
285 shader << "}\n";
286 return shader.str();
287 }
288
289 // Specialize a shader for the vertex shader test case.
specializeVertexShader(const ShaderCaseSpecification & spec,const string & src)290 string specializeVertexShader (const ShaderCaseSpecification& spec, const string& src)
291 {
292 ostringstream decl;
293 ostringstream setup;
294 ostringstream output;
295 int curInputLoc = 0;
296 int curOutputLoc = 0;
297
298 // generated from "both" case
299 DE_ASSERT(spec.caseType == glu::sl::CASETYPE_VERTEX_ONLY);
300
301 // Output (write out position).
302 output << "gl_Position = dEQP_Position;\n";
303
304 // Declarations (position + attribute for each input, varying for each output).
305 decl << "layout(location = 0) in highp vec4 dEQP_Position;\n";
306 curInputLoc += 1;
307
308 for (size_t ndx = 0; ndx < spec.values.inputs.size(); ndx++)
309 {
310 const Value& val = spec.values.inputs[ndx];
311 const DataType valueType = val.type.getBasicType();
312 const char* const valueTypeStr = getDataTypeName(valueType);
313 const DataType transportType = getTransportType(valueType);
314 const char* const transportTypeStr = getDataTypeName(transportType);
315 const int numLocs = getNumTransportLocations(valueType);
316
317 decl << "layout(location = " << curInputLoc << ") in ";
318
319 curInputLoc += numLocs;
320
321 if (valueType == transportType)
322 decl << transportTypeStr << " " << val.name << ";\n";
323 else
324 {
325 decl << transportTypeStr << " a_" << val.name << ";\n";
326 setup << valueTypeStr << " " << val.name << " = " << valueTypeStr << "(a_" << val.name << ");\n";
327 }
328 }
329
330 declareUniforms(decl, spec.values);
331
332 for (size_t ndx = 0; ndx < spec.values.outputs.size(); ndx++)
333 {
334 const Value& val = spec.values.outputs[ndx];
335 const DataType valueType = val.type.getBasicType();
336 const char* const valueTypeStr = getDataTypeName(valueType);
337 const DataType transportType = getTransportType(valueType);
338 const char* const transportTypeStr = getDataTypeName(transportType);
339 const int numLocs = getNumTransportLocations(valueType);
340
341 decl << "layout(location = " << curOutputLoc << ") flat out ";
342
343 curOutputLoc += numLocs;
344
345 if (valueType == transportType)
346 decl << transportTypeStr << " " << val.name << ";\n";
347 else
348 {
349 decl << transportTypeStr << " v_" << val.name << ";\n";
350 decl << valueTypeStr << " " << val.name << ";\n";
351
352 output << "v_" << val.name << " = " << transportTypeStr << "(" << val.name << ");\n";
353 }
354 }
355
356 // Shader specialization.
357 map<string, string> params;
358 params.insert(pair<string, string>("DECLARATIONS", decl.str()));
359 params.insert(pair<string, string>("SETUP", setup.str()));
360 params.insert(pair<string, string>("OUTPUT", output.str()));
361 params.insert(pair<string, string>("POSITION_FRAG_COLOR", "gl_Position"));
362
363 StringTemplate tmpl (src);
364 const string baseSrc = tmpl.specialize(params);
365 const string withExt = injectExtensionRequirements(baseSrc, spec.programs[0].requiredExtensions, glu::SHADERTYPE_VERTEX);
366
367 return withExt;
368 }
369
370 // Specialize a shader for the fragment shader test case.
specializeFragmentShader(const ShaderCaseSpecification & spec,const string & src)371 string specializeFragmentShader (const ShaderCaseSpecification& spec, const string& src)
372 {
373 ostringstream decl;
374 ostringstream setup;
375 ostringstream output;
376 int curInputLoc = 0;
377
378 // generated from "both" case
379 DE_ASSERT(spec.caseType == glu::sl::CASETYPE_FRAGMENT_ONLY);
380
381 genCompareFunctions(decl, spec.values, false);
382 genCompareOp(output, "dEQP_FragColor", spec.values, DE_NULL);
383
384 decl << "layout(location = 0) out mediump vec4 dEQP_FragColor;\n";
385
386 for (size_t ndx = 0; ndx < spec.values.inputs.size(); ndx++)
387 {
388 const Value& val = spec.values.inputs[ndx];
389 const DataType valueType = val.type.getBasicType();
390 const char* const valueTypeStr = getDataTypeName(valueType);
391 const DataType transportType = getTransportType(valueType);
392 const char* const transportTypeStr = getDataTypeName(transportType);
393 const int numLocs = getNumTransportLocations(valueType);
394
395 decl << "layout(location = " << curInputLoc << ") flat in ";
396
397 curInputLoc += numLocs;
398
399 if (valueType == transportType)
400 decl << transportTypeStr << " " << val.name << ";\n";
401 else
402 {
403 decl << transportTypeStr << " v_" << val.name << ";\n";
404 setup << valueTypeStr << " " << val.name << " = " << valueTypeStr << "(v_" << val.name << ");\n";
405 }
406 }
407
408 declareUniforms(decl, spec.values);
409 declareReferenceBlock(decl, spec.values);
410
411 for (size_t ndx = 0; ndx < spec.values.outputs.size(); ndx++)
412 {
413 const Value& val = spec.values.outputs[ndx];
414 const DataType basicType = val.type.getBasicType();
415 const char* const refTypeStr = getDataTypeName(basicType);
416
417 decl << refTypeStr << " " << val.name << ";\n";
418 }
419
420 // Shader specialization.
421 map<string, string> params;
422 params.insert(pair<string, string>("DECLARATIONS", decl.str()));
423 params.insert(pair<string, string>("SETUP", setup.str()));
424 params.insert(pair<string, string>("OUTPUT", output.str()));
425 params.insert(pair<string, string>("POSITION_FRAG_COLOR", "dEQP_FragColor"));
426
427 StringTemplate tmpl (src);
428 const string baseSrc = tmpl.specialize(params);
429 const string withExt = injectExtensionRequirements(baseSrc, spec.programs[0].requiredExtensions, glu::SHADERTYPE_FRAGMENT);
430
431 return withExt;
432 }
433
generateVertexSpecialization(const ProgramSpecializationParams & specParams)434 map<string, string> generateVertexSpecialization (const ProgramSpecializationParams& specParams)
435 {
436 ostringstream decl;
437 ostringstream setup;
438 map<string, string> params;
439 int curInputLoc = 0;
440
441 decl << "layout(location = 0) in highp vec4 dEQP_Position;\n";
442 curInputLoc += 1;
443
444 for (size_t ndx = 0; ndx < specParams.caseSpec.values.inputs.size(); ndx++)
445 {
446 const Value& val = specParams.caseSpec.values.inputs[ndx];
447 const DataType valueType = val.type.getBasicType();
448 const char* const valueTypeStr = getDataTypeName(valueType);
449 const DataType transportType = getTransportType(valueType);
450 const char* const transportTypeStr = getDataTypeName(transportType);
451 const int numLocs = getNumTransportLocations(valueType);
452
453 decl << "layout(location = " << curInputLoc << ") in ";
454
455 curInputLoc += numLocs;
456
457 if (valueType == transportType)
458 decl << transportTypeStr << " " << val.name << ";\n";
459 else
460 {
461 decl << transportTypeStr << " a_" << val.name << ";\n";
462 setup << valueTypeStr << " " << val.name << " = " << valueTypeStr << "(a_" << val.name << ");\n";
463 }
464 }
465
466 declareUniforms(decl, specParams.caseSpec.values);
467
468 params.insert(pair<string, string>("VERTEX_DECLARATIONS", decl.str()));
469 params.insert(pair<string, string>("VERTEX_SETUP", setup.str()));
470 params.insert(pair<string, string>("VERTEX_OUTPUT", string("gl_Position = dEQP_Position;\n")));
471
472 return params;
473 }
474
generateFragmentSpecialization(const ProgramSpecializationParams & specParams)475 map<string, string> generateFragmentSpecialization (const ProgramSpecializationParams& specParams)
476 {
477 ostringstream decl;
478 ostringstream output;
479 map<string, string> params;
480
481 genCompareFunctions(decl, specParams.caseSpec.values, false);
482 genCompareOp(output, "dEQP_FragColor", specParams.caseSpec.values, DE_NULL);
483
484 decl << "layout(location = 0) out mediump vec4 dEQP_FragColor;\n";
485
486 for (size_t ndx = 0; ndx < specParams.caseSpec.values.outputs.size(); ndx++)
487 {
488 const Value& val = specParams.caseSpec.values.outputs[ndx];
489 const char* const refTypeStr = getDataTypeName(val.type.getBasicType());
490
491 decl << refTypeStr << " " << val.name << ";\n";
492 }
493
494 declareReferenceBlock(decl, specParams.caseSpec.values);
495 declareUniforms(decl, specParams.caseSpec.values);
496
497 params.insert(pair<string, string>("FRAGMENT_DECLARATIONS", decl.str()));
498 params.insert(pair<string, string>("FRAGMENT_OUTPUT", output.str()));
499 params.insert(pair<string, string>("FRAG_COLOR", "dEQP_FragColor"));
500
501 return params;
502 }
503
generateGeometrySpecialization(const ProgramSpecializationParams & specParams)504 map<string, string> generateGeometrySpecialization (const ProgramSpecializationParams& specParams)
505 {
506 ostringstream decl;
507 map<string, string> params;
508
509 decl << "layout (triangles) in;\n";
510 decl << "layout (triangle_strip, max_vertices=3) out;\n";
511 decl << "\n";
512
513 declareUniforms(decl, specParams.caseSpec.values);
514
515 params.insert(pair<string, string>("GEOMETRY_DECLARATIONS", decl.str()));
516
517 return params;
518 }
519
generateTessControlSpecialization(const ProgramSpecializationParams & specParams)520 map<string, string> generateTessControlSpecialization (const ProgramSpecializationParams& specParams)
521 {
522 ostringstream decl;
523 ostringstream output;
524 map<string, string> params;
525
526 decl << "layout (vertices=3) out;\n";
527 decl << "\n";
528
529 declareUniforms(decl, specParams.caseSpec.values);
530
531 output << "gl_out[gl_InvocationID].gl_Position = gl_in[gl_InvocationID].gl_Position;\n"
532 "gl_TessLevelInner[0] = 2.0;\n"
533 "gl_TessLevelInner[1] = 2.0;\n"
534 "gl_TessLevelOuter[0] = 2.0;\n"
535 "gl_TessLevelOuter[1] = 2.0;\n"
536 "gl_TessLevelOuter[2] = 2.0;\n"
537 "gl_TessLevelOuter[3] = 2.0;";
538
539 params.insert(pair<string, string>("TESSELLATION_CONTROL_DECLARATIONS", decl.str()));
540 params.insert(pair<string, string>("TESSELLATION_CONTROL_OUTPUT", output.str()));
541 params.insert(pair<string, string>("GL_MAX_PATCH_VERTICES", de::toString(specParams.maxPatchVertices)));
542
543 return params;
544 }
545
generateTessEvalSpecialization(const ProgramSpecializationParams & specParams)546 map<string, string> generateTessEvalSpecialization (const ProgramSpecializationParams& specParams)
547 {
548 ostringstream decl;
549 ostringstream output;
550 map<string, string> params;
551
552 decl << "layout (triangles) in;\n";
553 decl << "\n";
554
555 declareUniforms(decl, specParams.caseSpec.values);
556
557 output << "gl_Position = gl_TessCoord[0] * gl_in[0].gl_Position + gl_TessCoord[1] * gl_in[1].gl_Position + gl_TessCoord[2] * gl_in[2].gl_Position;\n";
558
559 params.insert(pair<string, string>("TESSELLATION_EVALUATION_DECLARATIONS", decl.str()));
560 params.insert(pair<string, string>("TESSELLATION_EVALUATION_OUTPUT", output.str()));
561 params.insert(pair<string, string>("GL_MAX_PATCH_VERTICES", de::toString(specParams.maxPatchVertices)));
562
563 return params;
564 }
565
specializeShaderSources(ProgramSources & dst,const ProgramSources & src,const ProgramSpecializationParams & specParams,glu::ShaderType shaderType,map<string,string> (* specializationGenerator)(const ProgramSpecializationParams & specParams))566 void specializeShaderSources (ProgramSources& dst,
567 const ProgramSources& src,
568 const ProgramSpecializationParams& specParams,
569 glu::ShaderType shaderType,
570 map<string, string> (*specializationGenerator) (const ProgramSpecializationParams& specParams))
571 {
572 if (!src.sources[shaderType].empty())
573 {
574 const map<string, string> tmplParams = specializationGenerator(specParams);
575
576 for (size_t ndx = 0; ndx < src.sources[shaderType].size(); ++ndx)
577 {
578 const StringTemplate tmpl (src.sources[shaderType][ndx]);
579 const string baseGLSLCode = tmpl.specialize(tmplParams);
580 const string sourceWithExts = injectExtensionRequirements(baseGLSLCode, specParams.requiredExtensions, shaderType);
581
582 dst << glu::ShaderSource(shaderType, sourceWithExts);
583 }
584 }
585 }
586
specializeProgramSources(glu::ProgramSources & dst,const glu::ProgramSources & src,const ProgramSpecializationParams & specParams)587 void specializeProgramSources (glu::ProgramSources& dst,
588 const glu::ProgramSources& src,
589 const ProgramSpecializationParams& specParams)
590 {
591 specializeShaderSources(dst, src, specParams, glu::SHADERTYPE_VERTEX, generateVertexSpecialization);
592 specializeShaderSources(dst, src, specParams, glu::SHADERTYPE_FRAGMENT, generateFragmentSpecialization);
593 specializeShaderSources(dst, src, specParams, glu::SHADERTYPE_GEOMETRY, generateGeometrySpecialization);
594 specializeShaderSources(dst, src, specParams, glu::SHADERTYPE_TESSELLATION_CONTROL, generateTessControlSpecialization);
595 specializeShaderSources(dst, src, specParams, glu::SHADERTYPE_TESSELLATION_EVALUATION, generateTessEvalSpecialization);
596
597 dst << glu::ProgramSeparable(src.separable);
598 }
599
600 struct ValueBufferLayout
601 {
602 struct Entry
603 {
604 int offset;
605 int vecStride; //! Applies to matrices only
606
Entryvkt::__anon9520bb000111::ValueBufferLayout::Entry607 Entry (void) : offset(0), vecStride(0) {}
Entryvkt::__anon9520bb000111::ValueBufferLayout::Entry608 Entry (int offset_, int vecStride_) : offset(offset_), vecStride(vecStride_) {}
609 };
610
611 vector<Entry> entries;
612 int size;
613
ValueBufferLayoutvkt::__anon9520bb000111::ValueBufferLayout614 ValueBufferLayout (void) : size(0) {}
615 };
616
computeStd140Layout(const vector<Value> & values)617 ValueBufferLayout computeStd140Layout (const vector<Value>& values)
618 {
619 ValueBufferLayout layout;
620
621 layout.entries.resize(values.size());
622
623 for (size_t ndx = 0; ndx < values.size(); ++ndx)
624 {
625 const DataType basicType = values[ndx].type.getBasicType();
626 const bool isMatrix = isDataTypeMatrix(basicType);
627 const int numVecs = isMatrix ? getDataTypeMatrixNumColumns(basicType) : 1;
628 const DataType vecType = isMatrix ? glu::getDataTypeFloatVec(getDataTypeMatrixNumRows(basicType)) : basicType;
629 const int vecSize = getDataTypeScalarSize(vecType);
630 const int alignment = ((isMatrix || vecSize == 3) ? 4 : vecSize)*int(sizeof(deUint32));
631
632 layout.size = deAlign32(layout.size, alignment);
633 layout.entries[ndx] = ValueBufferLayout::Entry(layout.size, alignment);
634 layout.size += alignment*(numVecs-1) + vecSize*int(sizeof(deUint32));
635 }
636
637 return layout;
638 }
639
computeStd430Layout(const vector<Value> & values)640 ValueBufferLayout computeStd430Layout (const vector<Value>& values)
641 {
642 ValueBufferLayout layout;
643
644 layout.entries.resize(values.size());
645
646 for (size_t ndx = 0; ndx < values.size(); ++ndx)
647 {
648 const DataType basicType = values[ndx].type.getBasicType();
649 const int numVecs = isDataTypeMatrix(basicType) ? getDataTypeMatrixNumColumns(basicType) : 1;
650 const DataType vecType = isDataTypeMatrix(basicType) ? glu::getDataTypeFloatVec(getDataTypeMatrixNumRows(basicType)) : basicType;
651 const int vecSize = getDataTypeScalarSize(vecType);
652 const int alignment = (vecSize == 3 ? 4 : vecSize)*int(sizeof(deUint32));
653
654 layout.size = deAlign32(layout.size, alignment);
655 layout.entries[ndx] = ValueBufferLayout::Entry(layout.size, alignment);
656 layout.size += alignment*(numVecs-1) + vecSize*int(sizeof(deUint32));
657 }
658
659 return layout;
660 }
661
copyToLayout(void * dst,const ValueBufferLayout::Entry & entryLayout,const Value & value,int arrayNdx)662 void copyToLayout (void* dst, const ValueBufferLayout::Entry& entryLayout, const Value& value, int arrayNdx)
663 {
664 const DataType basicType = value.type.getBasicType();
665 const int scalarSize = getDataTypeScalarSize(basicType);
666 const int numVecs = isDataTypeMatrix(basicType) ? getDataTypeMatrixNumColumns(basicType) : 1;
667 const int numComps = isDataTypeMatrix(basicType) ? getDataTypeMatrixNumRows(basicType) : scalarSize;
668
669 DE_ASSERT(size_t((arrayNdx+1)*scalarSize) <= value.elements.size());
670
671 if (isDataTypeBoolOrBVec(basicType))
672 {
673 for (int vecNdx = 0; vecNdx < numVecs; vecNdx++)
674 {
675 for (int compNdx = 0; compNdx < numComps; compNdx++)
676 {
677 const deUint32 data = value.elements[arrayNdx*scalarSize + vecNdx*numComps + compNdx].bool32 ? ~0u : 0u;
678
679 deMemcpy((deUint8*)dst + entryLayout.offset + vecNdx*entryLayout.vecStride + compNdx * sizeof(deUint32),
680 &data,
681 sizeof(deUint32));
682 }
683 }
684 }
685 else
686 {
687 for (int vecNdx = 0; vecNdx < numVecs; vecNdx++)
688 deMemcpy((deUint8*)dst + entryLayout.offset + vecNdx*entryLayout.vecStride,
689 &value.elements[arrayNdx*scalarSize + vecNdx*numComps],
690 numComps*sizeof(deUint32));
691 }
692 }
693
copyToLayout(void * dst,const ValueBufferLayout & layout,const vector<Value> & values,int arrayNdx)694 void copyToLayout (void* dst, const ValueBufferLayout& layout, const vector<Value>& values, int arrayNdx)
695 {
696 DE_ASSERT(layout.entries.size() == values.size());
697
698 for (size_t ndx = 0; ndx < values.size(); ndx++)
699 copyToLayout(dst, layout.entries[ndx], values[ndx], arrayNdx);
700 }
701
getShaderStages(const ShaderCaseSpecification & spec)702 deUint32 getShaderStages (const ShaderCaseSpecification& spec)
703 {
704 if (spec.caseType == glu::sl::CASETYPE_COMPLETE)
705 {
706 deUint32 stages = 0u;
707
708 for (size_t progNdx = 0; progNdx < spec.programs.size(); progNdx++)
709 {
710 for (int shaderType = 0; shaderType < glu::SHADERTYPE_LAST; shaderType++)
711 {
712 if (!spec.programs[progNdx].sources.sources[shaderType].empty())
713 stages |= (1u << shaderType);
714 }
715 }
716
717 return stages;
718 }
719 else
720 return (1u << glu::SHADERTYPE_VERTEX) | (1u << glu::SHADERTYPE_FRAGMENT);
721 }
722
723 class PipelineProgram
724 {
725 public:
726 PipelineProgram (Context& context, const ShaderCaseSpecification& spec);
727
getStages(void) const728 deUint32 getStages (void) const { return m_stages; }
729
hasShader(glu::ShaderType type) const730 bool hasShader (glu::ShaderType type) const { return (m_stages & (1u << type)) != 0; }
getShader(glu::ShaderType type) const731 vk::VkShaderModule getShader (glu::ShaderType type) const { return *m_shaderModules[type]; }
732
733 private:
734 const deUint32 m_stages;
735 Move<vk::VkShaderModule> m_shaderModules[glu::SHADERTYPE_LAST];
736 };
737
PipelineProgram(Context & context,const ShaderCaseSpecification & spec)738 PipelineProgram::PipelineProgram (Context& context, const ShaderCaseSpecification& spec)
739 : m_stages(getShaderStages(spec))
740 {
741 // \note Currently only a single source program is supported as framework lacks SPIR-V linking capability
742 TCU_CHECK_INTERNAL(spec.programs.size() == 1);
743
744 for (int shaderType = 0; shaderType < glu::SHADERTYPE_LAST; shaderType++)
745 {
746 if ((m_stages & (1u << shaderType)) != 0)
747 {
748 m_shaderModules[shaderType] = vk::createShaderModule(context.getDeviceInterface(), context.getDevice(),
749 context.getBinaryCollection().get(getShaderName((glu::ShaderType)shaderType, 0)), 0u);
750 }
751 }
752 }
753
createBuffer(Context & context,vk::VkDeviceSize size,vk::VkBufferUsageFlags usageFlags)754 Move<vk::VkBuffer> createBuffer (Context& context, vk::VkDeviceSize size, vk::VkBufferUsageFlags usageFlags)
755 {
756 const deUint32 queueFamilyIndex = context.getUniversalQueueFamilyIndex();
757 const vk::VkBufferCreateInfo params =
758 {
759 vk::VK_STRUCTURE_TYPE_BUFFER_CREATE_INFO, // sType
760 DE_NULL, // pNext
761 0u, // flags
762 size, // size
763 usageFlags, // usage
764 vk::VK_SHARING_MODE_EXCLUSIVE, // sharingMode
765 1u, // queueFamilyCount
766 &queueFamilyIndex, // pQueueFamilyIndices
767 };
768
769 return vk::createBuffer(context.getDeviceInterface(), context.getDevice(), ¶ms);
770 }
771
createImage2D(Context & context,deUint32 width,deUint32 height,vk::VkFormat format,vk::VkImageTiling tiling,vk::VkImageUsageFlags usageFlags)772 Move<vk::VkImage> createImage2D (Context& context, deUint32 width, deUint32 height, vk::VkFormat format, vk::VkImageTiling tiling, vk::VkImageUsageFlags usageFlags)
773 {
774 const deUint32 queueFamilyIndex = context.getUniversalQueueFamilyIndex();
775 const vk::VkImageCreateInfo params =
776 {
777 vk::VK_STRUCTURE_TYPE_IMAGE_CREATE_INFO, // sType
778 DE_NULL, // pNext
779 0u, // flags
780 vk::VK_IMAGE_TYPE_2D, // imageType
781 format, // format
782 { width, height, 1u }, // extent
783 1u, // mipLevels
784 1u, // arraySize
785 vk::VK_SAMPLE_COUNT_1_BIT, // samples
786 tiling, // tiling
787 usageFlags, // usage
788 vk::VK_SHARING_MODE_EXCLUSIVE, // sharingMode
789 1u, // queueFamilyCount
790 &queueFamilyIndex, // pQueueFamilyIndices
791 vk::VK_IMAGE_LAYOUT_UNDEFINED, // initialLayout
792 };
793
794 return vk::createImage(context.getDeviceInterface(), context.getDevice(), ¶ms);
795 }
796
createAttachmentView(Context & context,vk::VkImage image,vk::VkFormat format)797 Move<vk::VkImageView> createAttachmentView (Context& context, vk::VkImage image, vk::VkFormat format)
798 {
799 const vk::VkImageViewCreateInfo params =
800 {
801 vk::VK_STRUCTURE_TYPE_IMAGE_VIEW_CREATE_INFO, // sType
802 DE_NULL, // pNext
803 0u, // flags
804 image, // image
805 vk::VK_IMAGE_VIEW_TYPE_2D, // viewType
806 format, // format
807 vk::makeComponentMappingRGBA(), // channels
808 {
809 vk::VK_IMAGE_ASPECT_COLOR_BIT, // aspectMask
810 0u, // baseMipLevel
811 1u, // mipLevels
812 0u, // baseArrayLayer
813 1u, // arraySize
814 }, // subresourceRange
815 };
816
817 return vk::createImageView(context.getDeviceInterface(), context.getDevice(), ¶ms);
818 }
819
createRenderPass(Context & context,vk::VkFormat colorAttFormat,deUint32 size)820 Move<vk::VkRenderPass> createRenderPass (Context& context, vk::VkFormat colorAttFormat, deUint32 size)
821 {
822 vk::VkAttachmentDescription colorAttDesc[4];
823 vk::VkAttachmentReference colorAttRef[4];
824
825 for (deUint32 i = 0; i < size; i++)
826 {
827 vk::VkAttachmentDescription desc =
828 {
829 0u, // flags
830 colorAttFormat, // format
831 vk::VK_SAMPLE_COUNT_1_BIT, // samples
832 vk::VK_ATTACHMENT_LOAD_OP_CLEAR, // loadOp
833 vk::VK_ATTACHMENT_STORE_OP_STORE, // storeOp
834 vk::VK_ATTACHMENT_LOAD_OP_DONT_CARE, // stencilLoadOp
835 vk::VK_ATTACHMENT_STORE_OP_DONT_CARE, // stencilStoreOp
836 vk::VK_IMAGE_LAYOUT_COLOR_ATTACHMENT_OPTIMAL, // initialLayout
837 vk::VK_IMAGE_LAYOUT_COLOR_ATTACHMENT_OPTIMAL, // finalLayout
838 };
839 colorAttDesc[i] = desc;
840
841 vk::VkAttachmentReference ref =
842 {
843 i, // attachment
844 vk::VK_IMAGE_LAYOUT_COLOR_ATTACHMENT_OPTIMAL, // layout
845 };
846 colorAttRef[i] = ref;
847 }
848
849 const vk::VkAttachmentReference dsAttRef =
850 {
851 VK_ATTACHMENT_UNUSED, // attachment
852 vk::VK_IMAGE_LAYOUT_GENERAL, // layout
853 };
854 const vk::VkSubpassDescription subpassDesc =
855 {
856 (vk::VkSubpassDescriptionFlags)0,
857 vk::VK_PIPELINE_BIND_POINT_GRAPHICS, // pipelineBindPoint
858 0u, // inputCount
859 DE_NULL, // pInputAttachments
860 size, // colorCount
861 &colorAttRef[0], // pColorAttachments
862 DE_NULL, // pResolveAttachments
863 &dsAttRef, // depthStencilAttachment
864 0u, // preserveCount
865 DE_NULL, // pPreserveAttachments
866
867 };
868 const vk::VkRenderPassCreateInfo renderPassParams =
869 {
870 vk::VK_STRUCTURE_TYPE_RENDER_PASS_CREATE_INFO, // sType
871 DE_NULL, // pNext
872 (vk::VkRenderPassCreateFlags)0,
873 size, // attachmentCount
874 &colorAttDesc[0], // pAttachments
875 1u, // subpassCount
876 &subpassDesc, // pSubpasses
877 0u, // dependencyCount
878 DE_NULL, // pDependencies
879 };
880
881 return vk::createRenderPass(context.getDeviceInterface(), context.getDevice(), &renderPassParams);
882 }
883
getVkStageFlags(deUint32 stages)884 vk::VkShaderStageFlags getVkStageFlags (deUint32 stages)
885 {
886 vk::VkShaderStageFlags vkStages = 0u;
887
888 for (int shaderType = 0; shaderType < glu::SHADERTYPE_LAST; shaderType++)
889 {
890 if ((stages & (1u << shaderType)) != 0)
891 vkStages |= vk::getVkShaderStage((glu::ShaderType)shaderType);
892 }
893
894 return vkStages;
895 }
896
createDescriptorSetLayout(Context & context,deUint32 shaderStages)897 Move<vk::VkDescriptorSetLayout> createDescriptorSetLayout (Context& context, deUint32 shaderStages)
898 {
899 DE_STATIC_ASSERT(REFERENCE_UNIFORM_BINDING == 0);
900 DE_STATIC_ASSERT(USER_UNIFORM_BINDING == 1);
901
902 return vk::DescriptorSetLayoutBuilder()
903 .addSingleBinding(vk::VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER, vk::VK_SHADER_STAGE_FRAGMENT_BIT)
904 .addSingleBinding(vk::VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER, getVkStageFlags(shaderStages))
905 .build(context.getDeviceInterface(), context.getDevice());
906 }
907
createPipelineLayout(Context & context,vk::VkDescriptorSetLayout descriptorSetLayout)908 Move<vk::VkPipelineLayout> createPipelineLayout (Context& context, vk::VkDescriptorSetLayout descriptorSetLayout)
909 {
910 const vk::VkPipelineLayoutCreateInfo params =
911 {
912 vk::VK_STRUCTURE_TYPE_PIPELINE_LAYOUT_CREATE_INFO, // sType
913 DE_NULL, // pNext
914 (vk::VkPipelineLayoutCreateFlags)0,
915 1u, // descriptorSetCount
916 &descriptorSetLayout, // pSetLayouts
917 0u, // pushConstantRangeCount
918 DE_NULL, // pPushConstantRanges
919 };
920
921 return vk::createPipelineLayout(context.getDeviceInterface(), context.getDevice(), ¶ms);
922 }
923
getVecFormat(DataType scalarType,int scalarSize)924 vk::VkFormat getVecFormat (DataType scalarType, int scalarSize)
925 {
926 switch (scalarType)
927 {
928 case glu::TYPE_FLOAT:
929 {
930 const vk::VkFormat vecFmts[] =
931 {
932 vk::VK_FORMAT_R32_SFLOAT,
933 vk::VK_FORMAT_R32G32_SFLOAT,
934 vk::VK_FORMAT_R32G32B32_SFLOAT,
935 vk::VK_FORMAT_R32G32B32A32_SFLOAT,
936 };
937 return de::getSizedArrayElement<4>(vecFmts, scalarSize-1);
938 }
939
940 case glu::TYPE_INT:
941 {
942 const vk::VkFormat vecFmts[] =
943 {
944 vk::VK_FORMAT_R32_SINT,
945 vk::VK_FORMAT_R32G32_SINT,
946 vk::VK_FORMAT_R32G32B32_SINT,
947 vk::VK_FORMAT_R32G32B32A32_SINT,
948 };
949 return de::getSizedArrayElement<4>(vecFmts, scalarSize-1);
950 }
951
952 case glu::TYPE_UINT:
953 {
954 const vk::VkFormat vecFmts[] =
955 {
956 vk::VK_FORMAT_R32_UINT,
957 vk::VK_FORMAT_R32G32_UINT,
958 vk::VK_FORMAT_R32G32B32_UINT,
959 vk::VK_FORMAT_R32G32B32A32_UINT,
960 };
961 return de::getSizedArrayElement<4>(vecFmts, scalarSize-1);
962 }
963
964 case glu::TYPE_BOOL:
965 {
966 const vk::VkFormat vecFmts[] =
967 {
968 vk::VK_FORMAT_R32_UINT,
969 vk::VK_FORMAT_R32G32_UINT,
970 vk::VK_FORMAT_R32G32B32_UINT,
971 vk::VK_FORMAT_R32G32B32A32_UINT,
972 };
973 return de::getSizedArrayElement<4>(vecFmts, scalarSize-1);
974 }
975
976 default:
977 DE_FATAL("Unknown scalar type");
978 return vk::VK_FORMAT_R8G8B8A8_UINT;
979 }
980 }
981
getVertexAttributeDescriptions(const vector<Value> & inputValues,const ValueBufferLayout & layout)982 vector<vk::VkVertexInputAttributeDescription> getVertexAttributeDescriptions (const vector<Value>& inputValues, const ValueBufferLayout& layout)
983 {
984 vector<vk::VkVertexInputAttributeDescription> attribs;
985
986 // Position
987 {
988 const vk::VkVertexInputAttributeDescription posDesc =
989 {
990 0u, // location
991 0u, // binding
992 vk::VK_FORMAT_R32G32_SFLOAT, // format
993 0u, // offset
994 };
995
996 attribs.push_back(posDesc);
997 }
998
999 // Input values
1000 for (size_t inputNdx = 0; inputNdx < inputValues.size(); inputNdx++)
1001 {
1002 const Value& input = inputValues[inputNdx];
1003 const ValueBufferLayout::Entry& layoutEntry = layout.entries[inputNdx];
1004 const DataType basicType = input.type.getBasicType();
1005 const int numVecs = isDataTypeMatrix(basicType)
1006 ? getDataTypeMatrixNumColumns(basicType)
1007 : 1;
1008 const int vecSize = isDataTypeMatrix(basicType)
1009 ? getDataTypeMatrixNumRows(basicType)
1010 : getDataTypeScalarSize(basicType);
1011 const DataType scalarType = getDataTypeScalarType(basicType);
1012 const vk::VkFormat vecFmt = getVecFormat(scalarType, vecSize);
1013
1014 for (int vecNdx = 0; vecNdx < numVecs; vecNdx++)
1015 {
1016 const deUint32 curLoc = (deUint32)attribs.size();
1017 const deUint32 offset = (deUint32)(layoutEntry.offset + layoutEntry.vecStride*vecNdx);
1018 const vk::VkVertexInputAttributeDescription desc =
1019 {
1020 curLoc, // location
1021 1u, // binding
1022 vecFmt, // format
1023 offset, // offset
1024 };
1025
1026 attribs.push_back(desc);
1027 }
1028 }
1029
1030 return attribs;
1031 }
1032
createPipeline(Context & context,const vector<Value> & inputValues,const ValueBufferLayout & inputLayout,const PipelineProgram & program,vk::VkRenderPass renderPass,vk::VkPipelineLayout pipelineLayout,tcu::UVec2 renderSize,deUint32 size)1033 Move<vk::VkPipeline> createPipeline (Context& context,
1034 const vector<Value>& inputValues,
1035 const ValueBufferLayout& inputLayout,
1036 const PipelineProgram& program,
1037 vk::VkRenderPass renderPass,
1038 vk::VkPipelineLayout pipelineLayout,
1039 tcu::UVec2 renderSize,
1040 deUint32 size)
1041 {
1042 const vk::VkShaderModule vertShader = program.hasShader(glu::SHADERTYPE_VERTEX) ? program.getShader(glu::SHADERTYPE_VERTEX) : DE_NULL;
1043 const vk::VkShaderModule tessControlShader = program.hasShader(glu::SHADERTYPE_TESSELLATION_CONTROL) ? program.getShader(glu::SHADERTYPE_TESSELLATION_CONTROL) : DE_NULL;
1044 const vk::VkShaderModule tessEvalShader = program.hasShader(glu::SHADERTYPE_TESSELLATION_EVALUATION) ? program.getShader(glu::SHADERTYPE_TESSELLATION_EVALUATION) : DE_NULL;
1045 const vk::VkShaderModule geomShader = program.hasShader(glu::SHADERTYPE_GEOMETRY) ? program.getShader(glu::SHADERTYPE_GEOMETRY) : DE_NULL;
1046 const vk::VkShaderModule fragShader = program.hasShader(glu::SHADERTYPE_FRAGMENT) ? program.getShader(glu::SHADERTYPE_FRAGMENT) : DE_NULL;
1047 const vector<vk::VkVertexInputAttributeDescription> vertexAttribParams (getVertexAttributeDescriptions(inputValues, inputLayout));
1048 const vector<vk::VkViewport> viewports (1, vk::makeViewport(renderSize));
1049 const vector<vk::VkRect2D> scissors (1, vk::makeRect2D(renderSize));
1050 const vk::VkVertexInputBindingDescription vertexBindings[] =
1051 {
1052 {
1053 0u, // binding
1054 (deUint32)sizeof(tcu::Vec2), // stride
1055 vk::VK_VERTEX_INPUT_RATE_VERTEX, // stepRate
1056 },
1057 {
1058 1u, // binding
1059 0u, // stride
1060 vk::VK_VERTEX_INPUT_RATE_INSTANCE, // stepRate
1061 },
1062 };
1063 const vk::VkPipelineVertexInputStateCreateInfo vertexInputStateParams =
1064 {
1065 vk::VK_STRUCTURE_TYPE_PIPELINE_VERTEX_INPUT_STATE_CREATE_INFO, // sType
1066 DE_NULL, // pNext
1067 (vk::VkPipelineVertexInputStateCreateFlags)0,
1068 (inputValues.empty() ? 1u : 2u), // bindingCount
1069 vertexBindings, // pVertexBindingDescriptions
1070 (deUint32)vertexAttribParams.size(), // attributeCount
1071 &vertexAttribParams[0], // pVertexAttributeDescriptions
1072 };
1073 const vk::VkColorComponentFlags allCompMask = vk::VK_COLOR_COMPONENT_R_BIT
1074 | vk::VK_COLOR_COMPONENT_G_BIT
1075 | vk::VK_COLOR_COMPONENT_B_BIT
1076 | vk::VK_COLOR_COMPONENT_A_BIT;
1077 vk::VkPipelineColorBlendAttachmentState attBlendParams[4];
1078 for (deUint32 i = 0; i < size; i++)
1079 {
1080 vk::VkPipelineColorBlendAttachmentState blend =
1081 {
1082 VK_FALSE, // blendEnable
1083 vk::VK_BLEND_FACTOR_ONE, // srcBlendColor
1084 vk::VK_BLEND_FACTOR_ZERO, // destBlendColor
1085 vk::VK_BLEND_OP_ADD, // blendOpColor
1086 vk::VK_BLEND_FACTOR_ONE, // srcBlendAlpha
1087 vk::VK_BLEND_FACTOR_ZERO, // destBlendAlpha
1088 vk::VK_BLEND_OP_ADD, // blendOpAlpha
1089 allCompMask, // componentWriteMask
1090 };
1091 attBlendParams[i] = blend;
1092 }
1093
1094 const vk::VkPipelineColorBlendStateCreateInfo blendParams =
1095 {
1096 vk::VK_STRUCTURE_TYPE_PIPELINE_COLOR_BLEND_STATE_CREATE_INFO, // sType
1097 DE_NULL, // pNext
1098 (vk::VkPipelineColorBlendStateCreateFlags)0,
1099 VK_FALSE, // logicOpEnable
1100 vk::VK_LOGIC_OP_COPY, // logicOp
1101 size, // attachmentCount
1102 &attBlendParams[0], // pAttachments
1103 { 0.0f, 0.0f, 0.0f, 0.0f }, // blendConstants
1104 };
1105
1106 return vk::makeGraphicsPipeline(context.getDeviceInterface(), // const DeviceInterface& vk
1107 context.getDevice(), // const VkDevice device
1108 pipelineLayout, // const VkPipelineLayout pipelineLayout
1109 vertShader, // const VkShaderModule vertexShaderModule
1110 tessControlShader, // const VkShaderModule tessellationControlShaderModule
1111 tessEvalShader, // const VkShaderModule tessellationEvalShaderModule
1112 geomShader, // const VkShaderModule geometryShaderModule
1113 fragShader, // const VkShaderModule fragmentShaderModule
1114 renderPass, // const VkRenderPass renderPass
1115 viewports, // const std::vector<VkViewport>& viewports
1116 scissors, // const std::vector<VkRect2D>& scissors
1117 vk::VK_PRIMITIVE_TOPOLOGY_TRIANGLE_LIST, // const VkPrimitiveTopology topology
1118 0u, // const deUint32 subpass
1119 0u, // const deUint32 patchControlPoints
1120 &vertexInputStateParams, // const VkPipelineVertexInputStateCreateInfo* vertexInputStateCreateInfo
1121 DE_NULL, // const VkPipelineRasterizationStateCreateInfo* rasterizationStateCreateInfo
1122 DE_NULL, // const VkPipelineMultisampleStateCreateInfo* multisampleStateCreateInfo
1123 DE_NULL, // const VkPipelineDepthStencilStateCreateInfo* depthStencilStateCreateInfo
1124 &blendParams); // const VkPipelineColorBlendStateCreateInfo* colorBlendStateCreateInfo
1125 }
1126
createFramebuffer(Context & context,vk::VkRenderPass renderPass,Move<vk::VkImageView> colorAttView[4],deUint32 size,int width,int height)1127 Move<vk::VkFramebuffer> createFramebuffer (Context& context, vk::VkRenderPass renderPass, Move<vk::VkImageView> colorAttView[4], deUint32 size, int width, int height)
1128 {
1129 vk::VkImageView att[4];
1130 for (deUint32 i = 0; i < size; i++)
1131 {
1132 att[i] = *colorAttView[i];
1133 }
1134 const vk::VkFramebufferCreateInfo framebufferParams =
1135 {
1136 vk::VK_STRUCTURE_TYPE_FRAMEBUFFER_CREATE_INFO, // sType
1137 DE_NULL, // pNext
1138 (vk::VkFramebufferCreateFlags)0,
1139 renderPass, // renderPass
1140 size, // attachmentCount
1141 &att[0], // pAttachments
1142 (deUint32)width, // width
1143 (deUint32)height, // height
1144 1u, // layers
1145 };
1146
1147 return vk::createFramebuffer(context.getDeviceInterface(), context.getDevice(), &framebufferParams);
1148 }
1149
createCommandPool(Context & context)1150 Move<vk::VkCommandPool> createCommandPool (Context& context)
1151 {
1152 const deUint32 queueFamilyIndex = context.getUniversalQueueFamilyIndex();
1153
1154 return vk::createCommandPool(context.getDeviceInterface(), context.getDevice(), (vk::VkCommandPoolCreateFlags)0u, queueFamilyIndex);
1155 }
1156
createDescriptorPool(Context & context)1157 Move<vk::VkDescriptorPool> createDescriptorPool (Context& context)
1158 {
1159 return vk::DescriptorPoolBuilder()
1160 .addType(vk::VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER, 2u)
1161 .build(context.getDeviceInterface(), context.getDevice(), vk::VK_DESCRIPTOR_POOL_CREATE_FREE_DESCRIPTOR_SET_BIT, 1u);
1162 }
1163
allocateDescriptorSet(Context & context,vk::VkDescriptorPool descriptorPool,vk::VkDescriptorSetLayout setLayout)1164 Move<vk::VkDescriptorSet> allocateDescriptorSet (Context& context, vk::VkDescriptorPool descriptorPool, vk::VkDescriptorSetLayout setLayout)
1165 {
1166 const vk::VkDescriptorSetAllocateInfo params =
1167 {
1168 vk::VK_STRUCTURE_TYPE_DESCRIPTOR_SET_ALLOCATE_INFO,
1169 DE_NULL,
1170 descriptorPool,
1171 1u,
1172 &setLayout
1173 };
1174
1175 return vk::allocateDescriptorSet(context.getDeviceInterface(), context.getDevice(), ¶ms);
1176 }
1177
allocateCommandBuffer(Context & context,vk::VkCommandPool cmdPool)1178 Move<vk::VkCommandBuffer> allocateCommandBuffer (Context& context, vk::VkCommandPool cmdPool)
1179 {
1180 return vk::allocateCommandBuffer(context.getDeviceInterface(), context.getDevice(), cmdPool, vk::VK_COMMAND_BUFFER_LEVEL_PRIMARY);
1181 }
1182
allocateAndBindMemory(Context & context,vk::VkBuffer buffer,vk::MemoryRequirement memReqs)1183 MovePtr<vk::Allocation> allocateAndBindMemory (Context& context, vk::VkBuffer buffer, vk::MemoryRequirement memReqs)
1184 {
1185 const vk::DeviceInterface& vkd = context.getDeviceInterface();
1186 const vk::VkMemoryRequirements bufReqs = vk::getBufferMemoryRequirements(vkd, context.getDevice(), buffer);
1187 MovePtr<vk::Allocation> memory = context.getDefaultAllocator().allocate(bufReqs, memReqs);
1188
1189 vkd.bindBufferMemory(context.getDevice(), buffer, memory->getMemory(), memory->getOffset());
1190
1191 return memory;
1192 }
1193
getRenderTargetFormat(DataType dataType)1194 vk::VkFormat getRenderTargetFormat (DataType dataType)
1195 {
1196 switch (dataType)
1197 {
1198 case glu::TYPE_FLOAT_VEC2:
1199 return vk::VK_FORMAT_R8G8_UNORM;
1200 case glu::TYPE_FLOAT_VEC3:
1201 return vk::VK_FORMAT_R5G6B5_UNORM_PACK16;
1202 case glu::TYPE_FLOAT_VEC4:
1203 return vk::VK_FORMAT_R8G8B8A8_UNORM;
1204 case glu::TYPE_INT_VEC2:
1205 return vk::VK_FORMAT_R8G8_SINT;
1206 case glu::TYPE_INT_VEC4:
1207 return vk::VK_FORMAT_R8G8B8A8_SINT;
1208 default:
1209 return vk::VK_FORMAT_R8G8B8A8_UNORM;
1210 }
1211 }
1212
allocateAndBindMemory(Context & context,vk::VkImage image,vk::MemoryRequirement memReqs)1213 MovePtr<vk::Allocation> allocateAndBindMemory (Context& context, vk::VkImage image, vk::MemoryRequirement memReqs)
1214 {
1215 const vk::DeviceInterface& vkd = context.getDeviceInterface();
1216 const vk::VkMemoryRequirements imgReqs = vk::getImageMemoryRequirements(vkd, context.getDevice(), image);
1217 MovePtr<vk::Allocation> memory = context.getDefaultAllocator().allocate(imgReqs, memReqs);
1218
1219 vkd.bindImageMemory(context.getDevice(), image, memory->getMemory(), memory->getOffset());
1220
1221 return memory;
1222 }
1223
writeValuesToMem(Context & context,const vk::Allocation & dst,const ValueBufferLayout & layout,const vector<Value> & values,int arrayNdx)1224 void writeValuesToMem (Context& context, const vk::Allocation& dst, const ValueBufferLayout& layout, const vector<Value>& values, int arrayNdx)
1225 {
1226 copyToLayout(dst.getHostPtr(), layout, values, arrayNdx);
1227
1228 // \note Buffers are not allocated with coherency / uncached requirement so we need to manually flush CPU write caches
1229 flushAlloc(context.getDeviceInterface(), context.getDevice(), dst);
1230 }
1231
1232 class ShaderCaseInstance : public TestInstance
1233 {
1234 public:
1235 ShaderCaseInstance (Context& context, const ShaderCaseSpecification& spec);
1236 ~ShaderCaseInstance (void);
1237
1238 TestStatus iterate (void);
1239
1240 private:
1241 enum
1242 {
1243 RENDER_WIDTH = 64,
1244 RENDER_HEIGHT = 64,
1245
1246 POSITIONS_OFFSET = 0,
1247 POSITIONS_SIZE = (int)sizeof(Vec2)*4,
1248
1249 INDICES_OFFSET = POSITIONS_SIZE,
1250 INDICES_SIZE = (int)sizeof(deUint16)*6,
1251
1252 TOTAL_POS_NDX_SIZE = POSITIONS_SIZE+INDICES_SIZE
1253 };
1254
1255 const ShaderCaseSpecification& m_spec;
1256
1257 const Unique<vk::VkBuffer> m_posNdxBuffer;
1258 const UniquePtr<vk::Allocation> m_posNdxMem;
1259
1260 const ValueBufferLayout m_inputLayout;
1261 const Unique<vk::VkBuffer> m_inputBuffer; // Input values (attributes). Can be NULL if no inputs present
1262 const UniquePtr<vk::Allocation> m_inputMem; // Input memory, can be NULL if no input buffer exists
1263
1264 const ValueBufferLayout m_referenceLayout;
1265 const Unique<vk::VkBuffer> m_referenceBuffer; // Output (reference) values. Can be NULL if no outputs present
1266 const UniquePtr<vk::Allocation> m_referenceMem; // Output (reference) memory, can be NULL if no reference buffer exists
1267
1268 const ValueBufferLayout m_uniformLayout;
1269 const Unique<vk::VkBuffer> m_uniformBuffer; // Uniform values. Can be NULL if no uniforms present
1270 const UniquePtr<vk::Allocation> m_uniformMem; // Uniform memory, can be NULL if no uniform buffer exists
1271
1272 const vk::VkFormat m_rtFormat;
1273 deUint32 m_outputCount;
1274 Move<vk::VkImage> m_rtImage [4];
1275 MovePtr<vk::Allocation> m_rtMem[4];
1276 Move<vk::VkImageView> m_rtView[4];
1277
1278 Move<vk::VkBuffer> m_readImageBuffer[4];
1279 MovePtr<vk::Allocation> m_readImageMem[4];
1280
1281 const Unique<vk::VkRenderPass> m_renderPass;
1282 Move<vk::VkFramebuffer> m_framebuffer;
1283 const PipelineProgram m_program;
1284 const Unique<vk::VkDescriptorSetLayout> m_descriptorSetLayout;
1285 const Unique<vk::VkPipelineLayout> m_pipelineLayout;
1286 const Unique<vk::VkPipeline> m_pipeline;
1287
1288 const Unique<vk::VkDescriptorPool> m_descriptorPool;
1289 const Unique<vk::VkDescriptorSet> m_descriptorSet;
1290
1291 const Unique<vk::VkCommandPool> m_cmdPool;
1292 const Unique<vk::VkCommandBuffer> m_cmdBuffer;
1293
1294 int m_subCaseNdx;
1295 };
1296
ShaderCaseInstance(Context & context,const ShaderCaseSpecification & spec)1297 ShaderCaseInstance::ShaderCaseInstance (Context& context, const ShaderCaseSpecification& spec)
1298 : TestInstance (context)
1299 , m_spec (spec)
1300
1301 , m_posNdxBuffer (createBuffer(context, (vk::VkDeviceSize)TOTAL_POS_NDX_SIZE, vk::VK_BUFFER_USAGE_INDEX_BUFFER_BIT|vk::VK_BUFFER_USAGE_VERTEX_BUFFER_BIT))
1302 , m_posNdxMem (allocateAndBindMemory(context, *m_posNdxBuffer, vk::MemoryRequirement::HostVisible))
1303
1304 , m_inputLayout (computeStd430Layout(spec.values.inputs))
1305 , m_inputBuffer (m_inputLayout.size > 0 ? createBuffer(context, (vk::VkDeviceSize)m_inputLayout.size, vk::VK_BUFFER_USAGE_VERTEX_BUFFER_BIT) : Move<vk::VkBuffer>())
1306 , m_inputMem (m_inputLayout.size > 0 ? allocateAndBindMemory(context, *m_inputBuffer, vk::MemoryRequirement::HostVisible) : MovePtr<vk::Allocation>())
1307
1308 , m_referenceLayout (computeStd140Layout(spec.values.outputs))
1309 , m_referenceBuffer (m_referenceLayout.size > 0 ? createBuffer(context, (vk::VkDeviceSize)m_referenceLayout.size, vk::VK_BUFFER_USAGE_UNIFORM_BUFFER_BIT) : Move<vk::VkBuffer>())
1310 , m_referenceMem (m_referenceLayout.size > 0 ? allocateAndBindMemory(context, *m_referenceBuffer, vk::MemoryRequirement::HostVisible) : MovePtr<vk::Allocation>())
1311
1312 , m_uniformLayout (computeStd140Layout(spec.values.uniforms))
1313 , m_uniformBuffer (m_uniformLayout.size > 0 ? createBuffer(context, (vk::VkDeviceSize)m_uniformLayout.size, vk::VK_BUFFER_USAGE_UNIFORM_BUFFER_BIT) : Move<vk::VkBuffer>())
1314 , m_uniformMem (m_uniformLayout.size > 0 ? allocateAndBindMemory(context, *m_uniformBuffer, vk::MemoryRequirement::HostVisible) : MovePtr<vk::Allocation>())
1315
1316 , m_rtFormat (getRenderTargetFormat(spec.outputFormat))
1317 , m_outputCount (((deUint32)m_spec.values.outputs.size() == 0 || m_spec.outputType == glu::sl::OUTPUT_RESULT) ? 1 : (deUint32)m_spec.values.outputs.size())
1318 , m_rtImage ()
1319 , m_rtMem ()
1320 , m_rtView ()
1321
1322 , m_readImageBuffer ()
1323 , m_readImageMem ()
1324
1325 , m_renderPass (createRenderPass(context, m_rtFormat, m_outputCount))
1326 , m_framebuffer ()
1327 , m_program (context, spec)
1328 , m_descriptorSetLayout (createDescriptorSetLayout(context, m_program.getStages()))
1329 , m_pipelineLayout (createPipelineLayout(context, *m_descriptorSetLayout))
1330 , m_pipeline (createPipeline(context, spec.values.inputs, m_inputLayout, m_program, *m_renderPass, *m_pipelineLayout, tcu::UVec2(RENDER_WIDTH, RENDER_HEIGHT), m_outputCount))
1331
1332 , m_descriptorPool (createDescriptorPool(context))
1333 , m_descriptorSet (allocateDescriptorSet(context, *m_descriptorPool, *m_descriptorSetLayout))
1334
1335 , m_cmdPool (createCommandPool(context))
1336 , m_cmdBuffer (allocateCommandBuffer(context, *m_cmdPool))
1337
1338 , m_subCaseNdx (0)
1339 {
1340 {
1341 // Initialize the resources for each color attachment needed by the shader
1342 for (deUint32 outNdx = 0; outNdx < m_outputCount; outNdx++)
1343 {
1344 m_rtImage[outNdx] = createImage2D(context, RENDER_WIDTH, RENDER_HEIGHT, m_rtFormat, vk::VK_IMAGE_TILING_OPTIMAL, vk::VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT| vk::VK_IMAGE_USAGE_TRANSFER_SRC_BIT);
1345 m_rtMem[outNdx] = allocateAndBindMemory(context, *m_rtImage[outNdx], vk::MemoryRequirement::Any);
1346 m_rtView[outNdx] = createAttachmentView(context, *m_rtImage[outNdx], m_rtFormat);
1347
1348 m_readImageBuffer[outNdx] = createBuffer(context, (vk::VkDeviceSize)(RENDER_WIDTH * RENDER_HEIGHT * tcu::getPixelSize(vk::mapVkFormat(m_rtFormat))), vk::VK_BUFFER_USAGE_TRANSFER_DST_BIT);
1349 m_readImageMem[outNdx] = allocateAndBindMemory(context, *m_readImageBuffer[outNdx], vk::MemoryRequirement::HostVisible);
1350 }
1351 m_framebuffer = createFramebuffer(context, *m_renderPass, m_rtView, m_outputCount, RENDER_WIDTH, RENDER_HEIGHT);
1352 }
1353
1354 const vk::DeviceInterface& vkd = context.getDeviceInterface();
1355 const deUint32 queueFamilyIndex = context.getUniversalQueueFamilyIndex();
1356
1357 {
1358 const Vec2 s_positions[] =
1359 {
1360 Vec2(-1.0f, -1.0f),
1361 Vec2(-1.0f, +1.0f),
1362 Vec2(+1.0f, -1.0f),
1363 Vec2(+1.0f, +1.0f)
1364 };
1365 const deUint16 s_indices[] =
1366 {
1367 0, 1, 2,
1368 1, 3, 2
1369 };
1370
1371 DE_STATIC_ASSERT(sizeof(s_positions) == POSITIONS_SIZE);
1372 DE_STATIC_ASSERT(sizeof(s_indices) == INDICES_SIZE);
1373
1374 deMemcpy((deUint8*)m_posNdxMem->getHostPtr() + POSITIONS_OFFSET, &s_positions[0], sizeof(s_positions));
1375 deMemcpy((deUint8*)m_posNdxMem->getHostPtr() + INDICES_OFFSET, &s_indices[0], sizeof(s_indices));
1376
1377 flushAlloc(m_context.getDeviceInterface(), context.getDevice(), *m_posNdxMem);
1378 }
1379
1380 if (!m_spec.values.uniforms.empty())
1381 {
1382 const vk::VkDescriptorBufferInfo bufInfo =
1383 {
1384 *m_uniformBuffer,
1385 (vk::VkDeviceSize)0, // offset
1386 (vk::VkDeviceSize)m_uniformLayout.size
1387 };
1388
1389 vk::DescriptorSetUpdateBuilder()
1390 .writeSingle(*m_descriptorSet, vk::DescriptorSetUpdateBuilder::Location::binding(USER_UNIFORM_BINDING),
1391 vk::VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER, &bufInfo)
1392 .update(vkd, m_context.getDevice());
1393 }
1394
1395 if (!m_spec.values.outputs.empty())
1396 {
1397 const vk::VkDescriptorBufferInfo bufInfo =
1398 {
1399 *m_referenceBuffer,
1400 (vk::VkDeviceSize)0, // offset
1401 (vk::VkDeviceSize)m_referenceLayout.size
1402 };
1403
1404 vk::DescriptorSetUpdateBuilder()
1405 .writeSingle(*m_descriptorSet, vk::DescriptorSetUpdateBuilder::Location::binding(REFERENCE_UNIFORM_BINDING),
1406 vk::VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER, &bufInfo)
1407 .update(vkd, m_context.getDevice());
1408 }
1409
1410 // Record command buffer
1411
1412 beginCommandBuffer(vkd, *m_cmdBuffer, 0u);
1413
1414 {
1415 const vk::VkMemoryBarrier vertFlushBarrier =
1416 {
1417 vk::VK_STRUCTURE_TYPE_MEMORY_BARRIER, // sType
1418 DE_NULL, // pNext
1419 vk::VK_ACCESS_HOST_WRITE_BIT, // srcAccessMask
1420 vk::VK_ACCESS_VERTEX_ATTRIBUTE_READ_BIT|vk::VK_ACCESS_UNIFORM_READ_BIT, // dstAccessMask
1421 };
1422 vk::VkImageMemoryBarrier colorAttBarrier [4];
1423 for (deUint32 outNdx = 0; outNdx < m_outputCount; outNdx++)
1424 {
1425 vk::VkImageMemoryBarrier barrier =
1426 {
1427 vk::VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER, // sType
1428 DE_NULL, // pNext
1429 0u, // srcAccessMask
1430 vk::VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT, // dstAccessMask
1431 vk::VK_IMAGE_LAYOUT_UNDEFINED, // oldLayout
1432 vk::VK_IMAGE_LAYOUT_COLOR_ATTACHMENT_OPTIMAL, // newLayout
1433 queueFamilyIndex, // srcQueueFamilyIndex
1434 queueFamilyIndex, // destQueueFamilyIndex
1435 *m_rtImage[outNdx], // image
1436 {
1437 vk::VK_IMAGE_ASPECT_COLOR_BIT, // aspectMask
1438 0u, // baseMipLevel
1439 1u, // mipLevels
1440 0u, // baseArraySlice
1441 1u, // arraySize
1442 } // subresourceRange
1443 };
1444 colorAttBarrier[outNdx] = barrier;
1445 }
1446 vkd.cmdPipelineBarrier(*m_cmdBuffer, vk::VK_PIPELINE_STAGE_HOST_BIT, vk::VK_PIPELINE_STAGE_ALL_GRAPHICS_BIT, (vk::VkDependencyFlags)0,
1447 1, &vertFlushBarrier,
1448 0, (const vk::VkBufferMemoryBarrier*)DE_NULL,
1449 m_outputCount, &colorAttBarrier[0]);
1450 }
1451
1452 {
1453 vk::VkClearValue clearValue[4];
1454 for (deUint32 outNdx = 0; outNdx < m_outputCount; outNdx++)
1455 {
1456 vk::VkClearValue value = vk::makeClearValueColorF32(0.125f, 0.25f, 0.75f, 1.0f);
1457 clearValue[outNdx] = value;
1458 }
1459 beginRenderPass(vkd, *m_cmdBuffer, *m_renderPass, *m_framebuffer, vk::makeRect2D(0, 0, RENDER_WIDTH, RENDER_HEIGHT), m_outputCount, clearValue);
1460 }
1461
1462 vkd.cmdBindPipeline(*m_cmdBuffer, vk::VK_PIPELINE_BIND_POINT_GRAPHICS, *m_pipeline);
1463
1464 if (!m_spec.values.uniforms.empty() || !m_spec.values.outputs.empty())
1465 vkd.cmdBindDescriptorSets(*m_cmdBuffer, vk::VK_PIPELINE_BIND_POINT_GRAPHICS, *m_pipelineLayout, 0u, 1u, &*m_descriptorSet, 0u, DE_NULL);
1466
1467 {
1468 const vk::VkBuffer buffers[] = { *m_posNdxBuffer, *m_inputBuffer };
1469 const vk::VkDeviceSize offsets[] = { POSITIONS_OFFSET, 0u };
1470 const deUint32 numBuffers = buffers[1] != 0 ? 2u : 1u;
1471 vkd.cmdBindVertexBuffers(*m_cmdBuffer, 0u, numBuffers, buffers, offsets);
1472 }
1473
1474 vkd.cmdBindIndexBuffer (*m_cmdBuffer, *m_posNdxBuffer, (vk::VkDeviceSize)INDICES_OFFSET, vk::VK_INDEX_TYPE_UINT16);
1475 vkd.cmdDrawIndexed (*m_cmdBuffer, 6u, 1u, 0u, 0u, 0u);
1476 endRenderPass (vkd, *m_cmdBuffer);
1477
1478 {
1479 vk::VkImageMemoryBarrier renderFinishBarrier[4];
1480 for (deUint32 outNdx = 0; outNdx < m_outputCount; outNdx++)
1481 {
1482 vk::VkImageMemoryBarrier barrier =
1483 {
1484 vk::VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER, // sType
1485 DE_NULL, // pNext
1486 vk::VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT, // srcAccessMask
1487 vk::VK_ACCESS_TRANSFER_READ_BIT, // dstAccessMask
1488 vk::VK_IMAGE_LAYOUT_COLOR_ATTACHMENT_OPTIMAL, // oldLayout
1489 vk::VK_IMAGE_LAYOUT_TRANSFER_SRC_OPTIMAL, // newLayout
1490 queueFamilyIndex, // srcQueueFamilyIndex
1491 queueFamilyIndex, // destQueueFamilyIndex
1492 *m_rtImage[outNdx], // image
1493 {
1494 vk::VK_IMAGE_ASPECT_COLOR_BIT, // aspectMask
1495 0u, // baseMipLevel
1496 1u, // mipLevels
1497 0u, // baseArraySlice
1498 1u, // arraySize
1499 } // subresourceRange
1500 };
1501 renderFinishBarrier[outNdx] = barrier;
1502 }
1503
1504 vkd.cmdPipelineBarrier(*m_cmdBuffer, vk::VK_PIPELINE_STAGE_ALL_GRAPHICS_BIT, vk::VK_PIPELINE_STAGE_TRANSFER_BIT, (vk::VkDependencyFlags)0,
1505 0, (const vk::VkMemoryBarrier*)DE_NULL,
1506 0, (const vk::VkBufferMemoryBarrier*)DE_NULL,
1507 m_outputCount, &renderFinishBarrier[0]);
1508 }
1509
1510 {
1511 for (deUint32 outNdx = 0; outNdx < m_outputCount; outNdx++)
1512 {
1513 const vk::VkBufferImageCopy copyParams =
1514 {
1515 (vk::VkDeviceSize)0u, // bufferOffset
1516 (deUint32)RENDER_WIDTH, // bufferRowLength
1517 (deUint32)RENDER_HEIGHT, // bufferImageHeight
1518 {
1519 vk::VK_IMAGE_ASPECT_COLOR_BIT, // aspect
1520 0u, // mipLevel
1521 0u, // arrayLayer
1522 1u, // arraySize
1523 }, // imageSubresource
1524 { 0u, 0u, 0u }, // imageOffset
1525 { RENDER_WIDTH, RENDER_HEIGHT, 1u } // imageExtent
1526 };
1527
1528 vkd.cmdCopyImageToBuffer(*m_cmdBuffer, *m_rtImage[outNdx], vk::VK_IMAGE_LAYOUT_TRANSFER_SRC_OPTIMAL, *m_readImageBuffer[outNdx], 1u, ©Params);
1529 }
1530 }
1531
1532 {
1533 const vk::VkDeviceSize size = (vk::VkDeviceSize)(RENDER_WIDTH * RENDER_HEIGHT * tcu::getPixelSize(vk::mapVkFormat(m_rtFormat)));
1534 vk::VkBufferMemoryBarrier copyFinishBarrier[4];
1535 for (deUint32 outNdx = 0; outNdx < m_outputCount; outNdx++)
1536 {
1537 vk::VkBufferMemoryBarrier barrier =
1538 {
1539 vk::VK_STRUCTURE_TYPE_BUFFER_MEMORY_BARRIER, // sType
1540 DE_NULL, // pNext
1541 vk::VK_ACCESS_TRANSFER_WRITE_BIT, // srcAccessMask
1542 vk::VK_ACCESS_HOST_READ_BIT, // dstAccessMask
1543 queueFamilyIndex, // srcQueueFamilyIndex
1544 queueFamilyIndex, // destQueueFamilyIndex
1545 *m_readImageBuffer[outNdx], // buffer
1546 0u, // offset
1547 size // size
1548 };
1549 copyFinishBarrier[outNdx] = barrier;
1550 }
1551 vkd.cmdPipelineBarrier(*m_cmdBuffer, vk::VK_PIPELINE_STAGE_TRANSFER_BIT, vk::VK_PIPELINE_STAGE_HOST_BIT, (vk::VkDependencyFlags)0,
1552 0, (const vk::VkMemoryBarrier*)DE_NULL,
1553 m_outputCount, ©FinishBarrier[0],
1554 0, (const vk::VkImageMemoryBarrier*)DE_NULL);
1555 }
1556
1557 endCommandBuffer(vkd, *m_cmdBuffer);
1558 }
1559
~ShaderCaseInstance(void)1560 ShaderCaseInstance::~ShaderCaseInstance (void)
1561 {
1562 }
1563
getNumSubCases(const ValueBlock & values)1564 int getNumSubCases (const ValueBlock& values)
1565 {
1566 if (!values.outputs.empty())
1567 return int(values.outputs[0].elements.size() / values.outputs[0].type.getScalarSize());
1568 else
1569 return 1; // Always run at least one iteration even if no output values are specified
1570 }
1571
checkResultImage(const ConstPixelBufferAccess & result)1572 bool checkResultImage (const ConstPixelBufferAccess& result)
1573 {
1574 const tcu::IVec4 refPix (255, 255, 255, 255);
1575
1576 for (int y = 0; y < result.getHeight(); y++)
1577 {
1578 for (int x = 0; x < result.getWidth(); x++)
1579 {
1580 const tcu::IVec4 resPix = result.getPixelInt(x, y);
1581
1582 if (boolAny(notEqual(resPix, refPix)))
1583 return false;
1584 }
1585 }
1586
1587 return true;
1588 }
1589
checkResultImageWithReference(const ConstPixelBufferAccess & result,tcu::IVec4 refPix)1590 bool checkResultImageWithReference (const ConstPixelBufferAccess& result, tcu::IVec4 refPix)
1591 {
1592 for (int y = 0; y < result.getHeight(); y++)
1593 {
1594 for (int x = 0; x < result.getWidth(); x++)
1595 {
1596 const tcu::IVec4 resPix = result.getPixelInt(x, y);
1597
1598 if (boolAny(notEqual(resPix, refPix)))
1599 return false;
1600 }
1601 }
1602
1603 return true;
1604 }
iterate(void)1605 TestStatus ShaderCaseInstance::iterate (void)
1606 {
1607 const vk::DeviceInterface& vkd = m_context.getDeviceInterface();
1608 const vk::VkDevice device = m_context.getDevice();
1609 const vk::VkQueue queue = m_context.getUniversalQueue();
1610
1611 if (!m_spec.values.inputs.empty())
1612 writeValuesToMem(m_context, *m_inputMem, m_inputLayout, m_spec.values.inputs, m_subCaseNdx);
1613
1614 if (!m_spec.values.outputs.empty())
1615 writeValuesToMem(m_context, *m_referenceMem, m_referenceLayout, m_spec.values.outputs, m_subCaseNdx);
1616
1617 if (!m_spec.values.uniforms.empty())
1618 writeValuesToMem(m_context, *m_uniformMem, m_uniformLayout, m_spec.values.uniforms, m_subCaseNdx);
1619
1620 submitCommandsAndWait(vkd, device, queue, m_cmdBuffer.get());
1621
1622 // Result was checked in fragment shader
1623 if (m_spec.outputType == glu::sl::OUTPUT_RESULT)
1624 {
1625 const ConstPixelBufferAccess imgAccess (TextureFormat(TextureFormat::RGBA, TextureFormat::UNORM_INT8), RENDER_WIDTH, RENDER_HEIGHT, 1, m_readImageMem[0]->getHostPtr());
1626
1627 invalidateMappedMemoryRange(vkd, device, m_readImageMem[0]->getMemory(), m_readImageMem[0]->getOffset(), (vk::VkDeviceSize)(RENDER_WIDTH*RENDER_HEIGHT*4));
1628
1629 if (!checkResultImage(imgAccess))
1630 {
1631 TestLog& log = m_context.getTestContext().getLog();
1632
1633 log << TestLog::Message << "ERROR: Got non-white pixels on sub-case " << m_subCaseNdx << TestLog::EndMessage
1634 << TestLog::Image("Result", "Result", imgAccess);
1635
1636 dumpValues(log, m_spec.values, m_subCaseNdx);
1637
1638 return TestStatus::fail(string("Got invalid pixels at sub-case ") + de::toString(m_subCaseNdx));
1639 }
1640 }
1641 // Result was written to color buffer
1642 else
1643 {
1644 for (deUint32 outNdx = 0; outNdx < m_outputCount; outNdx++)
1645 {
1646 const ConstPixelBufferAccess imgAccess (vk::mapVkFormat(m_rtFormat), RENDER_WIDTH, RENDER_HEIGHT, 1, m_readImageMem[outNdx]->getHostPtr());
1647 const DataType dataType = m_spec.values.outputs[outNdx].type.getBasicType();
1648 const int numComponents = getDataTypeScalarSize(dataType);
1649 tcu::IVec4 reference (0, 0, 0, 1);
1650
1651 for (int refNdx = 0; refNdx < numComponents; refNdx++)
1652 {
1653 if (isDataTypeFloatOrVec(dataType))
1654 reference[refNdx] = (int)m_spec.values.outputs[outNdx].elements[m_subCaseNdx * numComponents + refNdx].float32;
1655 else if (isDataTypeIntOrIVec(dataType))
1656 reference[refNdx] = m_spec.values.outputs[outNdx].elements[m_subCaseNdx * numComponents + refNdx].int32;
1657 else
1658 DE_FATAL("Unknown data type");
1659 }
1660
1661 invalidateMappedMemoryRange(vkd, device, m_readImageMem[outNdx]->getMemory(), m_readImageMem[outNdx]->getOffset(), (vk::VkDeviceSize)(RENDER_WIDTH * RENDER_HEIGHT * tcu::getPixelSize(vk::mapVkFormat(m_rtFormat))));
1662
1663 if (!checkResultImageWithReference(imgAccess, reference))
1664 {
1665 TestLog& log = m_context.getTestContext().getLog();
1666
1667 log << TestLog::Message << "ERROR: Got nonmatching pixels on sub-case " << m_subCaseNdx << " output " << outNdx << TestLog::EndMessage
1668 << TestLog::Image("Result", "Result", imgAccess);
1669
1670 dumpValues(log, m_spec.values, m_subCaseNdx);
1671
1672 return TestStatus::fail(string("Got invalid pixels at sub-case ") + de::toString(m_subCaseNdx));
1673 }
1674 }
1675 }
1676
1677 if (++m_subCaseNdx < getNumSubCases(m_spec.values))
1678 return TestStatus::incomplete();
1679 else
1680 return TestStatus::pass("All sub-cases passed");
1681 }
1682
1683 class ShaderCase : public TestCase
1684 {
1685 public:
1686 ShaderCase (tcu::TestContext& testCtx, const string& name, const string& description, const ShaderCaseSpecification& spec);
1687
1688
1689 void initPrograms (SourceCollections& programCollection) const;
1690 TestInstance* createInstance (Context& context) const;
1691
1692 private:
1693 const ShaderCaseSpecification m_spec;
1694 };
1695
ShaderCase(tcu::TestContext & testCtx,const string & name,const string & description,const ShaderCaseSpecification & spec)1696 ShaderCase::ShaderCase (tcu::TestContext& testCtx, const string& name, const string& description, const ShaderCaseSpecification& spec)
1697 : TestCase (testCtx, name, description)
1698 , m_spec (spec)
1699 {
1700 }
1701
initPrograms(SourceCollections & sourceCollection) const1702 void ShaderCase::initPrograms (SourceCollections& sourceCollection) const
1703 {
1704 vector<ProgramSources> specializedSources (m_spec.programs.size());
1705
1706 DE_ASSERT(isValid(m_spec));
1707
1708 if (m_spec.expectResult != glu::sl::EXPECT_PASS)
1709 TCU_THROW(InternalError, "Only EXPECT_PASS is supported");
1710
1711 if (m_spec.caseType == glu::sl::CASETYPE_VERTEX_ONLY)
1712 {
1713 DE_ASSERT(m_spec.programs.size() == 1 && m_spec.programs[0].sources.sources[glu::SHADERTYPE_VERTEX].size() == 1);
1714 specializedSources[0] << glu::VertexSource(specializeVertexShader(m_spec, m_spec.programs[0].sources.sources[glu::SHADERTYPE_VERTEX][0]))
1715 << glu::FragmentSource(genFragmentShader(m_spec));
1716 }
1717 else if (m_spec.caseType == glu::sl::CASETYPE_FRAGMENT_ONLY)
1718 {
1719 DE_ASSERT(m_spec.programs.size() == 1 && m_spec.programs[0].sources.sources[glu::SHADERTYPE_FRAGMENT].size() == 1);
1720 specializedSources[0] << glu::VertexSource(genVertexShader(m_spec))
1721 << glu::FragmentSource(specializeFragmentShader(m_spec, m_spec.programs[0].sources.sources[glu::SHADERTYPE_FRAGMENT][0]));
1722 }
1723 else
1724 {
1725 DE_ASSERT(m_spec.caseType == glu::sl::CASETYPE_COMPLETE);
1726
1727 const int maxPatchVertices = 4; // \todo [2015-08-05 pyry] Query
1728
1729 for (size_t progNdx = 0; progNdx < m_spec.programs.size(); progNdx++)
1730 {
1731 const ProgramSpecializationParams progSpecParams (m_spec, m_spec.programs[progNdx].requiredExtensions, maxPatchVertices);
1732
1733 specializeProgramSources(specializedSources[progNdx], m_spec.programs[progNdx].sources, progSpecParams);
1734 }
1735 }
1736
1737 for (size_t progNdx = 0; progNdx < specializedSources.size(); progNdx++)
1738 {
1739 for (int shaderType = 0; shaderType < glu::SHADERTYPE_LAST; shaderType++)
1740 {
1741 if (!specializedSources[progNdx].sources[shaderType].empty())
1742 {
1743 vk::GlslSource& curSrc = sourceCollection.glslSources.add(getShaderName((glu::ShaderType)shaderType, progNdx));
1744 curSrc.sources[shaderType] = specializedSources[progNdx].sources[shaderType];
1745 }
1746 }
1747 }
1748 }
1749
createInstance(Context & context) const1750 TestInstance* ShaderCase::createInstance (Context& context) const
1751 {
1752 return new ShaderCaseInstance(context, m_spec);
1753 }
1754
1755 class ShaderCaseFactory : public glu::sl::ShaderCaseFactory
1756 {
1757 public:
ShaderCaseFactory(tcu::TestContext & testCtx)1758 ShaderCaseFactory (tcu::TestContext& testCtx)
1759 : m_testCtx(testCtx)
1760 {
1761 }
1762
createGroup(const string & name,const string & description,const vector<tcu::TestNode * > & children)1763 tcu::TestCaseGroup* createGroup (const string& name, const string& description, const vector<tcu::TestNode*>& children)
1764 {
1765 return new tcu::TestCaseGroup(m_testCtx, name.c_str(), description.c_str(), children);
1766 }
1767
createCase(const string & name,const string & description,const ShaderCaseSpecification & spec)1768 tcu::TestCase* createCase (const string& name, const string& description, const ShaderCaseSpecification& spec)
1769 {
1770 return new ShaderCase(m_testCtx, name, description, spec);
1771 }
1772
1773 private:
1774 tcu::TestContext& m_testCtx;
1775 };
1776
1777 class ShaderLibraryGroup : public tcu::TestCaseGroup
1778 {
1779 public:
ShaderLibraryGroup(tcu::TestContext & testCtx,const string & name,const string & description,const string & filename)1780 ShaderLibraryGroup (tcu::TestContext& testCtx, const string& name, const string& description, const string& filename)
1781 : tcu::TestCaseGroup (testCtx, name.c_str(), description.c_str())
1782 , m_filename (filename)
1783 {
1784 }
1785
init(void)1786 void init (void)
1787 {
1788 ShaderCaseFactory caseFactory (m_testCtx);
1789 const vector<tcu::TestNode*> children = glu::sl::parseFile(m_testCtx.getArchive(), m_filename, &caseFactory);
1790
1791 for (size_t ndx = 0; ndx < children.size(); ndx++)
1792 {
1793 try
1794 {
1795 addChild(children[ndx]);
1796 }
1797 catch (...)
1798 {
1799 for (; ndx < children.size(); ndx++)
1800 delete children[ndx];
1801 throw;
1802 }
1803 }
1804 }
1805
1806 private:
1807 const string m_filename;
1808 };
1809
1810 } // anonymous
1811
createShaderLibraryGroup(tcu::TestContext & testCtx,const string & name,const string & description,const string & filename)1812 MovePtr<tcu::TestCaseGroup> createShaderLibraryGroup (tcu::TestContext& testCtx, const string& name, const string& description, const string& filename)
1813 {
1814 return MovePtr<tcu::TestCaseGroup>(new ShaderLibraryGroup(testCtx, name, description, filename));
1815 }
1816
1817 } // vkt
1818