1 /*-------------------------------------------------------------------------
2  * Vulkan Conformance Tests
3  * ------------------------
4  *
5  * Copyright (c) 2017 The Khronos Group Inc.
6  *
7  * Licensed under the Apache License, Version 2.0 (the "License");
8  * you may not use this file except in compliance with the License.
9  * You may obtain a copy of the License at
10  *
11  *      http://www.apache.org/licenses/LICENSE-2.0
12  *
13  * Unless required by applicable law or agreed to in writing, software
14  * distributed under the License is distributed on an "AS IS" BASIS,
15  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
16  * See the License for the specific language governing permissions and
17  * limitations under the License.
18  *
19  *//*!
20  * \file
21  * \brief SPIR-V Loop Control for DependencyInfinite qualifier tests
22  *//*--------------------------------------------------------------------*/
23 
24 #include "vkApiVersion.hpp"
25 
26 #include "vktSpvAsmLoopDepInfTests.hpp"
27 #include "vktTestCase.hpp"
28 #include "vktSpvAsmComputeShaderCase.hpp"
29 
30 #include "deRandom.hpp"
31 
32 namespace vkt
33 {
34 namespace SpirVAssembly
35 {
36 
37 using namespace vk;
38 using std::map;
39 using std::string;
40 using std::vector;
41 
42 // Assembly code used for testing loop control with dependencies is based on GLSL source code:
43 // #version 430
44 //
45 // layout(std140, set = 0, binding = 0) readonly buffer Input {
46 //   float elements[];
47 // } input_data;
48 // layout(std140, set = 0, binding = 1) writeonly buffer Output {
49 //   float elements[];
50 // } output_data;
51 //
52 // void main() {
53 //   const uint n = 12;
54 //   float c[n];
55 //   uint x = gl_GlobalInvocationID.x;
56 //
57 //   for (uint i = 0; i < n; ++i)
58 //     c[i] = float(i) * input_data.elements[x];
59 //
60 //   output_data.elements[x] = 0.0f;
61 //   for (uint i = 0; i < n; ++i)
62 //     output_data.elements[x] += c[i];
63 // }
getComputeSourceCode(std::string & computeSourceCode)64 static void getComputeSourceCode (std::string& computeSourceCode)
65 {
66 	computeSourceCode =
67 		string(getComputeAsmShaderPreamble()) +
68 
69 		"OpSource GLSL 430\n"
70 		"OpName %main \"main\"\n"
71 		"OpName %id \"gl_GlobalInvocationID\"\n"
72 
73 		"OpDecorate %id BuiltIn GlobalInvocationId\n"
74 
75 		+ string(getComputeAsmInputOutputBufferTraits()) + string(getComputeAsmCommonTypes()) + string(getComputeAsmInputOutputBuffer()) +
76 
77 		"%u32ptr        = OpTypePointer Function %u32\n"
78 
79 		"%id            = OpVariable %uvec3ptr Input\n"
80 		"%zero          = OpConstant %i32 0\n"
81 		"%uzero         = OpConstant %u32 0\n"
82 		"%fzero         = OpConstant %f32 0\n"
83 		"%one           = OpConstant %i32 1\n"
84 		"%twelve        = OpConstant %u32 12\n"
85                 "%f32arr12_t    = OpTypeArray %f32 %twelve\n"
86                 "%f32arr12ptr_t = OpTypePointer Function %f32arr12_t\n"
87 		"%f32funcptr    = OpTypePointer Function %f32\n"
88 		"%main          = OpFunction %void None %voidf\n"
89 		"%entry         = OpLabel\n"
90 
91 		"%f32arr12      = OpVariable %f32arr12ptr_t Function\n"
92 
93 		"%i1            = OpVariable %u32ptr Function\n"
94 		"%i2            = OpVariable %u32ptr Function\n"
95 		"                 OpStore %i1 %uzero\n"
96 		"                 OpStore %i2 %uzero\n"
97 
98 		"%idval         = OpLoad %uvec3 %id\n"
99 		"%x             = OpCompositeExtract %u32 %idval 0\n"
100 		"%inloc         = OpAccessChain %f32ptr %indata %zero %x\n"
101 		"%inval         = OpLoad %f32 %inloc\n"
102 
103 		// for (uint i = 0; i < 12; ++i) c[i] = float(i) * input_data.elements[x];
104 		"                 OpBranch %loop1_entry\n"
105 		"%loop1_entry   = OpLabel\n"
106 		"%i1_val        = OpLoad %u32 %i1\n"
107 		"%cmp1_lt       = OpULessThan %bool %i1_val %twelve\n"
108 		"                 OpLoopMerge %loop1_merge %loop1_body DependencyInfinite\n"
109 		"                 OpBranchConditional %cmp1_lt %loop1_body %loop1_merge\n"
110 		"%loop1_body    = OpLabel\n"
111 		"%i1_valf32     = OpConvertUToF %f32 %i1_val\n"
112 		"%mulf1         = OpFMul %f32 %i1_valf32 %inval\n"
113 		"%outloc1       = OpAccessChain %f32funcptr %f32arr12 %i1_val\n"
114 		"                 OpStore %outloc1 %mulf1\n"
115 		"%new1_i        = OpIAdd %u32 %i1_val %one\n"
116 		"                 OpStore %i1 %new1_i\n"
117 		"                 OpBranch %loop1_entry\n"
118 		"%loop1_merge   = OpLabel\n"
119 
120 		//   output_data.elements[x] = 0.0f;
121 		"%outloc        = OpAccessChain %f32ptr %outdata %zero %x\n"
122 		"                 OpStore %outloc %fzero\n"
123 		"                 OpBranch %loop2_entry\n"
124 
125 		//   for (uint i = 0; i < n; ++i) output_data.elements[x] += c[i];
126 		"%loop2_entry   = OpLabel\n"
127 		"%i2_val        = OpLoad %u32 %i2\n"
128 		"%cmp2_lt       = OpULessThan %bool %i2_val %twelve\n"
129 		"                 OpLoopMerge %loop2_merge %loop2_body None\n"
130 		"                 OpBranchConditional %cmp2_lt %loop2_body %loop2_merge\n"
131 		"%loop2_body    = OpLabel\n"
132 		"%arr1_i2loc    = OpAccessChain %f32funcptr %f32arr12 %i2_val\n"
133 		"%arr1_i2val    = OpLoad %f32 %arr1_i2loc\n"
134 		"%outval        = OpLoad %f32 %outloc\n"
135 		"%addf1         = OpFAdd %f32 %outval %arr1_i2val\n"
136 		"                 OpStore %outloc %addf1\n"
137 		"%new_i2        = OpIAdd %u32 %i2_val %one\n"
138 		"                 OpStore %i2 %new_i2\n"
139 		"                 OpBranch %loop2_entry\n"
140 		"%loop2_merge   = OpLabel\n"
141 
142 		"                 OpReturn\n"
143 		"                 OpFunctionEnd\n";
144 }
145 
getComputeShaderSpec()146 static ComputeShaderSpec getComputeShaderSpec ()
147 {
148 	de::Random			rnd				(0xABC);
149 	const int			numElements		= 100;
150 	vector<float>		inputFloats		(numElements, 0);
151 	vector<float>		outputFloats	(numElements, 0);
152 	ComputeShaderSpec	spec;
153 
154 	for (size_t ndx = 0; ndx < numElements; ++ndx)
155 		inputFloats[ndx] = deFloatFloor(rnd.getFloat(1.0f, 100.0f));
156 
157 	for (size_t ndx = 0; ndx < numElements; ++ndx)
158 	{
159 		const deUint32 n = 12;
160 		float c[n];
161 		float result = 0.0f;
162 
163 		for (deUint32 i = 0; i < n; ++i)
164 			c[i] = float(i) * inputFloats[ndx];
165 
166 		for (deUint32 i = 0; i < n; ++i)
167 			result += c[i];
168 
169 		outputFloats[ndx] = result;
170 	}
171 
172 	// Shader source code can be retrieved to complete definition of ComputeShaderSpec, though it is not required at this stage
173 	// getComputeSourceCode (spec.assembly);
174 
175 	spec.inputs.push_back(BufferSp(new Float32Buffer(inputFloats)));
176 	spec.outputs.push_back(BufferSp(new Float32Buffer(outputFloats)));
177 	spec.numWorkGroups	= tcu::IVec3(numElements, 1, 1);
178 	spec.verifyIO		= &verifyOutput;
179 
180 	return spec;
181 }
182 
183 
184 class SpvAsmLoopControlDependencyInfiniteInstance : public ComputeShaderSpec, public SpvAsmComputeShaderInstance
185 {
186 public:
187 	SpvAsmLoopControlDependencyInfiniteInstance	(Context& ctx);
188 };
189 
SpvAsmLoopControlDependencyInfiniteInstance(Context & ctx)190 SpvAsmLoopControlDependencyInfiniteInstance::SpvAsmLoopControlDependencyInfiniteInstance (Context& ctx)
191 	: ComputeShaderSpec(getComputeShaderSpec())
192 	, SpvAsmComputeShaderInstance(ctx, *this)
193 {
194 }
195 
SpvAsmLoopControlDependencyInfiniteCase(tcu::TestContext & testCtx,const char * name,const char * description)196 SpvAsmLoopControlDependencyInfiniteCase::SpvAsmLoopControlDependencyInfiniteCase (tcu::TestContext& testCtx, const char* name, const char* description)
197 	: TestCase			(testCtx, name, description)
198 {
199 }
200 
initPrograms(SourceCollections & programCollection) const201 void SpvAsmLoopControlDependencyInfiniteCase::initPrograms (SourceCollections& programCollection) const
202 {
203 	std::string comp;
204 
205 	getComputeSourceCode(comp);
206 
207 	programCollection.spirvAsmSources.add("compute") << SpirVAsmBuildOptions(programCollection.usedVulkanVersion, SPIRV_VERSION_1_3) << comp;
208 }
209 
createInstance(Context & context) const210 TestInstance* SpvAsmLoopControlDependencyInfiniteCase::createInstance (Context& context) const
211 {
212 	if (!context.contextSupports(vk::ApiVersion(1, 1, 0)))
213 		TCU_THROW(NotSupportedError, "SPIR-V higher than 1.3 is required for this test to run");
214 
215 	return new SpvAsmLoopControlDependencyInfiniteInstance(context);
216 }
217 
218 } // SpirVAssembly
219 } // vkt
220