1 /*-------------------------------------------------------------------------
2  * Vulkan Conformance Tests
3  * ------------------------
4  *
5  * Copyright (c) 2018 Google Inc.
6  * Copyright (c) 2018 The Khronos Group Inc.
7  *
8  * Licensed under the Apache License, Version 2.0 (the "License");
9  * you may not use this file except in compliance with the License.
10  * You may obtain a copy of the License at
11  *
12  *      http://www.apache.org/licenses/LICENSE-2.0
13  *
14  * Unless required by applicable law or agreed to in writing, software
15  * distributed under the License is distributed on an "AS IS" BASIS,
16  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
17  * See the License for the specific language governing permissions and
18  * limitations under the License.
19  *
20  *//*!
21  * \file
22  * \brief Tests for subpass dependency
23  *//*--------------------------------------------------------------------*/
24 
25 #include "vktRenderPassSubpassDependencyTests.hpp"
26 #include "vktRenderPassTestsUtil.hpp"
27 
28 #include "vktTestCaseUtil.hpp"
29 #include "vktTestGroupUtil.hpp"
30 #include "vkImageUtil.hpp"
31 #include "vkQueryUtil.hpp"
32 #include "vkRefUtil.hpp"
33 #include "vkCmdUtil.hpp"
34 #include "vkObjUtil.hpp"
35 #include "vkBuilderUtil.hpp"
36 
37 #include "tcuImageCompare.hpp"
38 #include "tcuResultCollector.hpp"
39 #include "tcuTestLog.hpp"
40 #include "tcuTextureUtil.hpp"
41 
42 #include "rrRenderer.hpp"
43 #include "deRandom.hpp"
44 #include "deMath.h"
45 
46 using namespace vk;
47 
48 using tcu::UVec4;
49 using tcu::Vec2;
50 using tcu::UVec2;
51 using tcu::Vec4;
52 
53 using tcu::ConstPixelBufferAccess;
54 using tcu::PixelBufferAccess;
55 
56 using tcu::TestLog;
57 
58 using std::string;
59 using std::vector;
60 using de::SharedPtr;
61 
62 typedef de::SharedPtr<Unique<VkImage> >					SharedPtrVkImage;
63 typedef de::SharedPtr<Unique<VkImageView> >				SharedPtrVkImageView;
64 typedef de::SharedPtr<Unique<VkPipeline> >				SharedPtrVkPipeline;
65 typedef de::SharedPtr<Unique<VkSampler> >				SharedPtrVkSampler;
66 typedef de::SharedPtr<Unique<VkRenderPass> >			SharedPtrVkRenderPass;
67 typedef de::SharedPtr<Unique<VkFramebuffer> >			SharedPtrVkFramebuffer;
68 typedef de::SharedPtr<Unique<VkDescriptorPool> >		SharedPtrVkDescriptorPool;
69 typedef de::SharedPtr<Unique<VkDescriptorSetLayout> >	SharedPtrVkDescriptorLayout;
70 typedef de::SharedPtr<Unique<VkDescriptorSet> >			SharedPtrVkDescriptorSet;
71 typedef de::SharedPtr<Unique<VkPipelineLayout> >		SharedPtrVkPipelineLayout;
72 typedef de::SharedPtr<Unique<VkPipeline> >				SharedPtrVkPipeline;
73 
74 namespace vkt
75 {
76 namespace
77 {
78 using namespace renderpass;
79 
80 template<typename T>
makeSharedPtr(Move<T> move)81 inline SharedPtr<Unique<T> > makeSharedPtr(Move<T> move)
82 {
83 	return SharedPtr<Unique<T> >(new Unique<T>(move));
84 }
85 
getRepresentableDepthChannel(const ConstPixelBufferAccess & access)86 tcu::TextureLevel getRepresentableDepthChannel (const ConstPixelBufferAccess& access)
87 {
88 	tcu::TextureLevel depthChannel (mapVkFormat(VK_FORMAT_R8G8B8_UNORM), access.getWidth(), access.getHeight());
89 
90 	for (int y = 0; y < access.getHeight(); y++)
91 	for (int x = 0; x < access.getWidth(); x++)
92 		depthChannel.getAccess().setPixel(tcu::Vec4(access.getPixDepth(x, y)), x, y);
93 
94 	return depthChannel;
95 }
96 
verifyDepth(Context & context,const ConstPixelBufferAccess & reference,const ConstPixelBufferAccess & result,const float threshold)97 bool verifyDepth (Context&						context,
98 				  const ConstPixelBufferAccess&	reference,
99 				  const ConstPixelBufferAccess&	result,
100 				  const float					threshold)
101 {
102 	tcu::TestLog& log (context.getTestContext().getLog());
103 
104 	return tcu::floatThresholdCompare(log,										// log
105 									  "Depth channel",							// imageSetName
106 									  "Depth compare",							// imageSetDesc
107 									  getRepresentableDepthChannel(reference),	// reference
108 									  getRepresentableDepthChannel(result),		// result
109 									  Vec4(threshold),							// threshold
110 									  tcu::COMPARE_LOG_RESULT);					// logMode
111 }
112 
verifyStencil(Context & context,const ConstPixelBufferAccess & reference,const ConstPixelBufferAccess & result)113 bool verifyStencil (Context&						context,
114 					const ConstPixelBufferAccess&	reference,
115 					const ConstPixelBufferAccess&	result)
116 {
117 	tcu::TextureLevel	stencilErrorImage	(tcu::TextureFormat(tcu::TextureFormat::RGBA, tcu::TextureFormat::UNORM_INT8), result.getWidth(), result.getHeight());
118 	tcu::TestLog&		log					(context.getTestContext().getLog());
119 	bool				stencilOk			(DE_TRUE);
120 
121 	for (int y = 0; y < result.getHeight(); y++)
122 	for (int x = 0; x < result.getWidth(); x++)
123 	{
124 		if (result.getPixStencil(x, y) != reference.getPixStencil(x, y))
125 		{
126 			stencilErrorImage.getAccess().setPixel(Vec4(1.0f, 0.0f, 0.0f, 1.0f), x, y);
127 			stencilOk = DE_FALSE;
128 		}
129 		else
130 			stencilErrorImage.getAccess().setPixel(Vec4(0.0f, 1.0f, 0.0f, 1.0f), x, y);
131 	}
132 
133 	log << tcu::TestLog::ImageSet("Stencil compare", "Stencil compare")
134 		<< tcu::TestLog::Image("Result stencil channel", "Result stencil channel", result)
135 		<< tcu::TestLog::Image("Reference stencil channel", "Reference stencil channel", reference);
136 
137 	if (!stencilOk)
138 		log << tcu::TestLog::Image("Stencil error mask", "Stencil error mask", stencilErrorImage);
139 
140 	log << tcu::TestLog::EndImageSet;
141 
142 	return stencilOk;
143 }
144 
145 // Reference renderer shaders
146 class DepthVertShader : public rr::VertexShader
147 {
148 public:
DepthVertShader(void)149 	DepthVertShader (void)
150 	: rr::VertexShader (1, 1)
151 	{
152 		m_inputs[0].type	= rr::GENERICVECTYPE_FLOAT;
153 		m_outputs[0].type	= rr::GENERICVECTYPE_FLOAT;
154 	}
155 
shadeVertices(const rr::VertexAttrib * inputs,rr::VertexPacket * const * packets,const int numPackets) const156 	void shadeVertices (const rr::VertexAttrib* inputs, rr::VertexPacket* const* packets, const int numPackets) const
157 	{
158 		for (int packetNdx = 0; packetNdx < numPackets; ++packetNdx)
159 		{
160 			packets[packetNdx]->position	= rr::readVertexAttribFloat(inputs[0],
161 																		packets[packetNdx]->instanceNdx,
162 																		packets[packetNdx]->vertexNdx);
163 
164 			packets[packetNdx]->outputs[0]	= rr::readVertexAttribFloat(inputs[0],
165 																		packets[packetNdx]->instanceNdx,
166 																		packets[packetNdx]->vertexNdx);
167 		}
168 	}
169 };
170 
171 class DepthFragShader : public rr::FragmentShader
172 {
173 public:
DepthFragShader(void)174 	DepthFragShader (void)
175 	: rr::FragmentShader(1, 1)
176 	{
177 		m_inputs[0].type	= rr::GENERICVECTYPE_FLOAT;
178 		m_outputs[0].type	= rr::GENERICVECTYPE_FLOAT;
179 	}
180 
shadeFragments(rr::FragmentPacket * packets,const int numPackets,const rr::FragmentShadingContext & context) const181 	void shadeFragments (rr::FragmentPacket* packets, const int numPackets, const rr::FragmentShadingContext& context) const
182 	{
183 		for (int packetNdx = 0; packetNdx < numPackets; ++packetNdx)
184 		{
185 			rr::FragmentPacket& packet = packets[packetNdx];
186 			for (deUint32 fragNdx = 0; fragNdx < rr::NUM_FRAGMENTS_PER_PACKET; ++fragNdx)
187 			{
188 				const tcu::Vec4 vtxPosition = rr::readVarying<float>(packet, context, 0, fragNdx);
189 
190 				rr::writeFragmentDepth(context, packetNdx, fragNdx, 0, vtxPosition.z());
191 			}
192 		}
193 	}
194 };
195 
196 class SelfDependencyBackwardsVertShader : public rr::VertexShader
197 {
198 public:
SelfDependencyBackwardsVertShader(void)199 	SelfDependencyBackwardsVertShader (void)
200 	: rr::VertexShader (1, 0)
201 	{
202 		m_inputs[0].type	= rr::GENERICVECTYPE_FLOAT;
203 	}
204 
shadeVertices(const rr::VertexAttrib * inputs,rr::VertexPacket * const * packets,const int numPackets) const205 	void shadeVertices (const rr::VertexAttrib* inputs, rr::VertexPacket* const* packets, const int numPackets) const
206 	{
207 		for (int packetNdx = 0; packetNdx < numPackets; ++packetNdx)
208 		{
209 			packets[packetNdx]->position	= rr::readVertexAttribFloat(inputs[0],
210 																		packets[packetNdx]->instanceNdx,
211 																		packets[packetNdx]->vertexNdx);
212 		}
213 	}
214 };
215 
216 class SelfDependencyBackwardsFragShader : public rr::FragmentShader
217 {
218 public:
SelfDependencyBackwardsFragShader(void)219 	SelfDependencyBackwardsFragShader (void)
220 	: rr::FragmentShader(0, 1)
221 	{
222 		m_outputs[0].type	= rr::GENERICVECTYPE_FLOAT;
223 	}
224 
shadeFragments(rr::FragmentPacket * packets,const int numPackets,const rr::FragmentShadingContext & context) const225 	void shadeFragments (rr::FragmentPacket* packets, const int numPackets, const rr::FragmentShadingContext& context) const
226 	{
227 		DE_UNREF(packets);
228 
229 		for (int packetNdx = 0; packetNdx < numPackets; ++packetNdx)
230 			for (deUint32 fragNdx = 0; fragNdx < rr::NUM_FRAGMENTS_PER_PACKET; ++fragNdx)
231 				rr::writeFragmentOutput<tcu::Vec4>(context, packetNdx, fragNdx, 0, tcu::Vec4(1.0f, 0.0f, 0.0f, 1.0f));
232 	}
233 };
234 
createBufferMemory(const DeviceInterface & vk,VkDevice device,Allocator & allocator,VkBuffer buffer)235 de::MovePtr<Allocation> createBufferMemory (const DeviceInterface&	vk,
236 											VkDevice				device,
237 											Allocator&				allocator,
238 											VkBuffer				buffer)
239 {
240 	de::MovePtr<Allocation> allocation (allocator.allocate(getBufferMemoryRequirements(vk, device, buffer), MemoryRequirement::HostVisible));
241 
242 	VK_CHECK(vk.bindBufferMemory(device, buffer, allocation->getMemory(), allocation->getOffset()));
243 
244 	return allocation;
245 }
246 
createImageView(const DeviceInterface & vk,VkDevice device,VkImageViewCreateFlags flags,VkImage image,VkImageViewType viewType,VkFormat format,VkComponentMapping components,VkImageSubresourceRange subresourceRange)247 Move<VkImageView> createImageView (const DeviceInterface&	vk,
248 								   VkDevice					device,
249 								   VkImageViewCreateFlags	flags,
250 								   VkImage					image,
251 								   VkImageViewType			viewType,
252 								   VkFormat					format,
253 								   VkComponentMapping		components,
254 								   VkImageSubresourceRange	subresourceRange)
255 {
256 	const VkImageViewCreateInfo pCreateInfo =
257 	{
258 		VK_STRUCTURE_TYPE_IMAGE_VIEW_CREATE_INFO,	// VkStructureType			sType
259 		DE_NULL,									// const void*				pNext
260 		flags,										// VkImageViewCreateFlags	flags
261 		image,										// VkImage					image
262 		viewType,									// VkImageViewType			viewType
263 		format,										// VkFormat					format
264 		components,									// VkComponentMapping		components
265 		subresourceRange,							// VkImageSubresourceRange	subresourceRange
266 	};
267 
268 	return createImageView(vk, device, &pCreateInfo);
269 }
270 
createImageViews(const DeviceInterface & vkd,VkDevice device,vector<SharedPtrVkImage> images,VkFormat format,VkImageAspectFlags aspect)271 vector<SharedPtrVkImageView> createImageViews (const DeviceInterface&	vkd,
272 											   VkDevice					device,
273 											   vector<SharedPtrVkImage>	images,
274 											   VkFormat					format,
275 											   VkImageAspectFlags		aspect)
276 {
277 	vector<SharedPtrVkImageView> imageViews;
278 
279 	for (size_t imageViewNdx = 0; imageViewNdx < images.size(); imageViewNdx++)
280 	{
281 		const VkImageSubresourceRange range =
282 		{
283 			aspect,	// VkImageAspectFlags	aspectMask
284 			0u,		// uint32_t				baseMipLevel
285 			1u,		// uint32_t				levelCount
286 			0u,		// uint32_t				baseArrayLayer
287 			1u		// uint32_t				layerCount
288 		};
289 
290 		imageViews.push_back(makeSharedPtr(createImageView(vkd, device, 0u, **images[imageViewNdx], VK_IMAGE_VIEW_TYPE_2D, format, makeComponentMappingRGBA(), range)));
291 	}
292 
293 	return imageViews;
294 }
295 
createBuffer(const DeviceInterface & vkd,VkDevice device,VkFormat format,deUint32 width,deUint32 height)296 Move<VkBuffer> createBuffer (const DeviceInterface&	vkd,
297 							 VkDevice				device,
298 							 VkFormat				format,
299 							 deUint32				width,
300 							 deUint32				height)
301 {
302 	const VkBufferUsageFlags	bufferUsage	(VK_BUFFER_USAGE_TRANSFER_SRC_BIT | VK_BUFFER_USAGE_TRANSFER_DST_BIT);
303 	const VkDeviceSize			pixelSize	= mapVkFormat(format).getPixelSize();
304 	const VkBufferCreateInfo	createInfo	=
305 	{
306 		VK_STRUCTURE_TYPE_BUFFER_CREATE_INFO,	// VkStructureType		sType
307 		DE_NULL,								// const void*			pNext
308 		0u,										// VkBufferCreateFlags	flags
309 		width * height * pixelSize,				// VkDeviceSize			size
310 		bufferUsage,							// VkBufferUsageFlags	usage
311 		VK_SHARING_MODE_EXCLUSIVE,				// VkSharingMode		sharingMode
312 		0u,										// uint32_t				queueFamilyIndexCount
313 		DE_NULL									// const uint32_t*		pQueueFamilyIndices
314 	};
315 
316 	return createBuffer(vkd, device, &createInfo);
317 }
318 
createDescriptorSetLayouts(const DeviceInterface & vkd,VkDevice device,vector<SharedPtrVkSampler> & samplers)319 vector<SharedPtrVkDescriptorLayout> createDescriptorSetLayouts (const DeviceInterface&		vkd,
320 																VkDevice					device,
321 																vector<SharedPtrVkSampler>&	samplers)
322 {
323 	vector<SharedPtrVkDescriptorLayout> layouts;
324 
325 	for (size_t layoutNdx = 0; layoutNdx < samplers.size(); layoutNdx++)
326 	{
327 		const VkDescriptorSetLayoutBinding		bindings	=
328 		{
329 				0u,											// uint32_t				binding
330 				VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER,	// VkDescriptorType		descriptorType
331 				1u,											// uint32_t				descriptorCount
332 				VK_SHADER_STAGE_FRAGMENT_BIT,				// VkShaderStageFlags	stageFlags
333 				&**samplers[layoutNdx]						// const VkSampler*		pImmutableSamplers
334 		};
335 
336 		const VkDescriptorSetLayoutCreateInfo	createInfo	=
337 		{
338 			VK_STRUCTURE_TYPE_DESCRIPTOR_SET_LAYOUT_CREATE_INFO,	// VkStructureType						sType
339 			DE_NULL,												// const void*							pNext
340 			0u,														// VkDescriptorSetLayoutCreateFlags		flags
341 			1u,														// uint32_t								bindingCount
342 			&bindings												// const VkDescriptorSetLayoutBinding*	pBindings
343 		};
344 
345 		layouts.push_back(makeSharedPtr(createDescriptorSetLayout(vkd, device, &createInfo)));
346 	}
347 
348 	return layouts;
349 }
350 
createDescriptorPools(const DeviceInterface & vkd,VkDevice device,vector<SharedPtrVkDescriptorLayout> & layouts,VkDescriptorType type)351 vector<SharedPtrVkDescriptorPool> createDescriptorPools (const DeviceInterface&					vkd,
352 														 VkDevice								device,
353 														 vector<SharedPtrVkDescriptorLayout>&	layouts,
354 														 VkDescriptorType						type)
355 {
356 	vector<SharedPtrVkDescriptorPool> descriptorPools;
357 
358 	for (size_t poolNdx = 0; poolNdx < layouts.size(); poolNdx++)
359 	{
360 		const VkDescriptorPoolSize			size		=
361 		{
362 			type,	// VkDescriptorType		type
363 			1u		// uint32_t				descriptorCount
364 		};
365 
366 		const VkDescriptorPoolCreateInfo	createInfo	=
367 		{
368 			VK_STRUCTURE_TYPE_DESCRIPTOR_POOL_CREATE_INFO,		// VkStructureType				sType
369 			DE_NULL,											// const void*					pNext
370 			VK_DESCRIPTOR_POOL_CREATE_FREE_DESCRIPTOR_SET_BIT,	// VkDescriptorPoolCreateFlags	flags
371 			1u,													// uint32_t						maxSets
372 			1u,													// uint32_t						poolSizeCount
373 			&size												// const VkDescriptorPoolSize*	pPoolSizes
374 		};
375 
376 		descriptorPools.push_back(makeSharedPtr(createDescriptorPool(vkd, device, &createInfo)));
377 	}
378 
379 	return descriptorPools;
380 }
381 
382 struct ExternalTestConfig
383 {
ExternalTestConfigvkt::__anon104c10a40111::ExternalTestConfig384 	ExternalTestConfig	(VkFormat				format_,
385 						 UVec2					imageSize_,
386 						 vector<RenderPass>		renderPasses_,
387 						 RenderPassType			renderPassType_,
388 						 SynchronizationType	synchronizationType_,
389 						 deUint32				blurKernel_ = 4)
390 		: format				(format_)
391 		, imageSize				(imageSize_)
392 		, renderPasses			(renderPasses_)
393 		, renderPassType		(renderPassType_)
394 		, synchronizationType	(synchronizationType_)
395 		, blurKernel			(blurKernel_)
396 	{
397 	}
398 
399 	VkFormat			format;
400 	UVec2				imageSize;
401 	vector<RenderPass>	renderPasses;
402 	RenderPassType		renderPassType;
403 	SynchronizationType	synchronizationType;
404 	deUint32			blurKernel;
405 };
406 
407 class ExternalDependencyTestInstance : public TestInstance
408 {
409 public:
410 											ExternalDependencyTestInstance	(Context& context, ExternalTestConfig testConfig);
411 											~ExternalDependencyTestInstance	(void);
412 
413 	vector<SharedPtrVkImage>				createAndAllocateImages			(const DeviceInterface&					vk,
414 																			 VkDevice								device,
415 																			 Allocator&								allocator,
416 																			 vector<de::SharedPtr<Allocation> >&	imageMemories,
417 																			 deUint32								universalQueueFamilyIndex,
418 																			 VkFormat								format,
419 																			 deUint32								width,
420 																			 deUint32								height,
421 																			 vector<RenderPass>						renderPasses);
422 
423 	vector<SharedPtrVkSampler>				createSamplers					(const DeviceInterface&					vkd,
424 																			 const VkDevice							device,
425 																			 vector<RenderPass>&					renderPasses);
426 
427 	vector<SharedPtrVkRenderPass>			createRenderPasses				(const DeviceInterface&					vkd,
428 																			 VkDevice								device,
429 																			 vector<RenderPass>						renderPassInfos,
430 																			 const RenderPassType					renderPassType,
431 																			 const SynchronizationType				synchronizationType);
432 
433 	vector<SharedPtrVkFramebuffer>			createFramebuffers				(const DeviceInterface&					vkd,
434 																			 VkDevice								device,
435 																			 vector<SharedPtrVkRenderPass>&			renderPasses,
436 																			 vector<SharedPtrVkImageView>&			dstImageViews,
437 																			 deUint32								width,
438 																			 deUint32								height);
439 
440 	vector<SharedPtrVkPipelineLayout>		createRenderPipelineLayouts		(const DeviceInterface&					vkd,
441 																			 VkDevice								device,
442 																			 vector<SharedPtrVkRenderPass>&			renderPasses,
443 																			 vector<SharedPtrVkDescriptorLayout>&	descriptorSetLayouts);
444 
445 	vector<SharedPtrVkPipeline>				createRenderPipelines			(const DeviceInterface&					vkd,
446 																			 VkDevice								device,
447 																			 vector<SharedPtrVkRenderPass>&			renderPasses,
448 																			 vector<SharedPtrVkPipelineLayout>&		pipelineLayouts,
449 																			 const BinaryCollection&				binaryCollection,
450 																			 deUint32								width,
451 																			 deUint32								height);
452 
453 	vector<SharedPtrVkDescriptorSet>		createDescriptorSets			(const DeviceInterface&					vkd,
454 																			 VkDevice								device,
455 																			 vector<SharedPtrVkDescriptorPool>&		pools,
456 																			 vector<SharedPtrVkDescriptorLayout>&	layouts,
457 																			 vector<SharedPtrVkImageView>&			imageViews,
458 																			 vector<SharedPtrVkSampler>&			samplers);
459 
460 	tcu::TestStatus							iterate							(void);
461 
462 	template<typename RenderpassSubpass>
463 	tcu::TestStatus							iterateInternal					(void);
464 
465 private:
466 	const bool								m_renderPass2Supported;
467 	const bool								m_synchronization2Supported;
468 	const RenderPassType					m_renderPassType;
469 
470 	const deUint32							m_width;
471 	const deUint32							m_height;
472 	const deUint32							m_blurKernel;
473 	const VkFormat							m_format;
474 
475 	vector<de::SharedPtr<Allocation> >		m_imageMemories;
476 	vector<SharedPtrVkImage>				m_images;
477 	vector<SharedPtrVkImageView>			m_imageViews;
478 	vector<SharedPtrVkSampler>				m_samplers;
479 
480 	const Unique<VkBuffer>					m_dstBuffer;
481 	const de::UniquePtr<Allocation>			m_dstBufferMemory;
482 
483 	vector<SharedPtrVkRenderPass>			m_renderPasses;
484 	vector<SharedPtrVkFramebuffer>			m_framebuffers;
485 
486 	vector<SharedPtrVkDescriptorLayout>		m_subpassDescriptorSetLayouts;
487 	vector<SharedPtrVkDescriptorPool>		m_subpassDescriptorPools;
488 	vector<SharedPtrVkDescriptorSet>		m_subpassDescriptorSets;
489 
490 	vector<SharedPtrVkPipelineLayout>		m_renderPipelineLayouts;
491 	vector<SharedPtrVkPipeline>				m_renderPipelines;
492 
493 	const Unique<VkCommandPool>				m_commandPool;
494 	tcu::ResultCollector					m_resultCollector;
495 };
496 
ExternalDependencyTestInstance(Context & context,ExternalTestConfig testConfig)497 ExternalDependencyTestInstance::ExternalDependencyTestInstance (Context& context, ExternalTestConfig testConfig)
498 	: TestInstance					(context)
499 	, m_renderPass2Supported		((testConfig.renderPassType == RENDERPASS_TYPE_RENDERPASS2) && context.requireDeviceFunctionality("VK_KHR_create_renderpass2"))
500 	, m_synchronization2Supported	((testConfig.synchronizationType == SYNCHRONIZATION_TYPE_SYNCHRONIZATION2) && context.requireDeviceFunctionality("VK_KHR_synchronization2"))
501 	, m_renderPassType				(testConfig.renderPassType)
502 	, m_width						(testConfig.imageSize.x())
503 	, m_height						(testConfig.imageSize.y())
504 	, m_blurKernel					(testConfig.blurKernel)
505 	, m_format						(testConfig.format)
506 	, m_images						(createAndAllocateImages(context.getDeviceInterface(), context.getDevice(), context.getDefaultAllocator(), m_imageMemories, context.getUniversalQueueFamilyIndex(), m_format, m_width, m_height, testConfig.renderPasses))
507 	, m_imageViews					(createImageViews(context.getDeviceInterface(), context.getDevice(), m_images, m_format, VK_IMAGE_ASPECT_COLOR_BIT))
508 	, m_samplers					(createSamplers(context.getDeviceInterface(), context.getDevice(), testConfig.renderPasses))
509 	, m_dstBuffer					(createBuffer(context.getDeviceInterface(), context.getDevice(), m_format, m_width, m_height))
510 	, m_dstBufferMemory				(createBufferMemory(context.getDeviceInterface(), context.getDevice(), context.getDefaultAllocator(), *m_dstBuffer))
511 	, m_renderPasses				(createRenderPasses(context.getDeviceInterface(), context.getDevice(), testConfig.renderPasses, testConfig.renderPassType, testConfig.synchronizationType))
512 	, m_framebuffers				(createFramebuffers(context.getDeviceInterface(), context.getDevice(), m_renderPasses, m_imageViews, m_width, m_height))
513 	, m_subpassDescriptorSetLayouts	(createDescriptorSetLayouts(context.getDeviceInterface(), context.getDevice(), m_samplers))
514 	, m_subpassDescriptorPools		(createDescriptorPools(context.getDeviceInterface(), context.getDevice(), m_subpassDescriptorSetLayouts, VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER))
515 	, m_subpassDescriptorSets		(createDescriptorSets(context.getDeviceInterface(), context.getDevice(), m_subpassDescriptorPools, m_subpassDescriptorSetLayouts, m_imageViews, m_samplers))
516 	, m_renderPipelineLayouts		(createRenderPipelineLayouts(context.getDeviceInterface(), context.getDevice(), m_renderPasses, m_subpassDescriptorSetLayouts))
517 	, m_renderPipelines				(createRenderPipelines(context.getDeviceInterface(), context.getDevice(), m_renderPasses, m_renderPipelineLayouts, context.getBinaryCollection(), m_width, m_height))
518 	, m_commandPool					(createCommandPool(context.getDeviceInterface(), context.getDevice(), VK_COMMAND_POOL_CREATE_TRANSIENT_BIT, context.getUniversalQueueFamilyIndex()))
519 {
520 }
521 
~ExternalDependencyTestInstance(void)522 ExternalDependencyTestInstance::~ExternalDependencyTestInstance (void)
523 {
524 }
525 
createAndAllocateImages(const DeviceInterface & vk,VkDevice device,Allocator & allocator,vector<de::SharedPtr<Allocation>> & imageMemories,deUint32 universalQueueFamilyIndex,VkFormat format,deUint32 width,deUint32 height,vector<RenderPass> renderPasses)526 vector<SharedPtrVkImage> ExternalDependencyTestInstance::createAndAllocateImages (const DeviceInterface&				vk,
527 																				  VkDevice								device,
528 																				  Allocator&							allocator,
529 																				  vector<de::SharedPtr<Allocation> >&	imageMemories,
530 																				  deUint32								universalQueueFamilyIndex,
531 																				  VkFormat								format,
532 																				  deUint32								width,
533 																				  deUint32								height,
534 																				  vector<RenderPass>					renderPasses)
535 {
536 	vector<SharedPtrVkImage> images;
537 
538 	for (size_t imageNdx = 0; imageNdx < renderPasses.size(); imageNdx++)
539 	{
540 		const VkExtent3D		imageExtent		=
541 		{
542 			width,		// uint32_t		width
543 			height,		// uint32_t		height
544 			1u			// uint32_t		depth
545 		};
546 
547 		const VkImageCreateInfo	imageCreateInfo	=
548 		{
549 			VK_STRUCTURE_TYPE_IMAGE_CREATE_INFO,	// VkStructureType			sType
550 			DE_NULL,								// const void*				pNext
551 			0u,										// VkImageCreateFlags		flags
552 			VK_IMAGE_TYPE_2D,						// VkImageType				imageType
553 			format,									// VkFormat					format
554 			imageExtent,							// VkExtent3D				extent
555 			1u,										// uint32_t					mipLevels
556 			1u,										// uint32_t					arrayLayers
557 			VK_SAMPLE_COUNT_1_BIT,					// VkSampleCountFlagBits	samples
558 			VK_IMAGE_TILING_OPTIMAL,				// VkImageTiling			tiling
559 			VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT
560 				| VK_IMAGE_USAGE_SAMPLED_BIT
561 				| VK_IMAGE_USAGE_TRANSFER_SRC_BIT,	// VkImageUsageFlags		usage
562 			VK_SHARING_MODE_EXCLUSIVE,				// VkSharingMode			sharingMode
563 			1u,										// uint32_t					queueFamilyIndexCount
564 			&universalQueueFamilyIndex,				// const uint32_t*			pQueueFamilyIndices
565 			VK_IMAGE_LAYOUT_UNDEFINED				// VkImageLayout			initialLayout
566 		};
567 
568 		images.push_back(makeSharedPtr(vk::createImage(vk, device, &imageCreateInfo, DE_NULL)));
569 		imageMemories.push_back((de::SharedPtr<Allocation>)allocator.allocate(getImageMemoryRequirements(vk, device, **images[imageNdx]), MemoryRequirement::Any).release());
570 		VK_CHECK(vk.bindImageMemory(device, **images[imageNdx], imageMemories[imageNdx]->getMemory(), imageMemories[imageNdx]->getOffset()));
571 	}
572 
573 	return images;
574 }
575 
createSamplers(const DeviceInterface & vkd,const VkDevice device,vector<RenderPass> & renderPasses)576 vector<SharedPtrVkSampler> ExternalDependencyTestInstance::createSamplers (const DeviceInterface&	vkd,
577 																		   const VkDevice			device,
578 																		   vector<RenderPass>&		renderPasses)
579 {
580 	vector<SharedPtrVkSampler> samplers;
581 
582 	for (size_t samplerNdx = 0; samplerNdx < renderPasses.size() - 1; samplerNdx++)
583 	{
584 		const VkSamplerCreateInfo samplerInfo =
585 		{
586 			VK_STRUCTURE_TYPE_SAMPLER_CREATE_INFO,		// VkStructureType			sType
587 			DE_NULL,									// const void*				pNext
588 			0u,											// VkSamplerCreateFlags		flags
589 			VK_FILTER_NEAREST,							// VkFilter					magFilter
590 			VK_FILTER_NEAREST,							// VkFilter					minFilter
591 			VK_SAMPLER_MIPMAP_MODE_NEAREST,				// VkSamplerMipmapMode		mipmapMode
592 			VK_SAMPLER_ADDRESS_MODE_CLAMP_TO_EDGE,		// VkSamplerAddressMode		addressModeU
593 			VK_SAMPLER_ADDRESS_MODE_CLAMP_TO_EDGE,		// VkSamplerAddressMode		addressModeV
594 			VK_SAMPLER_ADDRESS_MODE_CLAMP_TO_EDGE,		// VkSamplerAddressMode		addressModeW
595 			0.0f,										// float					mipLodBias
596 			VK_FALSE,									// VkBool32					anisotropyEnable
597 			1.0f,										// float					maxAnisotropy
598 			VK_FALSE,									// VkBool32					compareEnable
599 			VK_COMPARE_OP_ALWAYS,						// VkCompareOp				compareOp
600 			0.0f,										// float					minLod
601 			0.0f,										// float					maxLod
602 			VK_BORDER_COLOR_FLOAT_TRANSPARENT_BLACK,	// VkBorderColor			borderColor
603 			VK_FALSE,									// VkBool32					unnormalizedCoordinates
604 		};
605 
606 		samplers.push_back(makeSharedPtr(createSampler(vkd, device, &samplerInfo)));
607 	}
608 
609 	return samplers;
610 }
611 
createRenderPasses(const DeviceInterface & vkd,VkDevice device,vector<RenderPass> renderPassInfos,const RenderPassType renderPassType,const SynchronizationType synchronizationType)612 vector<SharedPtrVkRenderPass> ExternalDependencyTestInstance::createRenderPasses (const DeviceInterface&	vkd,
613 																				  VkDevice					device,
614 																				  vector<RenderPass>		renderPassInfos,
615 																				  const RenderPassType		renderPassType,
616 																				  const SynchronizationType	synchronizationType)
617 {
618 	vector<SharedPtrVkRenderPass> renderPasses;
619 	renderPasses.reserve(renderPassInfos.size());
620 
621 	for (const auto& renderPassInfo : renderPassInfos)
622 		renderPasses.push_back(makeSharedPtr(createRenderPass(vkd, device, renderPassInfo, renderPassType, synchronizationType)));
623 
624 	return renderPasses;
625 }
626 
createFramebuffers(const DeviceInterface & vkd,VkDevice device,vector<SharedPtrVkRenderPass> & renderPasses,vector<SharedPtrVkImageView> & dstImageViews,deUint32 width,deUint32 height)627 vector<SharedPtrVkFramebuffer> ExternalDependencyTestInstance::createFramebuffers (const DeviceInterface&			vkd,
628 																				   VkDevice							device,
629 																				   vector<SharedPtrVkRenderPass>&	renderPasses,
630 																				   vector<SharedPtrVkImageView>&	dstImageViews,
631 																				   deUint32							width,
632 																				   deUint32							height)
633 {
634 	vector<SharedPtrVkFramebuffer> framebuffers;
635 
636 	for (size_t renderPassNdx = 0; renderPassNdx < renderPasses.size(); renderPassNdx++)
637 	{
638 		VkRenderPass renderPass (**renderPasses[renderPassNdx]);
639 
640 		const VkFramebufferCreateInfo createInfo =
641 		{
642 			VK_STRUCTURE_TYPE_FRAMEBUFFER_CREATE_INFO,	// VkStructureType			sType
643 			DE_NULL,									// const void*				pNext
644 			0u,											// VkFramebufferCreateFlags	flags
645 			renderPass,									// VkRenderPass				renderPass
646 			1u,											// uint32_t					attachmentCount
647 			&**dstImageViews[renderPassNdx],			// const VkImageView*		pAttachments
648 			width,										// uint32_t					width
649 			height,										// uint32_t					height
650 			1u											// uint32_t					layers
651 		};
652 
653 		framebuffers.push_back(makeSharedPtr(createFramebuffer(vkd, device, &createInfo)));
654 	}
655 
656 	return framebuffers;
657 }
658 
createDescriptorSets(const DeviceInterface & vkd,VkDevice device,vector<SharedPtrVkDescriptorPool> & pools,vector<SharedPtrVkDescriptorLayout> & layouts,vector<SharedPtrVkImageView> & imageViews,vector<SharedPtrVkSampler> & samplers)659 vector<SharedPtrVkDescriptorSet> ExternalDependencyTestInstance::createDescriptorSets (const DeviceInterface&				vkd,
660 																					   VkDevice								device,
661 																					   vector<SharedPtrVkDescriptorPool>&	pools,
662 																					   vector<SharedPtrVkDescriptorLayout>&	layouts,
663 																					   vector<SharedPtrVkImageView>&		imageViews,
664 																					   vector<SharedPtrVkSampler>&			samplers)
665 {
666 	vector<SharedPtrVkDescriptorSet> descriptorSets;
667 
668 	for (size_t setNdx = 0; setNdx < layouts.size(); setNdx++)
669 	{
670 		const VkDescriptorSetAllocateInfo allocateInfo =
671 		{
672 			VK_STRUCTURE_TYPE_DESCRIPTOR_SET_ALLOCATE_INFO,	// VkStructureType					sType
673 			DE_NULL,										// const void*						pNext
674 			**pools[setNdx],								// VkDescriptorPool					descriptorPool
675 			1u,												// uint32_t							descriptorSetCount
676 			&**layouts[setNdx]								// const VkDescriptorSetLayout*		pSetLayouts
677 		};
678 
679 		descriptorSets.push_back(makeSharedPtr(allocateDescriptorSet(vkd, device, &allocateInfo)));
680 
681 		{
682 			const VkDescriptorImageInfo	imageInfo	=
683 			{
684 				**samplers[setNdx],							// VkSampler		sampler
685 				**imageViews[setNdx],						// VkImageView		imageView
686 				VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL	// VkImageLayout	imageLayout
687 			};
688 
689 			const VkWriteDescriptorSet	write		=
690 			{
691 				VK_STRUCTURE_TYPE_WRITE_DESCRIPTOR_SET,		// VkStructureType					sType
692 				DE_NULL,									// const void*						pNext
693 				**descriptorSets[setNdx],					// VkDescriptorSet					dstSet
694 				0u,											// uint32_t							dstBinding
695 				0u,											// uint32_t							dstArrayElement
696 				1u,											// uint32_t							descriptorCount
697 				VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER,	// VkDescriptorType					descriptorType
698 				&imageInfo,									// const VkDescriptorImageInfo*		pImageInfo
699 				DE_NULL,									// const VkDescriptorBufferInfo*	pBufferInfo
700 				DE_NULL										// const VkBufferView*				pTexelBufferView
701 			};
702 
703 			vkd.updateDescriptorSets(device, 1u, &write, 0u, DE_NULL);
704 		}
705 	}
706 
707 	return descriptorSets;
708 }
709 
createRenderPipelineLayouts(const DeviceInterface & vkd,VkDevice device,vector<SharedPtrVkRenderPass> & renderPasses,vector<SharedPtrVkDescriptorLayout> & descriptorSetLayouts)710 vector<SharedPtrVkPipelineLayout> ExternalDependencyTestInstance::createRenderPipelineLayouts (const DeviceInterface&				vkd,
711 																							   VkDevice								device,
712 																							   vector<SharedPtrVkRenderPass>&		renderPasses,
713 																							   vector<SharedPtrVkDescriptorLayout>&	descriptorSetLayouts)
714 {
715 	vector<SharedPtrVkPipelineLayout> pipelineLayouts;
716 
717 	for (size_t renderPassNdx = 0; renderPassNdx < renderPasses.size(); renderPassNdx++)
718 	{
719 		const VkPipelineLayoutCreateInfo createInfo =
720 		{
721 			VK_STRUCTURE_TYPE_PIPELINE_LAYOUT_CREATE_INFO,								// VkStructureType				sType
722 			DE_NULL,																	// const void*					pNext
723 			(vk::VkPipelineLayoutCreateFlags)0,											// VkPipelineLayoutCreateFlags	flags
724 			renderPassNdx > 0 ? 1u : 0u,												// deUint32						setLayoutCount
725 			renderPassNdx > 0 ? &**descriptorSetLayouts[renderPassNdx - 1] : DE_NULL,	// const VkDescriptorSetLayout*	pSetLayouts
726 			0u,																			// deUint32						pushConstantRangeCount
727 			DE_NULL																		// const VkPushConstantRange*	pPushConstantRanges
728 		};
729 
730 		pipelineLayouts.push_back(makeSharedPtr(createPipelineLayout(vkd, device, &createInfo)));
731 	}
732 
733 	return pipelineLayouts;
734 }
735 
createRenderPipelines(const DeviceInterface & vkd,VkDevice device,vector<SharedPtrVkRenderPass> & renderPasses,vector<SharedPtrVkPipelineLayout> & pipelineLayouts,const BinaryCollection & binaryCollection,deUint32 width,deUint32 height)736 vector<SharedPtrVkPipeline> ExternalDependencyTestInstance::createRenderPipelines (const DeviceInterface&				vkd,
737 																				   VkDevice								device,
738 																				   vector<SharedPtrVkRenderPass>&		renderPasses,
739 																				   vector<SharedPtrVkPipelineLayout>&	pipelineLayouts,
740 																				   const BinaryCollection&				binaryCollection,
741 																				   deUint32								width,
742 																				   deUint32								height)
743 {
744 	vector<SharedPtrVkPipeline> pipelines;
745 
746 	for (size_t renderPassNdx = 0; renderPassNdx < renderPasses.size(); renderPassNdx++)
747 	{
748 		const Unique<VkShaderModule>					vertexShaderModule		(createShaderModule(vkd, device, binaryCollection.get("quad-vert-" + de::toString(renderPassNdx)), 0u));
749 		const Unique<VkShaderModule>					fragmentShaderModule	(createShaderModule(vkd, device, binaryCollection.get("quad-frag-" + de::toString(renderPassNdx)), 0u));
750 
751 		const VkPipelineVertexInputStateCreateInfo		vertexInputState		=
752 		{
753 			VK_STRUCTURE_TYPE_PIPELINE_VERTEX_INPUT_STATE_CREATE_INFO,	// VkStructureType							sType
754 			DE_NULL,													// const void*								pNext
755 			(VkPipelineVertexInputStateCreateFlags)0u,					// VkPipelineVertexInputStateCreateFlags	flags
756 			0u,															// uint32_t									vertexBindingDescriptionCount
757 			DE_NULL,													// const VkVertexInputBindingDescription*	pVertexBindingDescriptions
758 			0u,															// uint32_t									vertexAttributeDescriptionCount
759 			DE_NULL														// const VkVertexInputAttributeDescription*	pVertexAttributeDescriptions
760 		};
761 
762 		const std::vector<VkViewport>					viewports				(1, makeViewport(tcu::UVec2(width, height)));
763 		const std::vector<VkRect2D>						scissors				(1, makeRect2D(tcu::UVec2(width, height)));
764 		const VkRenderPass								renderPass				(**renderPasses[renderPassNdx]);
765 		const VkPipelineLayout							layout					(**pipelineLayouts[renderPassNdx]);
766 
767 		pipelines.push_back(makeSharedPtr(makeGraphicsPipeline(vkd,									// const DeviceInterface&						vk
768 															   device,								// const VkDevice								device
769 															   layout,								// const VkPipelineLayout						pipelineLayout
770 															   *vertexShaderModule,					// const VkShaderModule							vertexShaderModule
771 															   DE_NULL,								// const VkShaderModule							tessellationControlShaderModule
772 															   DE_NULL,								// const VkShaderModule							tessellationEvalShaderModule
773 															   DE_NULL,								// const VkShaderModule							geometryShaderModule
774 															   *fragmentShaderModule,				// const VkShaderModule							fragmentShaderModule
775 															   renderPass,							// const VkRenderPass							renderPass
776 															   viewports,							// const std::vector<VkViewport>&				viewports
777 															   scissors,							// const std::vector<VkRect2D>&					scissors
778 															   VK_PRIMITIVE_TOPOLOGY_TRIANGLE_LIST,	// const VkPrimitiveTopology					topology
779 															   0u,									// const deUint32								subpass
780 															   0u,									// const deUint32								patchControlPoints
781 															   &vertexInputState)));				// const VkPipelineVertexInputStateCreateInfo*	vertexInputStateCreateInfo
782 	}
783 
784 	return pipelines;
785 }
786 
iterate(void)787 tcu::TestStatus ExternalDependencyTestInstance::iterate (void)
788 {
789 	switch (m_renderPassType)
790 	{
791 		case RENDERPASS_TYPE_LEGACY:
792 			return iterateInternal<RenderpassSubpass1>();
793 		case RENDERPASS_TYPE_RENDERPASS2:
794 			return iterateInternal<RenderpassSubpass2>();
795 		default:
796 			TCU_THROW(InternalError, "Impossible");
797 	}
798 }
799 
800 template<typename RenderpassSubpass>
iterateInternal(void)801 tcu::TestStatus ExternalDependencyTestInstance::iterateInternal (void)
802 {
803 	const DeviceInterface&								vkd					(m_context.getDeviceInterface());
804 	const Unique<VkCommandBuffer>						commandBuffer		(allocateCommandBuffer(vkd, m_context.getDevice(), *m_commandPool, VK_COMMAND_BUFFER_LEVEL_PRIMARY));
805 	const typename RenderpassSubpass::SubpassBeginInfo	subpassBeginInfo	(DE_NULL, VK_SUBPASS_CONTENTS_INLINE);
806 	const typename RenderpassSubpass::SubpassEndInfo	subpassEndInfo		(DE_NULL);
807 
808 	beginCommandBuffer(vkd, *commandBuffer);
809 
810 	for (size_t renderPassNdx = 0; renderPassNdx < m_renderPasses.size(); renderPassNdx++)
811 	{
812 		// Begin render pass
813 		{
814 			VkRect2D renderArea =
815 			{
816 				{ 0u, 0u },				// VkOffset2D	offset
817 				{ m_width, m_height }	// VkExtent2D	extent
818 			};
819 
820 			const VkRenderPassBeginInfo beginInfo =
821 			{
822 				VK_STRUCTURE_TYPE_RENDER_PASS_BEGIN_INFO,	// VkStructureType		sType
823 				DE_NULL,									// const void*			pNext
824 				**m_renderPasses[renderPassNdx],			// VkRenderPass			renderPass
825 				**m_framebuffers[renderPassNdx],			// VkFramebuffer		framebuffer
826 				renderArea,									// VkRect2D				renderArea
827 				0u,											// uint32_t				clearValueCount
828 				DE_NULL										// const VkClearValue*	pClearValues
829 			};
830 
831 			RenderpassSubpass::cmdBeginRenderPass(vkd, *commandBuffer, &beginInfo, &subpassBeginInfo);
832 		}
833 
834 		vkd.cmdBindPipeline(*commandBuffer, VK_PIPELINE_BIND_POINT_GRAPHICS, **m_renderPipelines[renderPassNdx]);
835 
836 		// Use results from the previous pass as input texture
837 		if (renderPassNdx > 0)
838 			vkd.cmdBindDescriptorSets(*commandBuffer, VK_PIPELINE_BIND_POINT_GRAPHICS, **m_renderPipelineLayouts[renderPassNdx], 0, 1, &**m_subpassDescriptorSets[renderPassNdx - 1], 0, DE_NULL);
839 
840 		vkd.cmdDraw(*commandBuffer, 6u, 1u, 0u, 0u);
841 
842 		RenderpassSubpass::cmdEndRenderPass(vkd, *commandBuffer, &subpassEndInfo);
843 	}
844 
845 	// Memory barrier between rendering and copy
846 	{
847 		VkImageSubresourceRange		imageSubresourceRange	=
848 		{
849 			VK_IMAGE_ASPECT_COLOR_BIT,	// VkImageAspectFlags	aspectMask
850 			0u,							// uint32_t				baseMipLevel
851 			1u,							// uint32_t				levelCount
852 			0u,							// uint32_t				baseArrayLayer
853 			1u							// uint32_t				layerCount
854 		};
855 
856 		const VkImageMemoryBarrier	barrier					=
857 		{
858 			VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER,		// VkStructureType			sType
859 			DE_NULL,									// const void*				pNext
860 			0,											// VkAccessFlags			srcAccessMask
861 			VK_ACCESS_TRANSFER_READ_BIT,				// VkAccessFlags			dstAccessMask
862 			VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL,	// VkImageLayout			oldLayout
863 			VK_IMAGE_LAYOUT_TRANSFER_SRC_OPTIMAL,		// VkImageLayout			newLayout
864 			VK_QUEUE_FAMILY_IGNORED,					// uint32_t					srcQueueFamilyIndex
865 			VK_QUEUE_FAMILY_IGNORED,					// uint32_t					dstQueueFamilyIndex
866 			**m_images[m_renderPasses.size() - 1],		// VkImage					image
867 			imageSubresourceRange						// VkImageSubresourceRange	subresourceRange
868 		};
869 		// Since the implicit 'end' subpass dependency has VK_PIPELINE_STAGE_BOTTOM_OF_PIPE_BIT in its dstStageMask,
870 		// we can't form an execution dependency chain with a specific pipeline stage. The cases that provide an explict
871 		// 'end' subpass dependency could use a specific pipline stage, but there isn't a way to distinguish between the
872 		// implicit and explicit cases here.
873 		vkd.cmdPipelineBarrier(*commandBuffer, VK_PIPELINE_STAGE_BOTTOM_OF_PIPE_BIT, VK_PIPELINE_STAGE_TRANSFER_BIT, 0u, 0u, DE_NULL, 0u, DE_NULL, 1u, &barrier);
874 	}
875 
876 	// Copy image memory to buffer
877 	{
878 		const VkImageSubresourceLayers imageSubresourceLayers =
879 		{
880 			VK_IMAGE_ASPECT_COLOR_BIT,	// VkImageAspectFlags	aspectMask
881 			0u,							// deUint32				mipLevel
882 			0u,							// deUint32				baseArrayLayer
883 			1u							// deUint32				layerCount
884 		};
885 
886 		const VkBufferImageCopy region =
887 		{
888 			0u,							// VkDeviceSize				bufferOffset
889 			0u,							// uint32_t					bufferRowLength
890 			0u,							// uint32_t					bufferImageHeight
891 			imageSubresourceLayers,		// VkImageSubresourceLayers	imageSubresource
892 			{ 0u, 0u, 0u },				// VkOffset3D				imageOffset
893 			{ m_width, m_height, 1u }	// VkExtent3D				imageExtent
894 		};
895 
896 		vkd.cmdCopyImageToBuffer(*commandBuffer, **m_images[m_renderPasses.size() - 1], VK_IMAGE_LAYOUT_TRANSFER_SRC_OPTIMAL, *m_dstBuffer, 1u, &region);
897 	}
898 
899 	// Memory barrier between copy and host access
900 	{
901 		const VkBufferMemoryBarrier barrier =
902 		{
903 			VK_STRUCTURE_TYPE_BUFFER_MEMORY_BARRIER,	// VkStructureType	sType
904 			DE_NULL,									// const void*		pNext
905 			VK_ACCESS_TRANSFER_WRITE_BIT,				// VkAccessFlags	srcAccessMask
906 			VK_ACCESS_HOST_READ_BIT,					// VkAccessFlags	dstAccessMask
907 			VK_QUEUE_FAMILY_IGNORED,					// uint32_t			srcQueueFamilyIndex
908 			VK_QUEUE_FAMILY_IGNORED,					// uint32_t			dstQueueFamilyIndex
909 			*m_dstBuffer,								// VkBuffer			buffer
910 			0u,											// VkDeviceSize		offset
911 			VK_WHOLE_SIZE								// VkDeviceSize		size
912 		};
913 
914 		vkd.cmdPipelineBarrier(*commandBuffer, VK_PIPELINE_STAGE_TRANSFER_BIT, VK_PIPELINE_STAGE_HOST_BIT, 0u, 0u, DE_NULL, 1u, &barrier, 0u, DE_NULL);
915 	}
916 
917 	endCommandBuffer(vkd, *commandBuffer);
918 	submitCommandsAndWait(vkd, m_context.getDevice(), m_context.getUniversalQueue(), *commandBuffer);
919 	invalidateMappedMemoryRange(vkd, m_context.getDevice(), m_dstBufferMemory->getMemory(), m_dstBufferMemory->getOffset(), VK_WHOLE_SIZE);
920 
921 	{
922 		const tcu::TextureFormat			format		(mapVkFormat(m_format));
923 		const void* const					ptr			(m_dstBufferMemory->getHostPtr());
924 		const tcu::ConstPixelBufferAccess	access		(format, m_width, m_height, 1, ptr);
925 		tcu::TextureLevel					reference	(format, m_width, m_height);
926 		tcu::TextureLevel					textureA	(format, m_width, m_height);
927 		tcu::TextureLevel					textureB	(format, m_width, m_height);
928 
929 		for (deUint32 renderPassNdx = 0; renderPassNdx < m_renderPasses.size(); renderPassNdx++)
930 		{
931 			// First pass renders four quads of different color, which will be blurred in the following passes
932 			if (renderPassNdx == 0)
933 			{
934 				for (deUint32 y = 0; y < m_height; y++)
935 				for (deUint32 x = 0; x < m_width; x++)
936 				{
937 					if (x <= (m_width - 1) / 2 && y <= (m_height - 1) / 2)
938 						textureA.getAccess().setPixel(Vec4(1.0f, 0.0f, 0.0f, 1.0f), x, y);
939 					else if (x > (m_width - 1) / 2 && y <= (m_height - 1) / 2)
940 						textureA.getAccess().setPixel(Vec4(0.0f, 1.0f, 0.0f, 1.0f), x, y);
941 					else if (x <= (m_width - 1) / 2 && y > (m_height - 1) / 2)
942 						textureA.getAccess().setPixel(Vec4(0.0f, 0.0f, 1.0f, 1.0f), x, y);
943 					else
944 						textureA.getAccess().setPixel(Vec4(0.0f, 0.0f, 0.0f, 1.0f), x, y);
945 				}
946 			}
947 			// Blur previous pass
948 			else
949 			{
950 				for (deUint32 y = 0; y < m_height; y++)
951 				for (deUint32 x = 0; x < m_width; x++)
952 				{
953 					Vec4 blurColor (Vec4(0.0));
954 
955 					for (deUint32 sampleNdx = 0; sampleNdx < (m_blurKernel + 1); sampleNdx++)
956 					{
957 						if (renderPassNdx % 2 == 0)
958 						{
959 							// Do a horizontal blur
960 							blurColor += 0.12f * textureB.getAccess().getPixel(deClamp32((deInt32)x - (m_blurKernel / 2) + sampleNdx, 0u, m_width - 1u), y);
961 						}
962 						else
963 						{
964 							// Do a vertical blur
965 							blurColor += 0.12f * textureA.getAccess().getPixel(x, deClamp32((deInt32)y - (m_blurKernel / 2) + sampleNdx, 0u, m_height - 1u));
966 						}
967 					}
968 
969 					renderPassNdx % 2 == 0 ? textureA.getAccess().setPixel(blurColor, x, y) : textureB.getAccess().setPixel(blurColor, x, y);
970 				}
971 			}
972 		}
973 
974 		reference = m_renderPasses.size() % 2 == 0 ? textureB : textureA;
975 
976 		{
977 			// Allow error of 4 times the minimum presentable difference
978 			const Vec4 threshold (4.0f * 1.0f / ((UVec4(1u) << tcu::getTextureFormatMantissaBitDepth(format).cast<deUint32>()) - 1u).cast<float>());
979 
980 			if (!tcu::floatThresholdCompare(m_context.getTestContext().getLog(), "", "", reference.getAccess(), access, threshold, tcu::COMPARE_LOG_ON_ERROR))
981 				m_resultCollector.fail("Compare failed.");
982 		}
983 	}
984 
985 	return tcu::TestStatus(m_resultCollector.getResult(), m_resultCollector.getMessage());
986 }
987 
988 struct SubpassTestConfig
989 {
SubpassTestConfigvkt::__anon104c10a40111::SubpassTestConfig990 		SubpassTestConfig	(VkFormat		format_,
991 							 UVec2			imageSize_,
992 							 RenderPass		renderPass_,
993 							 RenderPassType	renderPassType_)
994 		: format			(format_)
995 		, imageSize			(imageSize_)
996 		, renderPass		(renderPass_)
997 		, renderPassType	(renderPassType_)
998 	{
999 	}
1000 
1001 	VkFormat			format;
1002 	UVec2				imageSize;
1003 	RenderPass			renderPass;
1004 	RenderPassType		renderPassType;
1005 };
1006 
1007 class SubpassDependencyTestInstance : public TestInstance
1008 {
1009 public:
1010 										SubpassDependencyTestInstance	(Context&								context,
1011 																		 SubpassTestConfig						testConfig);
1012 
1013 										~SubpassDependencyTestInstance	(void);
1014 
1015 	vector<SharedPtrVkImage>			createAndAllocateImages			(const DeviceInterface&					vk,
1016 																		 VkDevice								device,
1017 																		 Allocator&								allocator,
1018 																		 vector<de::SharedPtr<Allocation> >&	imageMemories,
1019 																		 deUint32								universalQueueFamilyIndex,
1020 																		 RenderPass								renderPassInfo,
1021 																		 VkFormat								format,
1022 																		 deUint32								width,
1023 																		 deUint32								height);
1024 
1025 	vector<SharedPtrVkPipelineLayout>	createRenderPipelineLayouts		(const DeviceInterface&					vkd,
1026 																		 VkDevice								device,
1027 																		 RenderPass								renderPassInfo,
1028 																		 vector<SharedPtrVkDescriptorLayout>	descriptorSetLayouts);
1029 
1030 	vector<SharedPtrVkPipeline>			createRenderPipelines			(const DeviceInterface&					vkd,
1031 																		 VkDevice								device,
1032 																		 RenderPass								renderPassInfo,
1033 																		 VkRenderPass							renderPass,
1034 																		 vector<SharedPtrVkPipelineLayout>&		pipelineLayouts,
1035 																		 const BinaryCollection&				binaryCollection,
1036 																		 VkFormat								format,
1037 																		 deUint32								width,
1038 																		 deUint32								height);
1039 
1040 	Move<VkFramebuffer>					createFramebuffer				(const DeviceInterface&					vkd,
1041 																		 VkDevice								device,
1042 																		 RenderPass								renderPassInfo,
1043 																		 VkRenderPass							renderPass,
1044 																		 vector<SharedPtrVkImageView>&			dstImageViews,
1045 																		 deUint32								width,
1046 																		 deUint32								height);
1047 
1048 	vector<SharedPtrVkDescriptorLayout>	createDescriptorSetLayouts		(const DeviceInterface&					vkd,
1049 																		 VkDevice								device,
1050 																		 RenderPass								renderPassInfo);
1051 
1052 	vector<SharedPtrVkDescriptorSet>	createDescriptorSets			(const DeviceInterface&					vkd,
1053 																		 VkDevice								device,
1054 																		 VkFormat								format,
1055 																		 vector<SharedPtrVkDescriptorPool>&		pools,
1056 																		 vector<SharedPtrVkDescriptorLayout>&	layouts,
1057 																		 vector<SharedPtrVkImageView>&			imageViews);
1058 
1059 	tcu::TestStatus						iterate							(void);
1060 
1061 	template<typename RenderpassSubpass>
1062 	tcu::TestStatus						iterateInternal					(void);
1063 
1064 private:
1065 	const bool							m_extensionSupported;
1066 	const RenderPass					m_renderPassInfo;
1067 	const RenderPassType				m_renderPassType;
1068 
1069 	const deUint32						m_width;
1070 	const deUint32						m_height;
1071 	const VkFormat						m_format;
1072 
1073 	vector<de::SharedPtr<Allocation> >	m_imageMemories;
1074 	vector<SharedPtrVkImage>			m_images;
1075 	vector<SharedPtrVkImageView>		m_imageViews;
1076 
1077 	const Unique<VkBuffer>				m_primaryBuffer;
1078 	const Unique<VkBuffer>				m_secondaryBuffer;
1079 	const de::UniquePtr<Allocation>		m_primaryBufferMemory;
1080 	const de::UniquePtr<Allocation>		m_secondaryBufferMemory;
1081 
1082 	const Unique<VkRenderPass>			m_renderPass;
1083 	const Unique<VkFramebuffer>			m_framebuffer;
1084 
1085 	vector<SharedPtrVkDescriptorLayout>	m_subpassDescriptorSetLayouts;
1086 	vector<SharedPtrVkDescriptorPool>	m_subpassDescriptorPools;
1087 	vector<SharedPtrVkDescriptorSet>	m_subpassDescriptorSets;
1088 
1089 	vector<SharedPtrVkPipelineLayout>	m_renderPipelineLayouts;
1090 	vector<SharedPtrVkPipeline>			m_renderPipelines;
1091 
1092 	const Unique<VkCommandPool>			m_commandPool;
1093 	tcu::ResultCollector				m_resultCollector;
1094 };
1095 
SubpassDependencyTestInstance(Context & context,SubpassTestConfig testConfig)1096 SubpassDependencyTestInstance::SubpassDependencyTestInstance (Context& context, SubpassTestConfig testConfig)
1097 	: TestInstance					(context)
1098 	, m_extensionSupported			((testConfig.renderPassType == RENDERPASS_TYPE_RENDERPASS2) && context.requireDeviceFunctionality("VK_KHR_create_renderpass2"))
1099 	, m_renderPassInfo				(testConfig.renderPass)
1100 	, m_renderPassType				(testConfig.renderPassType)
1101 	, m_width						(testConfig.imageSize.x())
1102 	, m_height						(testConfig.imageSize.y())
1103 	, m_format						(testConfig.format)
1104 	, m_images						(createAndAllocateImages(context.getDeviceInterface(), context.getDevice(), context.getDefaultAllocator(), m_imageMemories, context.getUniversalQueueFamilyIndex(), m_renderPassInfo, m_format, m_width, m_height))
1105 	, m_imageViews					(createImageViews(context.getDeviceInterface(), context.getDevice(), m_images, m_format, isDepthStencilFormat(m_format) ? VK_IMAGE_ASPECT_DEPTH_BIT : VK_IMAGE_ASPECT_COLOR_BIT))
1106 	, m_primaryBuffer				(createBuffer(context.getDeviceInterface(), context.getDevice(), m_format, m_width, m_height))
1107 	, m_secondaryBuffer				(createBuffer(context.getDeviceInterface(), context.getDevice(), m_format, m_width, m_height))
1108 	, m_primaryBufferMemory			(createBufferMemory(context.getDeviceInterface(), context.getDevice(), context.getDefaultAllocator(), *m_primaryBuffer))
1109 	, m_secondaryBufferMemory		(createBufferMemory(context.getDeviceInterface(), context.getDevice(), context.getDefaultAllocator(), *m_secondaryBuffer))
1110 	, m_renderPass					(createRenderPass(context.getDeviceInterface(), context.getDevice(), m_renderPassInfo, testConfig.renderPassType))
1111 	, m_framebuffer					(createFramebuffer(context.getDeviceInterface(), context.getDevice(), m_renderPassInfo, *m_renderPass, m_imageViews, m_width, m_height))
1112 	, m_subpassDescriptorSetLayouts	(createDescriptorSetLayouts(context.getDeviceInterface(), context.getDevice(), m_renderPassInfo))
1113 	, m_subpassDescriptorPools		(createDescriptorPools(context.getDeviceInterface(), context.getDevice(), m_subpassDescriptorSetLayouts, VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT))
1114 	, m_subpassDescriptorSets		(createDescriptorSets(context.getDeviceInterface(), context.getDevice(), m_format, m_subpassDescriptorPools, m_subpassDescriptorSetLayouts, m_imageViews))
1115 	, m_renderPipelineLayouts		(createRenderPipelineLayouts(context.getDeviceInterface(), context.getDevice(), m_renderPassInfo, m_subpassDescriptorSetLayouts))
1116 	, m_renderPipelines				(createRenderPipelines(context.getDeviceInterface(), context.getDevice(), m_renderPassInfo, *m_renderPass, m_renderPipelineLayouts, context.getBinaryCollection(), m_format, m_width, m_height))
1117 	, m_commandPool					(createCommandPool(context.getDeviceInterface(), context.getDevice(), VK_COMMAND_POOL_CREATE_TRANSIENT_BIT, context.getUniversalQueueFamilyIndex()))
1118 {
1119 }
1120 
~SubpassDependencyTestInstance(void)1121 SubpassDependencyTestInstance::~SubpassDependencyTestInstance (void)
1122 {
1123 }
1124 
createAndAllocateImages(const DeviceInterface & vk,VkDevice device,Allocator & allocator,vector<de::SharedPtr<Allocation>> & imageMemories,deUint32 universalQueueFamilyIndex,RenderPass renderPassInfo,VkFormat format,deUint32 width,deUint32 height)1125 vector<SharedPtrVkImage> SubpassDependencyTestInstance::createAndAllocateImages (const DeviceInterface&					vk,
1126 																				 VkDevice								device,
1127 																				 Allocator&								allocator,
1128 																				 vector<de::SharedPtr<Allocation> >&	imageMemories,
1129 																				 deUint32								universalQueueFamilyIndex,
1130 																				 RenderPass								renderPassInfo,
1131 																				 VkFormat								format,
1132 																				 deUint32								width,
1133 																				 deUint32								height)
1134 {
1135 	// Verify format support
1136 	{
1137 		const VkFormatFeatureFlags	flags		= isDepthStencilFormat(m_format) ? VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT : VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT;
1138 		const VkFormatProperties	properties	= vk::getPhysicalDeviceFormatProperties(m_context.getInstanceInterface(), m_context.getPhysicalDevice(), format);
1139 
1140 		if ((properties.optimalTilingFeatures & flags) != flags)
1141 			TCU_THROW(NotSupportedError, "Format not supported");
1142 	}
1143 
1144 	vector<SharedPtrVkImage> images;
1145 
1146 	for (size_t imageNdx = 0; imageNdx < renderPassInfo.getAttachments().size(); imageNdx++)
1147 	{
1148 		const VkExtent3D		imageExtent		=
1149 		{
1150 			width,		// uint32_t	width
1151 			height,		// uint32_t	height
1152 			1u			// uint32_t	depth
1153 		};
1154 
1155 		VkImageUsageFlags		usage			= ((isDepthStencilFormat(format)
1156 													? VK_IMAGE_USAGE_DEPTH_STENCIL_ATTACHMENT_BIT
1157 													: VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT)
1158 													| VK_IMAGE_USAGE_TRANSFER_SRC_BIT
1159 													| VK_IMAGE_USAGE_INPUT_ATTACHMENT_BIT);
1160 
1161 		const VkImageCreateInfo	imageCreateInfo	=
1162 		{
1163 			VK_STRUCTURE_TYPE_IMAGE_CREATE_INFO,	// VkStructureType			sType
1164 			DE_NULL,								// const void*				pNext
1165 			0u,										// VkImageCreateFlags		flags
1166 			VK_IMAGE_TYPE_2D,						// VkImageType				imageType
1167 			format,									// VkFormat					format
1168 			imageExtent,							// VkExtent3D				extent
1169 			1u,										// uint32_t					mipLevels
1170 			1u,										// uint32_t					arrayLayers
1171 			VK_SAMPLE_COUNT_1_BIT,					// VkSampleCountFlagBits	samples
1172 			VK_IMAGE_TILING_OPTIMAL,				// VkImageTiling			tiling
1173 			usage,									// VkImageUsageFlags		usage
1174 			VK_SHARING_MODE_EXCLUSIVE,				// VkSharingMode			sharingMode
1175 			1u,										// uint32_t					queueFamilyIndexCount
1176 			&universalQueueFamilyIndex,				// const uint32_t*			pQueueFamilyIndices
1177 			VK_IMAGE_LAYOUT_UNDEFINED				// VkImageLayout			initialLayout
1178 		};
1179 
1180 		images.push_back(makeSharedPtr(vk::createImage(vk, device, &imageCreateInfo, DE_NULL)));
1181 		imageMemories.push_back((de::SharedPtr<Allocation>)allocator.allocate(getImageMemoryRequirements(vk, device, **images[imageNdx]), MemoryRequirement::Any).release());
1182 		VK_CHECK(vk.bindImageMemory(device, **images[imageNdx], imageMemories[imageNdx]->getMemory(), imageMemories[imageNdx]->getOffset()));
1183 	}
1184 
1185 	return images;
1186 }
1187 
createRenderPipelineLayouts(const DeviceInterface & vkd,VkDevice device,RenderPass renderPassInfo,vector<SharedPtrVkDescriptorLayout> descriptorSetLayouts)1188 vector<SharedPtrVkPipelineLayout> SubpassDependencyTestInstance::createRenderPipelineLayouts (const DeviceInterface&				vkd,
1189 																							  VkDevice								device,
1190 																							  RenderPass							renderPassInfo,
1191 																							  vector<SharedPtrVkDescriptorLayout>	descriptorSetLayouts)
1192 {
1193 	vector<SharedPtrVkPipelineLayout>	pipelineLayouts;
1194 	vector<VkDescriptorSetLayout>		descriptorSetLayoutHandles;
1195 	const size_t						descriptorSetLayoutCount	= descriptorSetLayouts.size();
1196 
1197 	for (size_t descriptorSetLayoutNdx = 0; descriptorSetLayoutNdx < descriptorSetLayoutCount; descriptorSetLayoutNdx++)
1198 		descriptorSetLayoutHandles.push_back(**descriptorSetLayouts.at(descriptorSetLayoutNdx));
1199 
1200 	for (size_t subpassNdx = 0; subpassNdx < renderPassInfo.getSubpasses().size(); subpassNdx++)
1201 	{
1202 		const VkPipelineLayoutCreateInfo createInfo =
1203 		{
1204 			VK_STRUCTURE_TYPE_PIPELINE_LAYOUT_CREATE_INFO,	// VkStructureType				sType
1205 			DE_NULL,										// const void*					pNext
1206 			(vk::VkPipelineLayoutCreateFlags)0,				// VkPipelineLayoutCreateFlags	flags
1207 			(deUint32)descriptorSetLayoutCount,				// deUint32						setLayoutCount
1208 			descriptorSetLayoutHandles.data(),				// const VkDescriptorSetLayout*	pSetLayouts
1209 			0u,												// deUint32						pushConstantRangeCount
1210 			DE_NULL											// const VkPushConstantRange*	pPushConstantRanges
1211 		};
1212 
1213 		pipelineLayouts.push_back(makeSharedPtr(createPipelineLayout(vkd, device, &createInfo)));
1214 	}
1215 
1216 	return pipelineLayouts;
1217 }
1218 
createRenderPipelines(const DeviceInterface & vkd,VkDevice device,RenderPass renderPassInfo,VkRenderPass renderPass,vector<SharedPtrVkPipelineLayout> & pipelineLayouts,const BinaryCollection & binaryCollection,VkFormat format,deUint32 width,deUint32 height)1219 vector<SharedPtrVkPipeline> SubpassDependencyTestInstance::createRenderPipelines (const DeviceInterface&				vkd,
1220 																				  VkDevice								device,
1221 																				  RenderPass							renderPassInfo,
1222 																				  VkRenderPass							renderPass,
1223 																				  vector<SharedPtrVkPipelineLayout>&	pipelineLayouts,
1224 																				  const BinaryCollection&				binaryCollection,
1225 																				  VkFormat								format,
1226 																				  deUint32								width,
1227 																				  deUint32								height)
1228 {
1229 	vector<SharedPtrVkPipeline> pipelines;
1230 
1231 	for (size_t subpassNdx = 0; subpassNdx < renderPassInfo.getSubpasses().size(); subpassNdx++)
1232 	{
1233 		const Unique<VkShaderModule>				vertexShaderModule			(createShaderModule(vkd, device, binaryCollection.get("subpass-vert-" + de::toString(subpassNdx)), 0u));
1234 		const Unique<VkShaderModule>				fragmentShaderModule		(createShaderModule(vkd, device, binaryCollection.get("subpass-frag-" + de::toString(subpassNdx)), 0u));
1235 
1236 		const VkVertexInputBindingDescription		vertexBinding0				=
1237 		{
1238 			0u,							// deUint32					binding;
1239 			sizeof(Vec4),				// deUint32					strideInBytes;
1240 			VK_VERTEX_INPUT_RATE_VERTEX	// VkVertexInputStepRate	stepRate;
1241 		};
1242 
1243 		VkVertexInputAttributeDescription			attr0						=
1244 		{
1245 			0u,								// deUint32	location;
1246 			0u,								// deUint32	binding;
1247 			VK_FORMAT_R32G32B32A32_SFLOAT,	// VkFormat	format;
1248 			0u								// deUint32	offsetInBytes;
1249 		};
1250 
1251 		const VkPipelineVertexInputStateCreateInfo	vertexInputState			=
1252 		{
1253 			VK_STRUCTURE_TYPE_PIPELINE_VERTEX_INPUT_STATE_CREATE_INFO,	// VkStructureType							sType
1254 			DE_NULL,													// const void*								pNext
1255 			(VkPipelineVertexInputStateCreateFlags)0u,					// VkPipelineVertexInputStateCreateFlags	flags
1256 			1u,															// uint32_t									vertexBindingDescriptionCount
1257 			&vertexBinding0,											// const VkVertexInputBindingDescription*	pVertexBindingDescriptions
1258 			1u,															// uint32_t									vertexAttributeDescriptionCount
1259 			&attr0														// const VkVertexInputAttributeDescription*	pVertexAttributeDescriptions
1260 		};
1261 
1262 		const VkStencilOpState						stencilOpState				=
1263 		{
1264 			VK_STENCIL_OP_KEEP,		// stencilFailOp
1265 			VK_STENCIL_OP_KEEP,		// stencilPassOp
1266 			VK_STENCIL_OP_KEEP,		// stencilDepthFailOp
1267 			VK_COMPARE_OP_ALWAYS,	// stencilCompareOp
1268 			0x0u,					// stencilCompareMask
1269 			0x0u,					// stencilWriteMask
1270 			0u						// stencilReference
1271 		};
1272 
1273 		const VkPipelineDepthStencilStateCreateInfo	depthStencilStateCreateInfo	=
1274 		{
1275 			VK_STRUCTURE_TYPE_PIPELINE_DEPTH_STENCIL_STATE_CREATE_INFO,	// VkStructureType							sType
1276 			DE_NULL,													// const void*								pNext
1277 			0u,															// VkPipelineDepthStencilStateCreateFlags	flags
1278 			VK_TRUE,													// VkBool32									depthTestEnable
1279 			VK_TRUE,													// VkBool32									depthWriteEnable
1280 			VK_COMPARE_OP_LESS_OR_EQUAL,								// VkCompareOp								depthCompareOp
1281 			VK_FALSE,													// VkBool32									depthBoundsTestEnable
1282 			VK_TRUE,													// VkBool32									stencilTestEnable
1283 			stencilOpState,												// VkStencilOpState							front
1284 			stencilOpState,												// VkStencilOpState							back
1285 			0.0f,														// float									minDepthBounds
1286 			1.0f,														// float									maxDepthBounds
1287 		};
1288 
1289 		const std::vector<VkViewport>				viewports					(1, makeViewport(tcu::UVec2(width, height)));
1290 		const std::vector<VkRect2D>					scissors					(1, makeRect2D(tcu::UVec2(width, height)));
1291 		const VkPipelineLayout						layout						(**pipelineLayouts[subpassNdx]);
1292 		const VkPipelineDepthStencilStateCreateInfo	depthStencilCreateInfo		(isDepthStencilFormat(format)
1293 																					? depthStencilStateCreateInfo
1294 																					: VkPipelineDepthStencilStateCreateInfo());
1295 
1296 		pipelines.push_back(makeSharedPtr(makeGraphicsPipeline(vkd,									// const DeviceInterface&							vk
1297 															   device,								// const VkDevice									device
1298 															   layout,								// const VkPipelineLayout							pipelineLayout
1299 															   *vertexShaderModule,					// const VkShaderModule								vertexShaderModule
1300 															   DE_NULL,								// const VkShaderModule								tessellationControlShaderModule
1301 															   DE_NULL,								// const VkShaderModule								tessellationEvalShaderModule
1302 															   DE_NULL,								// const VkShaderModule								geometryShaderModule
1303 															   *fragmentShaderModule,				// const VkShaderModule								fragmentShaderModule
1304 															   renderPass,							// const VkRenderPass								renderPass
1305 															   viewports,							// const std::vector<VkViewport>&					viewports
1306 															   scissors,							// const std::vector<VkRect2D>&						scissors
1307 															   VK_PRIMITIVE_TOPOLOGY_TRIANGLE_LIST,	// const VkPrimitiveTopology						topology
1308 															   (deUint32)subpassNdx,				// const deUint32									subpass
1309 															   0u,									// const deUint32									patchControlPoints
1310 															   &vertexInputState,					// const VkPipelineVertexInputStateCreateInfo*		vertexInputStateCreateInfo
1311 															   DE_NULL,								// const VkPipelineRasterizationStateCreateInfo*	rasterizationStateCreateInfo
1312 															   DE_NULL,								// const VkPipelineMultisampleStateCreateInfo*		multisampleStateCreateInfo
1313 															   &depthStencilCreateInfo,				// const VkPipelineDepthStencilStateCreateInfo*		depthStencilStateCreateInfo
1314 															   DE_NULL)));							// const VkPipelineDynamicStateCreateInfo*			pDynamicState
1315 	}
1316 
1317 	return pipelines;
1318 }
1319 
createFramebuffer(const DeviceInterface & vkd,VkDevice device,RenderPass renderPassInfo,VkRenderPass renderPass,vector<SharedPtrVkImageView> & dstImageViews,deUint32 width,deUint32 height)1320 Move<VkFramebuffer> SubpassDependencyTestInstance::createFramebuffer (const DeviceInterface&		vkd,
1321 																	  VkDevice						device,
1322 																	  RenderPass					renderPassInfo,
1323 																	  VkRenderPass					renderPass,
1324 																	  vector<SharedPtrVkImageView>&	dstImageViews,
1325 																	  deUint32						width,
1326 																	  deUint32						height)
1327 {
1328 	const size_t		attachmentCount		(renderPassInfo.getAttachments().size());
1329 	vector<VkImageView>	attachmentHandles;
1330 
1331 	for (deUint32 attachmentNdx = 0; attachmentNdx < attachmentCount; attachmentNdx++)
1332 		attachmentHandles.push_back(**dstImageViews.at(attachmentNdx));
1333 
1334 	const VkFramebufferCreateInfo createInfo =
1335 	{
1336 		VK_STRUCTURE_TYPE_FRAMEBUFFER_CREATE_INFO,	// VkStructureType			sType
1337 		DE_NULL,									// const void*				pNext
1338 		0u,											// VkFramebufferCreateFlags	flags
1339 		renderPass,									// VkRenderPass				renderPass
1340 		(deUint32)attachmentCount,					// uint32_t					attachmentCount
1341 		attachmentHandles.data(),					// const VkImageView*		pAttachments
1342 		width,										// uint32_t					width
1343 		height,										// uint32_t					height
1344 		1u											// uint32_t					layers
1345 	};
1346 
1347 	return vk::createFramebuffer(vkd, device, &createInfo);
1348 }
1349 
createDescriptorSetLayouts(const DeviceInterface & vkd,VkDevice device,RenderPass renderPassInfo)1350 vector<SharedPtrVkDescriptorLayout> SubpassDependencyTestInstance::createDescriptorSetLayouts (const DeviceInterface&	vkd,
1351 																							   VkDevice					device,
1352 																							   RenderPass				renderPassInfo)
1353 {
1354 	vector<SharedPtrVkDescriptorLayout> layouts;
1355 
1356 	size_t attachmentCount = renderPassInfo.getAttachments().size();
1357 
1358 	for (size_t layoutNdx = 0; layoutNdx < attachmentCount - 1; layoutNdx++)
1359 	{
1360 		const VkDescriptorSetLayoutBinding		bindings	=
1361 		{
1362 				0u,										// uint32_t				binding
1363 				VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT,	// VkDescriptorType		descriptorType
1364 				1u,										// uint32_t				descriptorCount
1365 				VK_SHADER_STAGE_FRAGMENT_BIT,			// VkShaderStageFlags	stageFlags
1366 				DE_NULL									// const VkSampler*		pImmutableSamplers
1367 		};
1368 
1369 		const VkDescriptorSetLayoutCreateInfo	createInfo	=
1370 		{
1371 			VK_STRUCTURE_TYPE_DESCRIPTOR_SET_LAYOUT_CREATE_INFO,	// VkStructureType						sType
1372 			DE_NULL,												// const void*							pNext
1373 			0u,														// VkDescriptorSetLayoutCreateFlags		flags
1374 			1u,														// uint32_t								bindingCount
1375 			&bindings												// const VkDescriptorSetLayoutBinding*	pBindings
1376 		};
1377 
1378 		layouts.push_back(makeSharedPtr(createDescriptorSetLayout(vkd, device, &createInfo)));
1379 	}
1380 
1381 	return layouts;
1382 }
1383 
createDescriptorSets(const DeviceInterface & vkd,VkDevice device,VkFormat format,vector<SharedPtrVkDescriptorPool> & pools,vector<SharedPtrVkDescriptorLayout> & layouts,vector<SharedPtrVkImageView> & imageViews)1384 vector<SharedPtrVkDescriptorSet> SubpassDependencyTestInstance::createDescriptorSets (const DeviceInterface&				vkd,
1385 																					  VkDevice								device,
1386 																					  VkFormat								format,
1387 																					  vector<SharedPtrVkDescriptorPool>&	pools,
1388 																					  vector<SharedPtrVkDescriptorLayout>&	layouts,
1389 																					  vector<SharedPtrVkImageView>&			imageViews)
1390 {
1391 	vector<SharedPtrVkDescriptorSet> descriptorSets;
1392 
1393 	for (size_t setNdx = 0; setNdx < layouts.size(); setNdx++)
1394 	{
1395 		const VkDescriptorSetAllocateInfo allocateInfo =
1396 		{
1397 			VK_STRUCTURE_TYPE_DESCRIPTOR_SET_ALLOCATE_INFO,	// VkStructureType				sType
1398 			DE_NULL,										// const void*					pNext
1399 			**pools[setNdx],								// VkDescriptorPool				descriptorPool
1400 			1u,												// uint32_t						descriptorSetCount
1401 			&**layouts[setNdx]								// const VkDescriptorSetLayout*	pSetLayouts
1402 		};
1403 
1404 		descriptorSets.push_back(makeSharedPtr(allocateDescriptorSet(vkd, device, &allocateInfo)));
1405 
1406 		{
1407 			VkImageLayout imageLayout				= isDepthStencilFormat(format)
1408 														? VK_IMAGE_LAYOUT_DEPTH_STENCIL_READ_ONLY_OPTIMAL
1409 														: VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL;
1410 
1411 			const VkDescriptorImageInfo	imageInfo	=
1412 			{
1413 				DE_NULL,				// VkSampler		sampler
1414 				**imageViews[setNdx],	// VkImageView		imageView
1415 				imageLayout				// VkImageLayout	imageLayout
1416 			};
1417 
1418 			const VkWriteDescriptorSet	write		=
1419 			{
1420 				VK_STRUCTURE_TYPE_WRITE_DESCRIPTOR_SET,	// VkStructureType					sType
1421 				DE_NULL,								// const void*						pNext
1422 				**descriptorSets[setNdx],				// VkDescriptorSet					dstSet
1423 				0u,										// uint32_t							dstBinding
1424 				0u,										// uint32_t							dstArrayElement
1425 				1u,										// uint32_t							descriptorCount
1426 				VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT,	// VkDescriptorType					descriptorType
1427 				&imageInfo,								// const VkDescriptorImageInfo*		pImageInfo
1428 				DE_NULL,								// const VkDescriptorBufferInfo*	pBufferInfo
1429 				DE_NULL									// const VkBufferView*				pTexelBufferView
1430 			};
1431 
1432 			vkd.updateDescriptorSets(device, 1u, &write, 0u, DE_NULL);
1433 		}
1434 	}
1435 
1436 	return descriptorSets;
1437 }
1438 
iterate(void)1439 tcu::TestStatus SubpassDependencyTestInstance::iterate (void)
1440 {
1441 	switch (m_renderPassType)
1442 	{
1443 		case RENDERPASS_TYPE_LEGACY:
1444 			return iterateInternal<RenderpassSubpass1>();
1445 		case RENDERPASS_TYPE_RENDERPASS2:
1446 			return iterateInternal<RenderpassSubpass2>();
1447 		default:
1448 			TCU_THROW(InternalError, "Impossible");
1449 	}
1450 }
1451 
1452 template<typename RenderpassSubpass>
iterateInternal(void)1453 tcu::TestStatus SubpassDependencyTestInstance::iterateInternal (void)
1454 {
1455 	de::Random											rand					(5);
1456 	const DeviceInterface&								vkd						(m_context.getDeviceInterface());
1457 	const Unique<VkCommandBuffer>						commandBuffer			(allocateCommandBuffer(vkd, m_context.getDevice(), *m_commandPool, VK_COMMAND_BUFFER_LEVEL_PRIMARY));
1458 	const typename RenderpassSubpass::SubpassBeginInfo	subpassBeginInfo		(DE_NULL, VK_SUBPASS_CONTENTS_INLINE);
1459 	const typename RenderpassSubpass::SubpassEndInfo	subpassEndInfo			(DE_NULL);
1460 	const size_t										attachmentCount			(m_renderPassInfo.getAttachments().size());
1461 	const size_t										subpassCount			(m_renderPassInfo.getSubpasses().size());
1462 	vector<VkClearValue>								clearValues;
1463 	vector<Vec4>										vertexData;
1464 
1465 	beginCommandBuffer(vkd, *commandBuffer);
1466 
1467 	// Transition stencil aspects to the final layout directly.
1468 	if (isDepthStencilFormat(m_format))
1469 	{
1470 		const VkImageSubresourceRange imageSubresourceRange =
1471 		{
1472 			VK_IMAGE_ASPECT_STENCIL_BIT,	// VkImageAspectFlags	aspectMask
1473 			0u,								// uint32_t				baseMipLevel
1474 			1u,								// uint32_t				levelCount
1475 			0u,								// uint32_t				baseArrayLayer
1476 			1u								// uint32_t				layerCount
1477 		};
1478 
1479 		VkImageMemoryBarrier barrier =
1480 		{
1481 			VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER,				// VkStructureType			sType
1482 			DE_NULL,											// const void*				pNext
1483 			0u,													// VkAccessFlags			srcAccessMask
1484 			VK_ACCESS_TRANSFER_READ_BIT,						// VkAccessFlags			dstAccessMask
1485 			VK_IMAGE_LAYOUT_UNDEFINED,							// VkImageLayout			oldLayout
1486 			VK_IMAGE_LAYOUT_DEPTH_STENCIL_READ_ONLY_OPTIMAL,	// VkImageLayout			newLayout
1487 			VK_QUEUE_FAMILY_IGNORED,							// uint32_t					srcQueueFamilyIndex
1488 			VK_QUEUE_FAMILY_IGNORED,							// uint32_t					dstQueueFamilyIndex
1489 			DE_NULL,											// VkImage					image
1490 			imageSubresourceRange								// VkImageSubresourceRange	subresourceRange
1491 		};
1492 
1493 		for (deUint32 attachmentNdx = 0; attachmentNdx < attachmentCount; ++attachmentNdx)
1494 		{
1495 			barrier.image = **m_images[attachmentNdx];
1496 			vkd.cmdPipelineBarrier(*commandBuffer, VK_PIPELINE_STAGE_BOTTOM_OF_PIPE_BIT, VK_PIPELINE_STAGE_TRANSFER_BIT, 0u, 0u, DE_NULL, 0u, DE_NULL, 1u, &barrier);
1497 		}
1498 	}
1499 
1500 	// Begin render pass
1501 	{
1502 		VkRect2D					renderArea			=
1503 		{
1504 			{ 0u, 0u },				// VkOffset2D	offset
1505 			{ m_width, m_height }	// VkExtent2D	extent
1506 		};
1507 
1508 		for (size_t attachmentNdx = 0; attachmentNdx < attachmentCount; attachmentNdx++)
1509 			clearValues.push_back(isDepthStencilFormat(m_format) ? makeClearValueDepthStencil(1.0f, 255u) : makeClearValueColor(Vec4(1.0f, 0.0f, 0.0f, 1.0f)));
1510 
1511 		const VkRenderPassBeginInfo	beginInfo			=
1512 		{
1513 			VK_STRUCTURE_TYPE_RENDER_PASS_BEGIN_INFO,	// VkStructureType		sType
1514 			DE_NULL,									// const void*			pNext
1515 			*m_renderPass,								// VkRenderPass			renderPass
1516 			*m_framebuffer,								// VkFramebuffer		framebuffer
1517 			renderArea,									// VkRect2D				renderArea
1518 			(deUint32)attachmentCount,					// uint32_t				clearValueCount
1519 			clearValues.data()							// const VkClearValue*	pClearValues
1520 		};
1521 
1522 		RenderpassSubpass::cmdBeginRenderPass(vkd, *commandBuffer, &beginInfo, &subpassBeginInfo);
1523 	}
1524 
1525 	// Generate vertices for 128 triangles with pseudorandom positions and depths values
1526 	for (int primitiveNdx = 0; primitiveNdx < 128; primitiveNdx++)
1527 	{
1528 		float primitiveDepth = rand.getFloat();
1529 
1530 		for (int vertexNdx = 0; vertexNdx < 3; vertexNdx++)
1531 		{
1532 			float x = 2.0f * rand.getFloat() - 1.0f;
1533 			float y = 2.0f * rand.getFloat() - 1.0f;
1534 
1535 			vertexData.push_back(Vec4(x, y, primitiveDepth, 1.0f));
1536 		}
1537 	}
1538 
1539 	const size_t										singleVertexDataSize	= sizeof(Vec4);
1540 	const size_t										vertexCount				= vertexData.size();
1541 	const size_t										vertexDataSize			= vertexCount * singleVertexDataSize;
1542 	const deUint32										queueFamilyIndices		= m_context.getUniversalQueueFamilyIndex();
1543 
1544 	const VkBufferCreateInfo							vertexBufferParams		=
1545 	{
1546 		VK_STRUCTURE_TYPE_BUFFER_CREATE_INFO,	//	VkStructureType		sType;
1547 		DE_NULL,								//	const void*			pNext;
1548 		0u,										//	VkBufferCreateFlags	flags;
1549 		(VkDeviceSize)vertexDataSize,			//	VkDeviceSize		size;
1550 		VK_BUFFER_USAGE_VERTEX_BUFFER_BIT,		//	VkBufferUsageFlags	usage;
1551 		VK_SHARING_MODE_EXCLUSIVE,				//	VkSharingMode		sharingMode;
1552 		1u,										//	deUint32			queueFamilyCount;
1553 		&queueFamilyIndices,					//	const deUint32*		pQueueFamilyIndices;
1554 	};
1555 
1556 	const Unique<VkBuffer>								vertexBuffer			(createBuffer(vkd, m_context.getDevice(), &vertexBufferParams));
1557 	const de::UniquePtr<Allocation>						vertexBufferMemory		(m_context.getDefaultAllocator().allocate(getBufferMemoryRequirements(vkd, m_context.getDevice(), *vertexBuffer), MemoryRequirement::HostVisible));
1558 
1559 	VK_CHECK(vkd.bindBufferMemory(m_context.getDevice(), *vertexBuffer, vertexBufferMemory->getMemory(), vertexBufferMemory->getOffset()));
1560 
1561 	const VkDeviceSize bindingOffset = 0;
1562 	vkd.cmdBindVertexBuffers(*commandBuffer, 0u, 1u, &vertexBuffer.get(), &bindingOffset);
1563 
1564 	for (size_t subpassNdx = 0; subpassNdx < subpassCount; subpassNdx++)
1565 	{
1566 		if (subpassNdx > 0)
1567 		{
1568 			RenderpassSubpass::cmdNextSubpass(vkd, *commandBuffer, &subpassBeginInfo, &subpassEndInfo);
1569 			vkd.cmdBindDescriptorSets(*commandBuffer, VK_PIPELINE_BIND_POINT_GRAPHICS, **m_renderPipelineLayouts[subpassNdx], 0, 1, &**m_subpassDescriptorSets[subpassNdx - 1], 0, DE_NULL);
1570 		}
1571 
1572 		vkd.cmdBindPipeline(*commandBuffer, VK_PIPELINE_BIND_POINT_GRAPHICS, **m_renderPipelines[subpassNdx]);
1573 
1574 		if (subpassNdx == 0)
1575 		{
1576 			// Upload vertex data
1577 			{
1578 				void* vertexBufPtr = vertexBufferMemory->getHostPtr();
1579 				deMemcpy(vertexBufPtr, vertexData.data(), vertexDataSize);
1580 				flushAlloc(vkd, m_context.getDevice(), *vertexBufferMemory);
1581 			}
1582 
1583 			vkd.cmdDraw(*commandBuffer, (deUint32)vertexData.size(), 1u, 0u, 0u);
1584 		}
1585 		else
1586 			vkd.cmdDraw(*commandBuffer, 6u, 1u, 0u, 0u);
1587 	}
1588 
1589 	RenderpassSubpass::cmdEndRenderPass(vkd, *commandBuffer, &subpassEndInfo);
1590 
1591 	// Memory barrier between rendering and copy
1592 	{
1593 		const VkImageAspectFlags	imageAspectFlags		= isDepthStencilFormat(m_format)
1594 																? VK_IMAGE_ASPECT_DEPTH_BIT | VK_IMAGE_ASPECT_STENCIL_BIT : VK_IMAGE_ASPECT_COLOR_BIT;
1595 		const VkAccessFlags			srcAccessMask			= isDepthStencilFormat(m_format)
1596 																? VK_ACCESS_DEPTH_STENCIL_ATTACHMENT_WRITE_BIT : VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT;
1597 		const VkImageLayout			oldLayout				= isDepthStencilFormat(m_format)
1598 																? VK_IMAGE_LAYOUT_DEPTH_STENCIL_READ_ONLY_OPTIMAL : VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL;
1599 		const VkPipelineStageFlags	srcStageMask			= isDepthStencilFormat(m_format)
1600 																? VK_PIPELINE_STAGE_LATE_FRAGMENT_TESTS_BIT : VK_PIPELINE_STAGE_COLOR_ATTACHMENT_OUTPUT_BIT;
1601 
1602 		VkImageSubresourceRange		imageSubresourceRange	=
1603 		{
1604 			imageAspectFlags,	// VkImageAspectFlags	aspectMask
1605 			0u,					// uint32_t				baseMipLevel
1606 			1u,					// uint32_t				levelCount
1607 			0u,					// uint32_t				baseArrayLayer
1608 			1u					// uint32_t				layerCount
1609 		};
1610 
1611 		const VkImageMemoryBarrier	barrier					=
1612 		{
1613 			VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER,	// VkStructureType			sType
1614 			DE_NULL,								// const void*				pNext
1615 			srcAccessMask,							// VkAccessFlags			srcAccessMask
1616 			VK_ACCESS_TRANSFER_READ_BIT,			// VkAccessFlags			dstAccessMask
1617 			oldLayout,								// VkImageLayout			oldLayout
1618 			VK_IMAGE_LAYOUT_TRANSFER_SRC_OPTIMAL,	// VkImageLayout			newLayout
1619 			VK_QUEUE_FAMILY_IGNORED,				// uint32_t					srcQueueFamilyIndex
1620 			VK_QUEUE_FAMILY_IGNORED,				// uint32_t					dstQueueFamilyIndex
1621 			**m_images[attachmentCount - 1],		// VkImage					image
1622 			imageSubresourceRange					// VkImageSubresourceRange	subresourceRange
1623 		};
1624 
1625 		vkd.cmdPipelineBarrier(*commandBuffer, srcStageMask, VK_PIPELINE_STAGE_TRANSFER_BIT, 0u, 0u, DE_NULL, 0u, DE_NULL, 1u, &barrier);
1626 	}
1627 
1628 	// Copy image memory to buffer
1629 	{
1630 		if (isDepthStencilFormat(m_format))
1631 		{
1632 			// Copy depth
1633 			const VkImageSubresourceLayers subresourceLayersDepth	=
1634 			{
1635 				VK_IMAGE_ASPECT_DEPTH_BIT,	// VkImageAspectFlags	aspectMask
1636 				0u,							// deUint32				mipLevel
1637 				0u,							// deUint32				baseArrayLayer
1638 				1u							// deUint32				layerCount
1639 			};
1640 
1641 			const VkBufferImageCopy			regionDepth				=
1642 			{
1643 				0u,							// VkDeviceSize				bufferOffset
1644 				0u,							// uint32_t					bufferRowLength
1645 				0u,							// uint32_t					bufferImageHeight
1646 				subresourceLayersDepth,		// VkImageSubresourceLayers	imageSubresource
1647 				{ 0u, 0u, 0u },				// VkOffset3D				imageOffset
1648 				{ m_width, m_height, 1u }	// VkExtent3D				imageExtent
1649 			};
1650 
1651 			vkd.cmdCopyImageToBuffer(*commandBuffer, **m_images[attachmentCount - 1], VK_IMAGE_LAYOUT_TRANSFER_SRC_OPTIMAL, *m_primaryBuffer, 1u, &regionDepth);
1652 
1653 			// Copy stencil
1654 			const VkImageSubresourceLayers subresourceLayersStencil	=
1655 			{
1656 				VK_IMAGE_ASPECT_STENCIL_BIT,	// VkImageAspectFlags	aspectMask
1657 				0u,								// deUint32				mipLevel
1658 				0u,								// deUint32				baseArrayLayer
1659 				1u								// deUint32				layerCount
1660 			};
1661 
1662 			const VkBufferImageCopy			regionStencil			=
1663 			{
1664 				0u,							// VkDeviceSize				bufferOffset
1665 				0u,							// uint32_t					bufferRowLength
1666 				0u,							// uint32_t					bufferImageHeight
1667 				subresourceLayersStencil,	// VkImageSubresourceLayers	imageSubresource
1668 				{ 0u, 0u, 0u },				// VkOffset3D				imageOffset
1669 				{ m_width, m_height, 1u }	// VkExtent3D				imageExtent
1670 			};
1671 
1672 			vkd.cmdCopyImageToBuffer(*commandBuffer, **m_images[attachmentCount - 1], VK_IMAGE_LAYOUT_TRANSFER_SRC_OPTIMAL, *m_secondaryBuffer, 1u, &regionStencil);
1673 		}
1674 		else
1675 		{
1676 			// Copy color
1677 			const VkImageSubresourceLayers imageSubresourceLayers	=
1678 			{
1679 				VK_IMAGE_ASPECT_COLOR_BIT,	// VkImageAspectFlags	aspectMask
1680 				0u,							// deUint32				mipLevel
1681 				0u,							// deUint32				baseArrayLayer
1682 				1u							// deUint32				layerCount
1683 			};
1684 
1685 			const VkBufferImageCopy			region					=
1686 			{
1687 				0u,							// VkDeviceSize				bufferOffset
1688 				0u,							// uint32_t					bufferRowLength
1689 				0u,							// uint32_t					bufferImageHeight
1690 				imageSubresourceLayers,		// VkImageSubresourceLayers	imageSubresource
1691 				{ 0u, 0u, 0u },				// VkOffset3D				imageOffset
1692 				{ m_width, m_height, 1u }	// VkExtent3D				imageExtent
1693 			};
1694 
1695 			vkd.cmdCopyImageToBuffer(*commandBuffer, **m_images[attachmentCount - 1], VK_IMAGE_LAYOUT_TRANSFER_SRC_OPTIMAL, *m_primaryBuffer, 1u, &region);
1696 		}
1697 	}
1698 
1699 	// Memory barrier between copy and host access
1700 	{
1701 		const VkBufferMemoryBarrier barrier		=
1702 		{
1703 			VK_STRUCTURE_TYPE_BUFFER_MEMORY_BARRIER,	// VkStructureType	sType
1704 			DE_NULL,									// const void*		pNext
1705 			VK_ACCESS_TRANSFER_WRITE_BIT,				// VkAccessFlags	srcAccessMask
1706 			VK_ACCESS_HOST_READ_BIT,					// VkAccessFlags	dstAccessMask
1707 			VK_QUEUE_FAMILY_IGNORED,					// uint32_t			srcQueueFamilyIndex
1708 			VK_QUEUE_FAMILY_IGNORED,					// uint32_t			dstQueueFamilyIndex
1709 			*m_primaryBuffer,							// VkBuffer			buffer
1710 			0u,											// VkDeviceSize		offset
1711 			VK_WHOLE_SIZE								// VkDeviceSize		size
1712 		};
1713 
1714 		vkd.cmdPipelineBarrier(*commandBuffer, VK_PIPELINE_STAGE_TRANSFER_BIT, VK_PIPELINE_STAGE_HOST_BIT, 0u, 0u, DE_NULL, 1u, &barrier, 0u, DE_NULL);
1715 
1716 		if (isDepthStencilFormat(m_format))
1717 		{
1718 			const VkBufferMemoryBarrier stencilBarrier =
1719 			{
1720 				VK_STRUCTURE_TYPE_BUFFER_MEMORY_BARRIER,	// VkStructureType	sType
1721 				DE_NULL,									// const void*		pNext
1722 				VK_ACCESS_TRANSFER_WRITE_BIT,				// VkAccessFlags	srcAccessMask
1723 				VK_ACCESS_HOST_READ_BIT,					// VkAccessFlags	dstAccessMask
1724 				VK_QUEUE_FAMILY_IGNORED,					// uint32_t			srcQueueFamilyIndex
1725 				VK_QUEUE_FAMILY_IGNORED,					// uint32_t			dstQueueFamilyIndex
1726 				*m_secondaryBuffer,							// VkBuffer			buffer
1727 				0u,											// VkDeviceSize		offset
1728 				VK_WHOLE_SIZE								// VkDeviceSize		size
1729 			};
1730 
1731 			vkd.cmdPipelineBarrier(*commandBuffer, VK_PIPELINE_STAGE_TRANSFER_BIT, VK_PIPELINE_STAGE_HOST_BIT, 0u, 0u, DE_NULL, 1u, &stencilBarrier, 0u, DE_NULL);
1732 		}
1733 	}
1734 
1735 	endCommandBuffer(vkd, *commandBuffer);
1736 	submitCommandsAndWait(vkd, m_context.getDevice(), m_context.getUniversalQueue(), *commandBuffer);
1737 	invalidateMappedMemoryRange(vkd, m_context.getDevice(), m_primaryBufferMemory->getMemory(), m_primaryBufferMemory->getOffset(), VK_WHOLE_SIZE);
1738 	invalidateMappedMemoryRange(vkd, m_context.getDevice(), m_secondaryBufferMemory->getMemory(), m_secondaryBufferMemory->getOffset(), VK_WHOLE_SIZE);
1739 
1740 	// Verify result
1741 	{
1742 		const tcu::TextureFormat format (mapVkFormat(m_format));
1743 
1744 		if (isDepthStencilFormat(m_format))
1745 		{
1746 			const void* const					ptrDepth				(m_primaryBufferMemory->getHostPtr());
1747 			const void* const					ptrStencil				(m_secondaryBufferMemory->getHostPtr());
1748 			tcu::TextureLevel					reference				(format, m_width, m_height);
1749 			tcu::TextureLevel					colorBuffer				(mapVkFormat(VK_FORMAT_R8G8B8A8_UNORM), m_width, m_height);
1750 			const tcu::ConstPixelBufferAccess	resultDepthAccess		(getDepthCopyFormat(m_format), m_width, m_height, 1, ptrDepth);
1751 			const tcu::ConstPixelBufferAccess	resultStencilAccess		(getStencilCopyFormat(m_format), m_width, m_height, 1, ptrStencil);
1752 			const PixelBufferAccess				referenceDepthAccess	(tcu::getEffectiveDepthStencilAccess(reference.getAccess(), tcu::Sampler::MODE_DEPTH));
1753 			const PixelBufferAccess				referenceStencilAccess	(tcu::getEffectiveDepthStencilAccess(reference.getAccess(), tcu::Sampler::MODE_STENCIL));
1754 
1755 			tcu::clearDepth(referenceDepthAccess, 1.0f);
1756 			tcu::clearStencil(referenceStencilAccess, 255);
1757 
1758 			// Setup and run reference renderer
1759 			{
1760 				const DepthVertShader					vertShader;
1761 				const DepthFragShader					fragShader;
1762 				const rr::Renderer						renderer;
1763 				const rr::Program						program				(&vertShader, &fragShader);
1764 				const rr::MultisamplePixelBufferAccess	depthBuffer			(rr::MultisamplePixelBufferAccess::fromSinglesampleAccess(referenceDepthAccess));
1765 				const rr::MultisamplePixelBufferAccess	colorBufferAccess	(rr::MultisamplePixelBufferAccess::fromSinglesampleAccess(colorBuffer.getAccess()));
1766 				const rr::RenderTarget					renderTarget		(rr::MultisamplePixelBufferAccess(colorBufferAccess), depthBuffer, rr::MultisamplePixelBufferAccess());
1767 				const rr::PrimitiveType					primitiveType		(rr::PRIMITIVETYPE_TRIANGLES);
1768 				const rr::PrimitiveList					primitiveList		(rr::PrimitiveList(primitiveType, (deUint32)vertexData.size(), 0));
1769 				rr::RenderState							renderState			((rr::ViewportState(depthBuffer)), m_context.getDeviceProperties().limits.subPixelPrecisionBits);
1770 
1771 				const rr::VertexAttrib vertices			= rr::VertexAttrib(rr::VERTEXATTRIBTYPE_FLOAT, 4, sizeof(tcu::Vec4), 0, &vertexData[0]);
1772 
1773 				renderState.fragOps.depthTestEnabled	= DE_TRUE;
1774 				renderState.fragOps.depthFunc			= rr::TESTFUNC_LEQUAL;
1775 
1776 				renderer.draw(rr::DrawCommand(renderState,
1777 											  renderTarget,
1778 											  program,
1779 											  1u,
1780 											  &vertices,
1781 											  primitiveList));
1782 			}
1783 
1784 			for (size_t subpassNdx = 0; subpassNdx < subpassCount - 1; subpassNdx++)
1785 			{
1786 				for (int y = 0; y < reference.getHeight(); y++)
1787 				for (int x = 0; x < reference.getWidth(); x++)
1788 					reference.getAccess().setPixDepth(reference.getAccess().getPixDepth(x, y) - 0.02f, x, y);
1789 			}
1790 
1791 			// Threshold size of subpass count multiplied by the minimum representable difference is allowed for depth compare
1792 			const float							depthThreshold			((float)subpassCount * (1.0f / ((UVec4(1u) << tcu::getTextureFormatMantissaBitDepth(
1793 																			resultDepthAccess.getFormat()).cast<deUint32>()) - 1u).cast<float>().x()));
1794 
1795 			if (!verifyDepth(m_context, reference.getAccess(), resultDepthAccess, depthThreshold))
1796 				m_resultCollector.fail("Depth compare failed.");
1797 
1798 			if (!verifyStencil(m_context, referenceStencilAccess, resultStencilAccess))
1799 				m_resultCollector.fail("Stencil compare failed.");
1800 		}
1801 		else
1802 			DE_FATAL("Not implemented");
1803 	}
1804 
1805 	return tcu::TestStatus(m_resultCollector.getResult(), m_resultCollector.getMessage());
1806 }
1807 
1808 struct SubpassSelfDependencyBackwardsTestConfig
1809 {
SubpassSelfDependencyBackwardsTestConfigvkt::__anon104c10a40111::SubpassSelfDependencyBackwardsTestConfig1810 		SubpassSelfDependencyBackwardsTestConfig	(VkFormat		format_,
1811 													 UVec2			imageSize_,
1812 													 RenderPassType	renderPassType_)
1813 		: format			(format_)
1814 		, imageSize			(imageSize_)
1815 		, renderPassType	(renderPassType_)
1816 	{
1817 	}
1818 
1819 	VkFormat		format;
1820 	UVec2			imageSize;
1821 	RenderPassType	renderPassType;
1822 };
1823 
1824 class SubpassSelfDependencyBackwardsTestInstance : public TestInstance
1825 {
1826 public:
1827 							SubpassSelfDependencyBackwardsTestInstance	(Context&									context,
1828 																		 SubpassSelfDependencyBackwardsTestConfig	testConfig);
1829 
1830 							~SubpassSelfDependencyBackwardsTestInstance	(void);
1831 
1832 	tcu::TestStatus			iterate										(void);
1833 
1834 	template<typename RenderpassSubpass>
1835 	tcu::TestStatus			iterateInternal								(void);
1836 
1837 private:
1838 	const bool				m_extensionSupported;
1839 	const bool				m_featuresSupported;
1840 	const RenderPassType	m_renderPassType;
1841 
1842 	const deUint32			m_width;
1843 	const deUint32			m_height;
1844 	const VkFormat			m_format;
1845 	tcu::ResultCollector	m_resultCollector;
1846 };
1847 
SubpassSelfDependencyBackwardsTestInstance(Context & context,SubpassSelfDependencyBackwardsTestConfig testConfig)1848 SubpassSelfDependencyBackwardsTestInstance::SubpassSelfDependencyBackwardsTestInstance (Context& context, SubpassSelfDependencyBackwardsTestConfig testConfig)
1849 	: TestInstance			(context)
1850 	, m_extensionSupported	((testConfig.renderPassType == RENDERPASS_TYPE_RENDERPASS2) && context.requireDeviceFunctionality("VK_KHR_create_renderpass2"))
1851 	, m_featuresSupported	(context.requireDeviceCoreFeature(DEVICE_CORE_FEATURE_GEOMETRY_SHADER))
1852 	, m_renderPassType		(testConfig.renderPassType)
1853 	, m_width				(testConfig.imageSize.x())
1854 	, m_height				(testConfig.imageSize.y())
1855 	, m_format				(testConfig.format)
1856 {
1857 }
1858 
~SubpassSelfDependencyBackwardsTestInstance(void)1859 SubpassSelfDependencyBackwardsTestInstance::~SubpassSelfDependencyBackwardsTestInstance (void)
1860 {
1861 }
1862 
iterate(void)1863 tcu::TestStatus SubpassSelfDependencyBackwardsTestInstance::iterate (void)
1864 {
1865 	switch (m_renderPassType)
1866 	{
1867 		case RENDERPASS_TYPE_LEGACY:
1868 			return iterateInternal<RenderpassSubpass1>();
1869 		case RENDERPASS_TYPE_RENDERPASS2:
1870 			return iterateInternal<RenderpassSubpass2>();
1871 		default:
1872 			TCU_THROW(InternalError, "Impossible");
1873 	}
1874 }
1875 
1876 template<typename RenderpassSubpass>
iterateInternal(void)1877 tcu::TestStatus SubpassSelfDependencyBackwardsTestInstance::iterateInternal (void)
1878 {
1879 	de::Random											rand					(5);
1880 	const DeviceInterface&								vkd						(m_context.getDeviceInterface());
1881 	const VkDevice										device					= m_context.getDevice();
1882 	const deUint32										queueFamilyIndex		= m_context.getUniversalQueueFamilyIndex();
1883 	const Unique<VkCommandPool>							commandPool				(createCommandPool(vkd, m_context.getDevice(), VK_COMMAND_POOL_CREATE_TRANSIENT_BIT, queueFamilyIndex));
1884 	const Unique<VkCommandBuffer>						commandBuffer			(allocateCommandBuffer(vkd, m_context.getDevice(), *commandPool, VK_COMMAND_BUFFER_LEVEL_PRIMARY));
1885 	const typename RenderpassSubpass::SubpassBeginInfo	subpassBeginInfo		(DE_NULL, VK_SUBPASS_CONTENTS_INLINE);
1886 	const typename RenderpassSubpass::SubpassEndInfo	subpassEndInfo			(DE_NULL);
1887 	vector<Vec4>										vertexData;
1888 	Move<VkImage>										outputImage;
1889 	de::MovePtr<Allocation>								outputImageAllocation;
1890 	Move<VkImageView>									outputImageView;
1891 	Move<VkPipelineLayout>								pipelineLayout;
1892 	Move<VkPipeline>									renderPipeline;
1893 	Move<VkFramebuffer>									framebuffer;
1894 	Move<VkRenderPass>									renderPass;
1895 	Move<VkBuffer>										indirectBuffer;
1896 	de::MovePtr<Allocation>								indirectBufferMemory;
1897 	Move<VkBuffer>										resultBuffer;
1898 	de::MovePtr<Allocation>								resultBufferMemory;
1899 	const VkDeviceSize									indirectBufferSize		= 4 * sizeof(deUint32);
1900 	Move<VkBuffer>										vertexBuffer;
1901 	de::MovePtr<Allocation>								vertexBufferMemory;
1902 
1903 	// Create output image.
1904 	{
1905 		const VkExtent3D		imageExtent		=
1906 		{
1907 			m_width,	// uint32_t	width
1908 			m_height,	// uint32_t	height
1909 			1u			// uint32_t	depth
1910 		};
1911 
1912 		VkImageUsageFlags		usage			= VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT | VK_IMAGE_USAGE_TRANSFER_SRC_BIT;
1913 
1914 		const VkImageCreateInfo	imageCreateInfo	=
1915 		{
1916 			VK_STRUCTURE_TYPE_IMAGE_CREATE_INFO,	// VkStructureType			sType
1917 			DE_NULL,								// const void*				pNext
1918 			0u,										// VkImageCreateFlags		flags
1919 			VK_IMAGE_TYPE_2D,						// VkImageType				imageType
1920 			m_format,								// VkFormat					format
1921 			imageExtent,							// VkExtent3D				extent
1922 			1u,										// uint32_t					mipLevels
1923 			1u,										// uint32_t					arrayLayers
1924 			VK_SAMPLE_COUNT_1_BIT,					// VkSampleCountFlagBits	samples
1925 			VK_IMAGE_TILING_OPTIMAL,				// VkImageTiling			tiling
1926 			usage,									// VkImageUsageFlags		usage
1927 			VK_SHARING_MODE_EXCLUSIVE,				// VkSharingMode			sharingMode
1928 			1u,										// uint32_t					queueFamilyIndexCount
1929 			&queueFamilyIndex,						// const uint32_t*			pQueueFamilyIndices
1930 			VK_IMAGE_LAYOUT_UNDEFINED				// VkImageLayout			initialLayout
1931 		};
1932 
1933 		outputImage = createImage(vkd, device, &imageCreateInfo, DE_NULL);
1934 		outputImageAllocation = m_context.getDefaultAllocator().allocate(getImageMemoryRequirements(vkd, device, *outputImage), MemoryRequirement::Any);
1935 		VK_CHECK(vkd.bindImageMemory(device, *outputImage, outputImageAllocation->getMemory(), outputImageAllocation->getOffset()));
1936 	}
1937 
1938 	// Create indirect buffer and initialize.
1939 	{
1940 		const VkBufferUsageFlags	bufferUsage	(VK_BUFFER_USAGE_INDIRECT_BUFFER_BIT | VK_BUFFER_USAGE_STORAGE_BUFFER_BIT);
1941 		const VkBufferCreateInfo	bufferCreateInfo	=
1942 		{
1943 			VK_STRUCTURE_TYPE_BUFFER_CREATE_INFO,	// VkStructureType		sType
1944 			DE_NULL,								// const void*			pNext
1945 			0u,										// VkBufferCreateFlags	flags
1946 			indirectBufferSize,						// VkDeviceSize			size
1947 			bufferUsage,							// VkBufferUsageFlags	usage
1948 			VK_SHARING_MODE_EXCLUSIVE,				// VkSharingMode		sharingMode
1949 			0u,										// uint32_t				queueFamilyIndexCount
1950 			DE_NULL									// const uint32_t*		pQueueFamilyIndices
1951 		};
1952 
1953 		indirectBuffer			= createBuffer(vkd, device, &bufferCreateInfo);
1954 		indirectBufferMemory	= createBufferMemory(vkd, device, m_context.getDefaultAllocator(), *indirectBuffer);
1955 
1956 		VkDrawIndirectCommand	drawIndirectCommand	=
1957 		{
1958 			64u,	// deUint32	vertexCount
1959 			1u,		// deUint32	instanceCount
1960 			0u,		// deUint32	firstVertex
1961 			0u,		// deUint32	firstInstance
1962 		};
1963 
1964 		deMemcpy(indirectBufferMemory->getHostPtr(), (void*)&drawIndirectCommand, sizeof(VkDrawIndirectCommand));
1965 		flushAlloc(vkd, device, *indirectBufferMemory);
1966 	}
1967 
1968 	// Create result buffer.
1969 	{
1970 		resultBuffer		= createBuffer(vkd, device, m_format, m_width, m_height);
1971 		resultBufferMemory	= createBufferMemory(vkd, device, m_context.getDefaultAllocator(), *resultBuffer);
1972 	}
1973 
1974 	// Create descriptor set layout.
1975 	Unique<VkDescriptorSetLayout>	descriptorSetLayout	(DescriptorSetLayoutBuilder()
1976 			.addSingleBinding(VK_DESCRIPTOR_TYPE_STORAGE_BUFFER, VK_SHADER_STAGE_GEOMETRY_BIT)
1977 			.build(vkd, device));
1978 	// Create descriptor pool.
1979 	Unique<VkDescriptorPool>		descriptorPool		(DescriptorPoolBuilder()
1980 			.addType(VK_DESCRIPTOR_TYPE_STORAGE_BUFFER, 1u)
1981 			.build(vkd, device, VK_DESCRIPTOR_POOL_CREATE_FREE_DESCRIPTOR_SET_BIT, 1u));
1982 	// Create descriptor set.
1983 	Unique<VkDescriptorSet>			descriptorSet		(makeDescriptorSet(vkd, device, *descriptorPool, *descriptorSetLayout));
1984 
1985 	// Update descriptor set information.
1986 	{
1987 		VkDescriptorBufferInfo descIndirectBuffer = makeDescriptorBufferInfo(*indirectBuffer, 0, indirectBufferSize);
1988 
1989 		DescriptorSetUpdateBuilder()
1990 			.writeSingle(*descriptorSet, DescriptorSetUpdateBuilder::Location::binding(0u), VK_DESCRIPTOR_TYPE_STORAGE_BUFFER, &descIndirectBuffer)
1991 			.update(vkd, device);
1992 	}
1993 
1994 	// Create render pipeline layout.
1995 	{
1996 		const VkPipelineLayoutCreateInfo pipelineLayoutCreateInfo =
1997 		{
1998 			VK_STRUCTURE_TYPE_PIPELINE_LAYOUT_CREATE_INFO,	// VkStructureType				sType
1999 			DE_NULL,										// const void*					pNext
2000 			(vk::VkPipelineLayoutCreateFlags)0,				// VkPipelineLayoutCreateFlags	flags
2001 			1u,												// deUint32						setLayoutCount
2002 			&*descriptorSetLayout,							// const VkDescriptorSetLayout*	pSetLayouts
2003 			0u,												// deUint32						pushConstantRangeCount
2004 			DE_NULL											// const VkPushConstantRange*	pPushConstantRanges
2005 		};
2006 
2007 		pipelineLayout = createPipelineLayout(vkd, device, &pipelineLayoutCreateInfo);
2008 	}
2009 
2010 	// Create render pass.
2011 	{
2012 		vector<Attachment>			attachments;
2013 		vector<AttachmentReference>	colorAttachmentReferences;
2014 
2015 		attachments.push_back(Attachment(m_format, VK_SAMPLE_COUNT_1_BIT, VK_ATTACHMENT_LOAD_OP_CLEAR, VK_ATTACHMENT_STORE_OP_STORE, VK_ATTACHMENT_LOAD_OP_DONT_CARE, VK_ATTACHMENT_STORE_OP_DONT_CARE, VK_IMAGE_LAYOUT_UNDEFINED, VK_IMAGE_LAYOUT_COLOR_ATTACHMENT_OPTIMAL));
2016 		colorAttachmentReferences.push_back(AttachmentReference(0u, VK_IMAGE_LAYOUT_COLOR_ATTACHMENT_OPTIMAL));
2017 
2018 		const vector<Subpass>		subpasses	(1, Subpass(VK_PIPELINE_BIND_POINT_GRAPHICS, 0u, vector<AttachmentReference>(), colorAttachmentReferences, vector<AttachmentReference>(), AttachmentReference(VK_ATTACHMENT_UNUSED, VK_IMAGE_LAYOUT_GENERAL), vector<deUint32>()));
2019 		vector<SubpassDependency>	deps;
2020 
2021 		deps.push_back(SubpassDependency(0u,									// deUint32				srcPass
2022 										 0u,									// deUint32				dstPass
2023 										 VK_PIPELINE_STAGE_GEOMETRY_SHADER_BIT,	// VkPipelineStageFlags	srcStageMask
2024 										 VK_PIPELINE_STAGE_DRAW_INDIRECT_BIT,	// VkPipelineStageFlags	dstStageMask
2025 										 VK_ACCESS_SHADER_WRITE_BIT,			// VkAccessFlags		srcAccessMask
2026 										 VK_ACCESS_INDIRECT_COMMAND_READ_BIT,	// VkAccessFlags		dstAccessMask
2027 										 0));									// VkDependencyFlags	flags
2028 
2029 		renderPass = createRenderPass(vkd, device, RenderPass(attachments, subpasses, deps), m_renderPassType);
2030 	}
2031 
2032 	// Create render pipeline.
2033 	{
2034 		const Unique<VkShaderModule>				vertexShaderModule			(createShaderModule(vkd, device, m_context.getBinaryCollection().get("vert"), 0u));
2035 		const Unique<VkShaderModule>				geometryShaderModule		(createShaderModule(vkd, device, m_context.getBinaryCollection().get("geom"), 0u));
2036 		const Unique<VkShaderModule>				fragmentShaderModule		(createShaderModule(vkd, device, m_context.getBinaryCollection().get("frag"), 0u));
2037 
2038 		const VkVertexInputBindingDescription		vertexBinding0				=
2039 		{
2040 			0u,							// deUint32					binding;
2041 			sizeof(Vec4),				// deUint32					strideInBytes;
2042 			VK_VERTEX_INPUT_RATE_VERTEX	// VkVertexInputStepRate	stepRate;
2043 		};
2044 
2045 		VkVertexInputAttributeDescription			attr0						=
2046 		{
2047 			0u,								// deUint32	location;
2048 			0u,								// deUint32	binding;
2049 			VK_FORMAT_R32G32B32A32_SFLOAT,	// VkFormat	format;
2050 			0u								// deUint32	offsetInBytes;
2051 		};
2052 
2053 		const VkPipelineVertexInputStateCreateInfo	vertexInputState			=
2054 		{
2055 			VK_STRUCTURE_TYPE_PIPELINE_VERTEX_INPUT_STATE_CREATE_INFO,	// VkStructureType							sType
2056 			DE_NULL,													// const void*								pNext
2057 			(VkPipelineVertexInputStateCreateFlags)0u,					// VkPipelineVertexInputStateCreateFlags	flags
2058 			1u,															// uint32_t									vertexBindingDescriptionCount
2059 			&vertexBinding0,											// const VkVertexInputBindingDescription*	pVertexBindingDescriptions
2060 			1u,															// uint32_t									vertexAttributeDescriptionCount
2061 			&attr0														// const VkVertexInputAttributeDescription*	pVertexAttributeDescriptions
2062 		};
2063 
2064 		const std::vector<VkViewport>				viewports					(1, makeViewport(tcu::UVec2(m_width, m_height)));
2065 		const std::vector<VkRect2D>					scissors					(1, makeRect2D(tcu::UVec2(m_width, m_height)));
2066 
2067 		renderPipeline = makeGraphicsPipeline(vkd,	// const DeviceInterface&						vk
2068 				device,								// const VkDevice								device
2069 				*pipelineLayout,					// const VkPipelineLayout						pipelineLayout
2070 				*vertexShaderModule,				// const VkShaderModule							vertexShaderModule
2071 				DE_NULL,							// const VkShaderModule							tessellationControlShaderModule
2072 				DE_NULL,							// const VkShaderModule							tessellationEvalShaderModule
2073 				*geometryShaderModule,				// const VkShaderModule							geometryShaderModule
2074 				*fragmentShaderModule,				// const VkShaderModule							fragmentShaderModule
2075 				*renderPass,						// const VkRenderPass							renderPass
2076 				viewports,							// const std::vector<VkViewport>&				viewports
2077 				scissors,							// const std::vector<VkRect2D>&					scissors
2078 				VK_PRIMITIVE_TOPOLOGY_POINT_LIST,	// const VkPrimitiveTopology					topology
2079 				0u,									// const deUint32								subpass
2080 				0u,									// const deUint32								patchControlPoints
2081 				&vertexInputState);					// const VkPipelineVertexInputStateCreateInfo*	vertexInputStateCreateInfo
2082 	}
2083 
2084 	// Create framebuffer.
2085 	{
2086 		const VkImageViewCreateInfo imageViewCreateInfo =
2087 		{
2088 			VK_STRUCTURE_TYPE_IMAGE_VIEW_CREATE_INFO,	// VkStructureType			sType
2089 			DE_NULL,									// const void*				pNext
2090 			0u,											// VkImageViewCreateFlags	flags
2091 			*outputImage,								// VkImage					image
2092 			VK_IMAGE_VIEW_TYPE_2D,						// VkImageViewType			viewType
2093 			m_format,									// VkFormat					format
2094 			makeComponentMappingRGBA(),					// VkComponentMapping		components
2095 			{											// VkImageSubresourceRange	subresourceRange
2096 				VK_IMAGE_ASPECT_COLOR_BIT,
2097 				0u,
2098 				1u,
2099 				0u,
2100 				1u
2101 			}
2102 		};
2103 		outputImageView	= createImageView(vkd, device, &imageViewCreateInfo);
2104 
2105 		const VkFramebufferCreateInfo framebufferCreateInfo =
2106 		{
2107 			VK_STRUCTURE_TYPE_FRAMEBUFFER_CREATE_INFO,	// VkStructureType			sType
2108 			DE_NULL,									// const void*				pNext
2109 			0u,											// VkFramebufferCreateFlags	flags
2110 			*renderPass,								// VkRenderPass				renderPass
2111 			1u,											// uint32_t					attachmentCount
2112 			&*outputImageView,							// const VkImageView*		pAttachments
2113 			m_width,									// uint32_t					width
2114 			m_height,									// uint32_t					height
2115 			1u											// uint32_t					layers
2116 		};
2117 
2118 		framebuffer = vk::createFramebuffer(vkd, device, &framebufferCreateInfo);
2119 	}
2120 
2121 	// Generate random point locations (pixel centered to make reference comparison easier).
2122 	for (int primitiveNdx = 0; primitiveNdx < 128; primitiveNdx++)
2123 	{
2124 		vertexData.push_back(Vec4((float)((rand.getUint32() % m_width) * 2) / (float)m_width - 1.0f,
2125 				(float)((rand.getUint32() % m_height) * 2) / (float)m_height - 1.0f,
2126 				1.0f, 1.0f));
2127 	}
2128 
2129 	// Upload vertex data.
2130 	{
2131 		const size_t				vertexDataSize		= vertexData.size() * sizeof(Vec4);
2132 
2133 		const VkBufferCreateInfo	vertexBufferParams	=
2134 		{
2135 			VK_STRUCTURE_TYPE_BUFFER_CREATE_INFO,	//	VkStructureType		sType;
2136 			DE_NULL,								//	const void*			pNext;
2137 			0u,										//	VkBufferCreateFlags	flags;
2138 			(VkDeviceSize)vertexDataSize,			//	VkDeviceSize		size;
2139 			VK_BUFFER_USAGE_VERTEX_BUFFER_BIT,		//	VkBufferUsageFlags	usage;
2140 			VK_SHARING_MODE_EXCLUSIVE,				//	VkSharingMode		sharingMode;
2141 			1u,										//	deUint32			queueFamilyCount;
2142 			&queueFamilyIndex,						//	const deUint32*		pQueueFamilyIndices;
2143 		};
2144 
2145 		vertexBuffer		= createBuffer(vkd, m_context.getDevice(), &vertexBufferParams);
2146 		vertexBufferMemory	= createBufferMemory(vkd, device, m_context.getDefaultAllocator(), *vertexBuffer);
2147 
2148 		deMemcpy(vertexBufferMemory->getHostPtr(), vertexData.data(), vertexDataSize);
2149 		flushAlloc(vkd, device, *vertexBufferMemory);
2150 	}
2151 
2152 	beginCommandBuffer(vkd, *commandBuffer);
2153 	vkd.cmdBindPipeline(*commandBuffer, vk::VK_PIPELINE_BIND_POINT_GRAPHICS, *renderPipeline);
2154 	vkd.cmdBindDescriptorSets(*commandBuffer, vk::VK_PIPELINE_BIND_POINT_GRAPHICS, *pipelineLayout, 0u, 1u, &*descriptorSet, 0u, DE_NULL);
2155 
2156 	// Begin render pass.
2157 	{
2158 		VkRect2D					renderArea	=
2159 		{
2160 			{ 0u, 0u },				// VkOffset2D	offset
2161 			{ m_width, m_height }	// VkExtent2D	extent
2162 		};
2163 
2164 		VkClearValue				clearValue	= makeClearValueColor(Vec4(0.0f, 1.0f, 0.0f, 1.0f));
2165 
2166 		const VkRenderPassBeginInfo	beginInfo	=
2167 		{
2168 			VK_STRUCTURE_TYPE_RENDER_PASS_BEGIN_INFO,	// VkStructureType		sType
2169 			DE_NULL,									// const void*			pNext
2170 			*renderPass,								// VkRenderPass			renderPass
2171 			*framebuffer,								// VkFramebuffer		framebuffer
2172 			renderArea,									// VkRect2D				renderArea
2173 			1u,											// uint32_t				clearValueCount
2174 			&clearValue									// const VkClearValue*	pClearValues
2175 		};
2176 
2177 		RenderpassSubpass::cmdBeginRenderPass(vkd, *commandBuffer, &beginInfo, &subpassBeginInfo);
2178 	}
2179 
2180 	const VkDeviceSize bindingOffset = 0;
2181 	vkd.cmdBindVertexBuffers(*commandBuffer, 0u, 1u, &vertexBuffer.get(), &bindingOffset);
2182 
2183 	vkd.cmdBindPipeline(*commandBuffer, VK_PIPELINE_BIND_POINT_GRAPHICS, *renderPipeline);
2184 
2185 	// The first indirect draw: Draw the first 64 items.
2186 	vkd.cmdDrawIndirect(*commandBuffer, *indirectBuffer, 0u, 1u, 0u);
2187 
2188 	// Barrier for indirect buffer.
2189 	{
2190 		const VkMemoryBarrier barrier =
2191 		{
2192 			VK_STRUCTURE_TYPE_MEMORY_BARRIER,	// VkStructureType	sType
2193 			DE_NULL,							// const void*		pNext
2194 			VK_ACCESS_SHADER_WRITE_BIT,			// VkAccessFlags	srcAccessMask
2195 			VK_ACCESS_INDIRECT_COMMAND_READ_BIT	// VkAccessFlags	dstAccessMask
2196 		};
2197 
2198 		vkd.cmdPipelineBarrier(*commandBuffer, VK_PIPELINE_STAGE_GEOMETRY_SHADER_BIT, VK_PIPELINE_STAGE_DRAW_INDIRECT_BIT, 0u, 1u, &barrier, 0u, DE_NULL, 0u, DE_NULL);
2199 	}
2200 
2201 	// The second indirect draw: Draw the last 64 items.
2202 	vkd.cmdDrawIndirect(*commandBuffer, *indirectBuffer, 0u, 1u, 0u);
2203 
2204 	RenderpassSubpass::cmdEndRenderPass(vkd, *commandBuffer, &subpassEndInfo);
2205 
2206 	// Copy results to a buffer.
2207 	copyImageToBuffer(vkd, *commandBuffer, *outputImage, *resultBuffer, tcu::IVec2(m_width, m_height));
2208 
2209 	endCommandBuffer(vkd, *commandBuffer);
2210 	submitCommandsAndWait(vkd, m_context.getDevice(), m_context.getUniversalQueue(), *commandBuffer);
2211 	invalidateMappedMemoryRange(vkd, m_context.getDevice(), resultBufferMemory->getMemory(), resultBufferMemory->getOffset(), VK_WHOLE_SIZE);
2212 
2213 	// Verify result.
2214 	{
2215 		const tcu::TextureFormat format (mapVkFormat(m_format));
2216 
2217 		const void* const					ptrResult		(resultBufferMemory->getHostPtr());
2218 		tcu::TextureLevel					reference		(format, m_width, m_height);
2219 		const tcu::ConstPixelBufferAccess	resultAccess	(format, m_width, m_height, 1, ptrResult);
2220 		const PixelBufferAccess				referenceAccess	(reference.getAccess());
2221 
2222 
2223 		// Setup and run reference renderer.
2224 		{
2225 			vector<Vec4>							triangles;
2226 			const float								offset			= 0.03f;
2227 
2228 			// Convert points into triangles to have quads similar to what GPU is producing from geometry shader.
2229 			for (size_t vtxIdx = 0; vtxIdx < vertexData.size(); vtxIdx++)
2230 			{
2231 				triangles.push_back(vertexData[vtxIdx] + tcu::Vec4(-offset, offset, 0.0f, 0.0f));
2232 				triangles.push_back(vertexData[vtxIdx] + tcu::Vec4(-offset, -offset, 0.0f, 0.0f));
2233 				triangles.push_back(vertexData[vtxIdx] + tcu::Vec4(offset, offset, 0.0f, 0.0f));
2234 
2235 				triangles.push_back(vertexData[vtxIdx] + tcu::Vec4(-offset, -offset, 0.0f, 0.0f));
2236 				triangles.push_back(vertexData[vtxIdx] + tcu::Vec4(offset, offset, 0.0f, 0.0f));
2237 				triangles.push_back(vertexData[vtxIdx] + tcu::Vec4(offset, -offset, 0.0f, 0.0f));
2238 			}
2239 
2240 			const SelfDependencyBackwardsVertShader	vertShader;
2241 			const SelfDependencyBackwardsFragShader	fragShader;
2242 			const rr::Renderer						renderer;
2243 			const rr::Program						program			(&vertShader, &fragShader);
2244 			const rr::MultisamplePixelBufferAccess	msAccess		(rr::MultisamplePixelBufferAccess::fromSinglesampleAccess(referenceAccess));
2245 			const rr::RenderTarget					renderTarget	(msAccess);
2246 			const rr::PrimitiveType					primitiveType	(rr::PRIMITIVETYPE_TRIANGLES);
2247 			const rr::PrimitiveList					primitiveList	(rr::PrimitiveList(primitiveType, (deUint32)triangles.size(), 0));
2248 			const rr::ViewportState					viewportState	(msAccess);
2249 			const rr::RenderState					renderState		(viewportState, m_context.getDeviceProperties().limits.subPixelPrecisionBits);
2250 			const rr::VertexAttrib					vertices		= rr::VertexAttrib(rr::VERTEXATTRIBTYPE_FLOAT, 4, sizeof(tcu::Vec4), 0, &triangles[0]);
2251 
2252 			tcu::clear(referenceAccess, tcu::UVec4(0, 255, 0, 255));
2253 			renderer.draw(rr::DrawCommand(renderState, renderTarget, program, 1u, &vertices, primitiveList));
2254 		}
2255 
2256 		if (!tcu::floatThresholdCompare(m_context.getTestContext().getLog(),	// log
2257 										"Color buffer",							// imageSetName
2258 										"",										// imageSetDesc
2259 										referenceAccess,						// reference
2260 										resultAccess,							// result
2261 										Vec4(0.01f),							// threshold
2262 										tcu::COMPARE_LOG_RESULT))				// logMode
2263 		{
2264 			m_resultCollector.fail("Image compare failed.");
2265 		}
2266 	}
2267 
2268 	return tcu::TestStatus(m_resultCollector.getResult(), m_resultCollector.getMessage());
2269 }
2270 
2271 struct SeparateChannelsTestConfig
2272 {
SeparateChannelsTestConfigvkt::__anon104c10a40111::SeparateChannelsTestConfig2273 		SeparateChannelsTestConfig	(VkFormat		format_,
2274 									 RenderPassType	renderPassType_)
2275 		: format			(format_)
2276 		, renderPassType	(renderPassType_)
2277 	{
2278 	}
2279 
2280 	VkFormat		format;
2281 	RenderPassType	renderPassType;
2282 };
2283 
2284 class SeparateChannelsTestInstance : public TestInstance
2285 {
2286 public:
2287 							SeparateChannelsTestInstance	(Context&					context,
2288 															 SeparateChannelsTestConfig	testConfig);
2289 
2290 							~SeparateChannelsTestInstance	(void);
2291 
2292 	tcu::TestStatus			iterate							(void);
2293 
2294 	template<typename RenderpassSubpass>
2295 	tcu::TestStatus			iterateInternal					(void);
2296 
2297 private:
2298 	const bool				m_extensionSupported;
2299 	const RenderPassType	m_renderPassType;
2300 
2301 	const deUint32			m_width;
2302 	const deUint32			m_height;
2303 	const VkFormat			m_format;
2304 	tcu::ResultCollector	m_resultCollector;
2305 };
2306 
SeparateChannelsTestInstance(Context & context,SeparateChannelsTestConfig testConfig)2307 SeparateChannelsTestInstance::SeparateChannelsTestInstance (Context& context, SeparateChannelsTestConfig testConfig)
2308 	: TestInstance			(context)
2309 	, m_extensionSupported	((testConfig.renderPassType == RENDERPASS_TYPE_RENDERPASS2) && context.requireDeviceFunctionality("VK_KHR_create_renderpass2"))
2310 	, m_renderPassType		(testConfig.renderPassType)
2311 	, m_width				(256u)
2312 	, m_height				(256u)
2313 	, m_format				(testConfig.format)
2314 {
2315 }
2316 
~SeparateChannelsTestInstance(void)2317 SeparateChannelsTestInstance::~SeparateChannelsTestInstance (void)
2318 {
2319 }
2320 
iterate(void)2321 tcu::TestStatus SeparateChannelsTestInstance::iterate (void)
2322 {
2323 	switch (m_renderPassType)
2324 	{
2325 		case RENDERPASS_TYPE_LEGACY:
2326 			return iterateInternal<RenderpassSubpass1>();
2327 		case RENDERPASS_TYPE_RENDERPASS2:
2328 			return iterateInternal<RenderpassSubpass2>();
2329 		default:
2330 			TCU_THROW(InternalError, "Impossible");
2331 	}
2332 }
2333 
2334 template<typename RenderpassSubpass>
iterateInternal(void)2335 tcu::TestStatus SeparateChannelsTestInstance::iterateInternal (void)
2336 {
2337 	const DeviceInterface&								vkd						(m_context.getDeviceInterface());
2338 	const VkDevice										device					= m_context.getDevice();
2339 	const VkQueue										queue					= m_context.getUniversalQueue();
2340 	const deUint32										queueFamilyIndex		= m_context.getUniversalQueueFamilyIndex();
2341 	const Unique<VkCommandPool>							commandPool				(createCommandPool(vkd, m_context.getDevice(), VK_COMMAND_POOL_CREATE_TRANSIENT_BIT, queueFamilyIndex));
2342 	const Unique<VkCommandBuffer>						commandBuffer			(allocateCommandBuffer(vkd, m_context.getDevice(), *commandPool, VK_COMMAND_BUFFER_LEVEL_PRIMARY));
2343 	const typename RenderpassSubpass::SubpassBeginInfo	subpassBeginInfo		(DE_NULL, VK_SUBPASS_CONTENTS_INLINE);
2344 	const typename RenderpassSubpass::SubpassEndInfo	subpassEndInfo			(DE_NULL);
2345 	const bool											isDSFormat				= isDepthStencilFormat(m_format);
2346 	const VkFormat										colorFormat				= isDSFormat ? VK_FORMAT_R8G8B8A8_UNORM : m_format;
2347 	const tcu::Vec4										colorInitValues[2]		= { tcu::Vec4(0.2f, 0.4f, 0.1f, 1.0f), tcu::Vec4(0.5f, 0.4f, 0.7f, 1.0f) };
2348 	const float											depthInitValues[2]		= { 0.3f, 0.7f };
2349 	const deUint32										stencilInitValues[2]	= { 2u, 100u };
2350 	const deUint32										stencilRefValue			= 200u;
2351 	const deUint32										tileSize				= 32u;
2352 	vector<Vec4>										vertexData;
2353 	Move<VkImage>										colorImage;
2354 	de::MovePtr<Allocation>								colorImageAllocation;
2355 	// When testing color formats the same attachment is used as input and output. This requires general layout to be used.
2356 	const VkImageLayout									colorImageLayout		= isDSFormat ? VK_IMAGE_LAYOUT_COLOR_ATTACHMENT_OPTIMAL : VK_IMAGE_LAYOUT_GENERAL;
2357 	Move<VkImage>										dsImage;
2358 	de::MovePtr<Allocation>								dsImageAllocation;
2359 	Move<VkImageView>									outputImageView;
2360 	Move<VkImageView>									inputImageView;
2361 	Move<VkImageView>									dsImageView;
2362 	Move<VkPipelineLayout>								pipelineLayout;
2363 	Move<VkPipeline>									renderPipeline;
2364 	Move<VkFramebuffer>									framebuffer;
2365 	Move<VkRenderPass>									renderPass;
2366 	Move<VkBuffer>										resultBuffer0;
2367 	de::MovePtr<Allocation>								resultBuffer0Memory;
2368 	Move<VkBuffer>										resultBuffer1;
2369 	de::MovePtr<Allocation>								resultBuffer1Memory;
2370 	Move<VkBuffer>										vertexBuffer;
2371 	de::MovePtr<Allocation>								vertexBufferMemory;
2372 
2373 	const VkExtent3D		imageExtent		=
2374 	{
2375 		m_width,	// deUint32	width
2376 		m_height,	// deUint32	height
2377 		1u			// deUint32	depth
2378 	};
2379 
2380 	// Create image used for both input and output in case of color test, and as a color output in depth/stencil test.
2381 	{
2382 		VkImageUsageFlags		usage			= VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT | VK_IMAGE_USAGE_INPUT_ATTACHMENT_BIT | VK_IMAGE_USAGE_TRANSFER_SRC_BIT | VK_IMAGE_USAGE_TRANSFER_DST_BIT;
2383 
2384 		const VkImageCreateInfo	imageCreateInfo	=
2385 		{
2386 			VK_STRUCTURE_TYPE_IMAGE_CREATE_INFO,	// VkStructureType			sType
2387 			DE_NULL,								// const void*				pNext
2388 			0u,										// VkImageCreateFlags		flags
2389 			VK_IMAGE_TYPE_2D,						// VkImageType				imageType
2390 			colorFormat,							// VkFormat					format
2391 			imageExtent,							// VkExtent3D				extent
2392 			1u,										// uint32_t					mipLevels
2393 			1u,										// uint32_t					arrayLayers
2394 			VK_SAMPLE_COUNT_1_BIT,					// VkSampleCountFlagBits	samples
2395 			VK_IMAGE_TILING_OPTIMAL,				// VkImageTiling			tiling
2396 			usage,									// VkImageUsageFlags		usage
2397 			VK_SHARING_MODE_EXCLUSIVE,				// VkSharingMode			sharingMode
2398 			1u,										// uint32_t					queueFamilyIndexCount
2399 			&queueFamilyIndex,						// const uint32_t*			pQueueFamilyIndices
2400 			VK_IMAGE_LAYOUT_UNDEFINED				// VkImageLayout			initialLayout
2401 		};
2402 
2403 		checkImageSupport(m_context.getInstanceInterface(), m_context.getPhysicalDevice(), imageCreateInfo);
2404 
2405 		colorImage = createImage(vkd, device, &imageCreateInfo, DE_NULL);
2406 		colorImageAllocation = m_context.getDefaultAllocator().allocate(getImageMemoryRequirements(vkd, device, *colorImage), MemoryRequirement::Any);
2407 		VK_CHECK(vkd.bindImageMemory(device, *colorImage, colorImageAllocation->getMemory(), colorImageAllocation->getOffset()));
2408 	}
2409 
2410 	// Create depth/stencil image
2411 	if (isDSFormat)
2412 	{
2413 		VkImageUsageFlags		usage			= VK_IMAGE_USAGE_DEPTH_STENCIL_ATTACHMENT_BIT | VK_IMAGE_USAGE_TRANSFER_SRC_BIT | VK_IMAGE_USAGE_TRANSFER_DST_BIT;
2414 
2415 		const VkImageCreateInfo	imageCreateInfo	=
2416 		{
2417 			VK_STRUCTURE_TYPE_IMAGE_CREATE_INFO,	// VkStructureType			sType
2418 			DE_NULL,								// const void*				pNext
2419 			0u,										// VkImageCreateFlags		flags
2420 			VK_IMAGE_TYPE_2D,						// VkImageType				imageType
2421 			m_format,								// VkFormat					format
2422 			imageExtent,							// VkExtent3D				extent
2423 			1u,										// uint32_t					mipLevels
2424 			1u,										// uint32_t					arrayLayers
2425 			VK_SAMPLE_COUNT_1_BIT,					// VkSampleCountFlagBits	samples
2426 			VK_IMAGE_TILING_OPTIMAL,				// VkImageTiling			tiling
2427 			usage,									// VkImageUsageFlags		usage
2428 			VK_SHARING_MODE_EXCLUSIVE,				// VkSharingMode			sharingMode
2429 			1u,										// uint32_t					queueFamilyIndexCount
2430 			&queueFamilyIndex,						// const uint32_t*			pQueueFamilyIndices
2431 			VK_IMAGE_LAYOUT_UNDEFINED				// VkImageLayout			initialLayout
2432 		};
2433 
2434 		checkImageSupport(m_context.getInstanceInterface(), m_context.getPhysicalDevice(), imageCreateInfo);
2435 
2436 		dsImage = createImage(vkd, device, &imageCreateInfo, DE_NULL);
2437 		dsImageAllocation = m_context.getDefaultAllocator().allocate(getImageMemoryRequirements(vkd, device, *dsImage), MemoryRequirement::Any);
2438 		VK_CHECK(vkd.bindImageMemory(device, *dsImage, dsImageAllocation->getMemory(), dsImageAllocation->getOffset()));
2439 
2440 		// Initialize depth / stencil image
2441 		initDepthStencilImageChessboardPattern(vkd, device, queue, queueFamilyIndex, m_context.getDefaultAllocator(), *dsImage, m_format, depthInitValues[0], depthInitValues[1], stencilInitValues[0], stencilInitValues[1], m_width, m_height, tileSize, VK_IMAGE_LAYOUT_UNDEFINED, VK_IMAGE_LAYOUT_DEPTH_STENCIL_ATTACHMENT_OPTIMAL, VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT);
2442 	}
2443 
2444 	// Initialize color image
2445 	initColorImageChessboardPattern(vkd, device, queue, queueFamilyIndex, m_context.getDefaultAllocator(), *colorImage, colorFormat, colorInitValues[0], colorInitValues[1], m_width, m_height, tileSize, VK_IMAGE_LAYOUT_UNDEFINED, colorImageLayout, VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT);
2446 
2447 	// Create color image views
2448 	{
2449 		const VkImageViewCreateInfo imageViewCreateInfo =
2450 		{
2451 			VK_STRUCTURE_TYPE_IMAGE_VIEW_CREATE_INFO,	// VkStructureType			sType
2452 			DE_NULL,									// const void*				pNext
2453 			0u,											// VkImageViewCreateFlags	flags
2454 			*colorImage,								// VkImage					image
2455 			VK_IMAGE_VIEW_TYPE_2D,						// VkImageViewType			viewType
2456 			colorFormat,								// VkFormat					format
2457 			makeComponentMappingRGBA(),					// VkComponentMapping		components
2458 			{											// VkImageSubresourceRange	subresourceRange
2459 				VK_IMAGE_ASPECT_COLOR_BIT,
2460 				0u,
2461 				1u,
2462 				0u,
2463 				1u
2464 			}
2465 		};
2466 
2467 		if (!isDSFormat) inputImageView	= createImageView(vkd, device, &imageViewCreateInfo);
2468 		outputImageView	= createImageView(vkd, device, &imageViewCreateInfo);
2469 	}
2470 
2471 	// Create depth/stencil image view
2472 	if (isDSFormat)
2473 	{
2474 		const VkImageViewCreateInfo imageViewCreateInfo =
2475 		{
2476 			VK_STRUCTURE_TYPE_IMAGE_VIEW_CREATE_INFO,	// VkStructureType			sType
2477 			DE_NULL,									// const void*				pNext
2478 			0u,											// VkImageViewCreateFlags	flags
2479 			*dsImage,									// VkImage					image
2480 			VK_IMAGE_VIEW_TYPE_2D,						// VkImageViewType			viewType
2481 			m_format,									// VkFormat					format
2482 			makeComponentMappingRGBA(),					// VkComponentMapping		components
2483 			{											// VkImageSubresourceRange	subresourceRange
2484 				VK_IMAGE_ASPECT_DEPTH_BIT | VK_IMAGE_ASPECT_STENCIL_BIT,
2485 				0u,
2486 				1u,
2487 				0u,
2488 				1u
2489 			}
2490 		};
2491 
2492 		dsImageView	= createImageView(vkd, device, &imageViewCreateInfo);
2493 	}
2494 
2495 	// Create result buffers.
2496 	{
2497 		resultBuffer0		= createBuffer(vkd, device, m_format, m_width, m_height);
2498 		resultBuffer0Memory	= createBufferMemory(vkd, device, m_context.getDefaultAllocator(), *resultBuffer0);
2499 		resultBuffer1		= createBuffer(vkd, device, m_format, m_width, m_height);
2500 		resultBuffer1Memory	= createBufferMemory(vkd, device, m_context.getDefaultAllocator(), *resultBuffer1);
2501 	}
2502 
2503 	// Create descriptor set layout.
2504 	Unique<VkDescriptorSetLayout>	descriptorSetLayout	(DescriptorSetLayoutBuilder()
2505 			.addSingleBinding(VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT, VK_SHADER_STAGE_FRAGMENT_BIT)
2506 			.build(vkd, device));
2507 	// Create descriptor pool.
2508 	Unique<VkDescriptorPool>		descriptorPool		(DescriptorPoolBuilder()
2509 			.addType(VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT, 1u)
2510 			.build(vkd, device, VK_DESCRIPTOR_POOL_CREATE_FREE_DESCRIPTOR_SET_BIT, 1u));
2511 	// Create descriptor set.
2512 	Unique<VkDescriptorSet>			descriptorSet		(makeDescriptorSet(vkd, device, *descriptorPool, *descriptorSetLayout));
2513 
2514 	// Update descriptor set information.
2515 	if (!isDSFormat)
2516 	{
2517 		VkDescriptorImageInfo descInputAttachment = makeDescriptorImageInfo(DE_NULL, *inputImageView, VK_IMAGE_LAYOUT_GENERAL);
2518 
2519 		DescriptorSetUpdateBuilder()
2520 			.writeSingle(*descriptorSet, DescriptorSetUpdateBuilder::Location::binding(0u), VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT, &descInputAttachment)
2521 			.update(vkd, device);
2522 	}
2523 
2524 	// Create render pipeline layout.
2525 	{
2526 		const VkPipelineLayoutCreateInfo pipelineLayoutCreateInfo =
2527 		{
2528 			VK_STRUCTURE_TYPE_PIPELINE_LAYOUT_CREATE_INFO,	// VkStructureType				sType
2529 			DE_NULL,										// const void*					pNext
2530 			(vk::VkPipelineLayoutCreateFlags)0,				// VkPipelineLayoutCreateFlags	flags
2531 			1u,												// deUint32						setLayoutCount
2532 			&*descriptorSetLayout,							// const VkDescriptorSetLayout*	pSetLayouts
2533 			0u,												// deUint32						pushConstantRangeCount
2534 			DE_NULL											// const VkPushConstantRange*	pPushConstantRanges
2535 		};
2536 
2537 		pipelineLayout = createPipelineLayout(vkd, device, &pipelineLayoutCreateInfo);
2538 	}
2539 
2540 	// Create render pass.
2541 	{
2542 		vector<Attachment>			attachments;
2543 		vector<AttachmentReference>	colorAttachmentReferences;
2544 		vector<AttachmentReference>	inputAttachmentReferences;
2545 		AttachmentReference			dsAttachmentReference		(1u, VK_IMAGE_LAYOUT_DEPTH_STENCIL_ATTACHMENT_OPTIMAL, VK_IMAGE_ASPECT_DEPTH_BIT | VK_IMAGE_ASPECT_STENCIL_BIT);
2546 
2547 		const VkImageAspectFlags	inputAttachmentAspectMask	((m_renderPassType == RENDERPASS_TYPE_RENDERPASS2)
2548 																? static_cast<VkImageAspectFlags>(VK_IMAGE_ASPECT_COLOR_BIT)
2549 																: static_cast<VkImageAspectFlags>(0));
2550 
2551 		attachments.push_back(Attachment(colorFormat, VK_SAMPLE_COUNT_1_BIT, VK_ATTACHMENT_LOAD_OP_LOAD, VK_ATTACHMENT_STORE_OP_STORE, VK_ATTACHMENT_LOAD_OP_DONT_CARE, VK_ATTACHMENT_STORE_OP_DONT_CARE, colorImageLayout, colorImageLayout));
2552 		colorAttachmentReferences.push_back(AttachmentReference(0u, colorImageLayout));
2553 
2554 		if (isDSFormat)
2555 		{
2556 			attachments.push_back(Attachment(m_format, VK_SAMPLE_COUNT_1_BIT, VK_ATTACHMENT_LOAD_OP_LOAD, VK_ATTACHMENT_STORE_OP_STORE, VK_ATTACHMENT_LOAD_OP_DONT_CARE, VK_ATTACHMENT_STORE_OP_STORE, VK_IMAGE_LAYOUT_DEPTH_STENCIL_ATTACHMENT_OPTIMAL, VK_IMAGE_LAYOUT_DEPTH_STENCIL_ATTACHMENT_OPTIMAL));
2557 		}
2558 		else
2559 		{
2560 			attachments.push_back(Attachment(colorFormat, VK_SAMPLE_COUNT_1_BIT, VK_ATTACHMENT_LOAD_OP_LOAD, VK_ATTACHMENT_STORE_OP_DONT_CARE, VK_ATTACHMENT_LOAD_OP_DONT_CARE, VK_ATTACHMENT_STORE_OP_DONT_CARE, VK_IMAGE_LAYOUT_GENERAL, VK_IMAGE_LAYOUT_GENERAL));
2561 			inputAttachmentReferences.push_back(AttachmentReference(1u, VK_IMAGE_LAYOUT_GENERAL, inputAttachmentAspectMask));
2562 		}
2563 
2564 		const vector<Subpass>		subpasses	(1, Subpass(VK_PIPELINE_BIND_POINT_GRAPHICS, 0u, inputAttachmentReferences, colorAttachmentReferences, vector<AttachmentReference>(), isDSFormat ? dsAttachmentReference : AttachmentReference(VK_ATTACHMENT_UNUSED, VK_IMAGE_LAYOUT_GENERAL), vector<deUint32>()));
2565 
2566 		renderPass = createRenderPass(vkd, device, RenderPass(attachments, subpasses, vector<SubpassDependency>()), m_renderPassType);
2567 	}
2568 
2569 	// Create render pipeline.
2570 	{
2571 		const Unique<VkShaderModule>				vertexShaderModule			(createShaderModule(vkd, device, m_context.getBinaryCollection().get("vert"), 0u));
2572 		const Unique<VkShaderModule>				fragmentShaderModule		(createShaderModule(vkd, device, m_context.getBinaryCollection().get("frag"), 0u));
2573 
2574 		const VkVertexInputBindingDescription		vertexBinding0				=
2575 		{
2576 			0u,							// deUint32					binding
2577 			sizeof(Vec4),				// deUint32					strideInBytes
2578 			VK_VERTEX_INPUT_RATE_VERTEX	// VkVertexInputStepRate	stepRate
2579 		};
2580 
2581 		const VkVertexInputAttributeDescription		attr0						=
2582 		{
2583 			0u,								// deUint32	location
2584 			0u,								// deUint32	binding
2585 			VK_FORMAT_R32G32B32A32_SFLOAT,	// VkFormat	format
2586 			0u								// deUint32	offsetInBytes
2587 		};
2588 
2589 		const VkPipelineVertexInputStateCreateInfo	vertexInputState			=
2590 		{
2591 			VK_STRUCTURE_TYPE_PIPELINE_VERTEX_INPUT_STATE_CREATE_INFO,	// VkStructureType							sType
2592 			DE_NULL,													// const void*								pNext
2593 			(VkPipelineVertexInputStateCreateFlags)0u,					// VkPipelineVertexInputStateCreateFlags	flags
2594 			1u,															// deUint32									vertexBindingDescriptionCount
2595 			&vertexBinding0,											// const VkVertexInputBindingDescription*	pVertexBindingDescriptions
2596 			1u,															// deUint32									vertexAttributeDescriptionCount
2597 			&attr0														// const VkVertexInputAttributeDescription*	pVertexAttributeDescriptions
2598 		};
2599 
2600 		// Use write mask to enable only B and A channels to prevent self dependency (reads are done for channels R and G).
2601 		const VkPipelineColorBlendAttachmentState	colorBlendAttachmentState	=
2602 		{
2603 			VK_FALSE,					// VkBool32					blendEnable
2604 			VK_BLEND_FACTOR_ZERO,		// VkBlendFactor			srcColorBlendFactor
2605 			VK_BLEND_FACTOR_ZERO,		// VkBlendFactor			dstColorBlendFactor
2606 			VK_BLEND_OP_ADD,			// VkBlendOp				colorBlendOp
2607 			VK_BLEND_FACTOR_ZERO,		// VkBlendFactor			srcAlphaBlendFactor
2608 			VK_BLEND_FACTOR_ZERO,		// VkBlendFactor			dstAlphaBlendFactor
2609 			VK_BLEND_OP_ADD,			// VkBlendOp				alphaBlendOp
2610 			VK_COLOR_COMPONENT_B_BIT
2611 			| VK_COLOR_COMPONENT_A_BIT	// VkColorComponentFlags	colorWriteMask
2612 		};
2613 
2614 		const VkPipelineColorBlendStateCreateInfo	colorBlendState				=
2615 		{
2616 			VK_STRUCTURE_TYPE_PIPELINE_COLOR_BLEND_STATE_CREATE_INFO,	// VkStructureType								sType
2617 			DE_NULL,													// const void*									pNext
2618 			0u,															// VkPipelineColorBlendStateCreateFlags			flags
2619 			VK_FALSE,													// VkBool32										logicOpEnable
2620 			VK_LOGIC_OP_CLEAR,											// VkLogicOp									logicOp
2621 			1u,															// deUint32										attachmentCount
2622 			&colorBlendAttachmentState,									// const VkPipelineColorBlendAttachmentState*	pAttachments
2623 			{ 0.0f, 0.0f, 0.0f, 0.0f }									// float										blendConstants[4]
2624 		};
2625 
2626 		const VkStencilOpState						stencilOpState				=
2627 		{
2628 			VK_STENCIL_OP_REPLACE,	// VkStencilOp	failOp
2629 			VK_STENCIL_OP_REPLACE,	// VkStencilOp	passOp
2630 			VK_STENCIL_OP_ZERO,		// VkStencilOp	depthFailOp
2631 			VK_COMPARE_OP_ALWAYS,	// VkCompareOp	compareOp
2632 			0xff,					// deUint32		compareMask
2633 			0xff,					// deUint32		writeMask
2634 			stencilRefValue			// deUint32		reference
2635 		};
2636 
2637 		const VkPipelineDepthStencilStateCreateInfo	depthStencilState			=
2638 		{
2639 			VK_STRUCTURE_TYPE_PIPELINE_DEPTH_STENCIL_STATE_CREATE_INFO,	// VkStructureType							sType
2640 			DE_NULL,													// const void*								pNext
2641 			0u,															// VkPipelineDepthStencilStateCreateFlags	flags
2642 			VK_TRUE,													// VkBool32									depthTestEnable
2643 			VK_FALSE,													// VkBool32									depthWriteEnable
2644 			VK_COMPARE_OP_LESS,											// VkCompareOp								depthCompareOp
2645 			VK_FALSE,													// VkBool32									depthBoundsTestEnable
2646 			VK_TRUE,													// VkBool32									stencilTestEnable
2647 			stencilOpState,												// VkStencilOpState							front
2648 			stencilOpState,												// VkStencilOpState							back
2649 			0.0f,														// float									minDepthBounds
2650 			1.0f														// float									maxDepthBounds
2651 		};
2652 
2653 		const std::vector<VkViewport>				viewports					(1, makeViewport(tcu::UVec2(m_width, m_height)));
2654 		const std::vector<VkRect2D>					scissors					(1, makeRect2D(tcu::UVec2(m_width, m_height)));
2655 
2656 		renderPipeline = makeGraphicsPipeline(vkd,			// const DeviceInterface&							vk
2657 				device,										// const VkDevice									device
2658 				*pipelineLayout,							// const VkPipelineLayout							pipelineLayout
2659 				*vertexShaderModule,						// const VkShaderModule								vertexShaderModule
2660 				DE_NULL,									// const VkShaderModule								tessellationControlShaderModule
2661 				DE_NULL,									// const VkShaderModule								tessellationEvalShaderModule
2662 				DE_NULL,									// const VkShaderModule								geometryShaderModule
2663 				*fragmentShaderModule,						// const VkShaderModule								fragmentShaderModule
2664 				*renderPass,								// const VkRenderPass								renderPass
2665 				viewports,									// const std::vector<VkViewport>&					viewports
2666 				scissors,									// const std::vector<VkRect2D>&						scissors
2667 				VK_PRIMITIVE_TOPOLOGY_TRIANGLE_STRIP,		// const VkPrimitiveTopology						topology
2668 				0u,											// const deUint32									subpass
2669 				0u,											// const deUint32									patchControlPoints
2670 				&vertexInputState,							// const VkPipelineVertexInputStateCreateInfo*		vertexInputStateCreateInfo
2671 				DE_NULL,									// const VkPipelineRasterizationStateCreateInfo*	rasterizationStateCreateInfo
2672 				DE_NULL,									// const VkPipelineMultisampleStateCreateInfo*		multisampleStateCreateInfo
2673 				isDSFormat ? &depthStencilState : DE_NULL,	// const VkPipelineDepthStencilStateCreateInfo*		depthStencilStateCreateInfo
2674 				isDSFormat ? DE_NULL : &colorBlendState);	// const VkPipelineColorBlendStateCreateInfo*		colorBlendStateCreateInfo
2675 	}
2676 
2677 	// Create framebuffer.
2678 	{
2679 		const VkImageView				attachments[]			=
2680 		{
2681 			*outputImageView,
2682 			isDSFormat ? *dsImageView : *inputImageView
2683 		};
2684 
2685 		const VkFramebufferCreateInfo	framebufferCreateInfo	=
2686 		{
2687 			VK_STRUCTURE_TYPE_FRAMEBUFFER_CREATE_INFO,	// VkStructureType			sType
2688 			DE_NULL,									// const void*				pNext
2689 			0u,											// VkFramebufferCreateFlags	flags
2690 			*renderPass,								// VkRenderPass				renderPass
2691 			2u,											// uint32_t					attachmentCount
2692 			attachments,								// const VkImageView*		pAttachments
2693 			m_width,									// uint32_t					width
2694 			m_height,									// uint32_t					height
2695 			1u											// uint32_t					layers
2696 		};
2697 
2698 		framebuffer = vk::createFramebuffer(vkd, device, &framebufferCreateInfo);
2699 	}
2700 
2701 	// Generate quad vertices
2702 	{
2703 		const tcu::Vec4	lowerLeftVertex		(-1.0f, -1.0f, 0.5f, 1.0f);
2704 		const tcu::Vec4	lowerRightVertex	(1.0f, -1.0f, 0.5f, 1.0f);
2705 		const tcu::Vec4	upperLeftVertex		(-1.0f, 1.0f, 0.5f, 1.0f);
2706 		const tcu::Vec4	upperRightVertex	(1.0f, 1.0f, 0.5f, 1.0f);
2707 
2708 		vertexData.push_back(lowerLeftVertex);
2709 		vertexData.push_back(upperLeftVertex);
2710 		vertexData.push_back(lowerRightVertex);
2711 		vertexData.push_back(upperRightVertex);
2712 	}
2713 
2714 	// Upload vertex data.
2715 	{
2716 		const size_t				vertexDataSize		= vertexData.size() * sizeof(Vec4);
2717 
2718 		const VkBufferCreateInfo	vertexBufferParams	=
2719 		{
2720 			VK_STRUCTURE_TYPE_BUFFER_CREATE_INFO,	//	VkStructureType		sType
2721 			DE_NULL,								//	const void*			pNext
2722 			0u,										//	VkBufferCreateFlags	flags
2723 			(VkDeviceSize)vertexDataSize,			//	VkDeviceSize		size
2724 			VK_BUFFER_USAGE_VERTEX_BUFFER_BIT,		//	VkBufferUsageFlags	usage
2725 			VK_SHARING_MODE_EXCLUSIVE,				//	VkSharingMode		sharingMode
2726 			1u,										//	deUint32			queueFamilyCount
2727 			&queueFamilyIndex,						//	const deUint32*		pQueueFamilyIndices
2728 		};
2729 
2730 		vertexBuffer		= createBuffer(vkd, m_context.getDevice(), &vertexBufferParams);
2731 		vertexBufferMemory	= createBufferMemory(vkd, device, m_context.getDefaultAllocator(), *vertexBuffer);
2732 
2733 		deMemcpy(vertexBufferMemory->getHostPtr(), vertexData.data(), vertexDataSize);
2734 		flushAlloc(vkd, device, *vertexBufferMemory);
2735 	}
2736 
2737 	beginCommandBuffer(vkd, *commandBuffer);
2738 	vkd.cmdBindPipeline(*commandBuffer, vk::VK_PIPELINE_BIND_POINT_GRAPHICS, *renderPipeline);
2739 
2740 	if (!isDSFormat)
2741 		vkd.cmdBindDescriptorSets(*commandBuffer, vk::VK_PIPELINE_BIND_POINT_GRAPHICS, *pipelineLayout, 0u, 1u, &*descriptorSet, 0u, DE_NULL);
2742 
2743 	// Begin render pass.
2744 	{
2745 		VkRect2D					renderArea	=
2746 		{
2747 			{ 0u, 0u },				// VkOffset2D	offset
2748 			{ m_width, m_height }	// VkExtent2D	extent
2749 		};
2750 
2751 		const VkRenderPassBeginInfo	beginInfo	=
2752 		{
2753 			VK_STRUCTURE_TYPE_RENDER_PASS_BEGIN_INFO,	// VkStructureType		sType
2754 			DE_NULL,									// const void*			pNext
2755 			*renderPass,								// VkRenderPass			renderPass
2756 			*framebuffer,								// VkFramebuffer		framebuffer
2757 			renderArea,									// VkRect2D				renderArea
2758 			0u,											// uint32_t				clearValueCount
2759 			DE_NULL										// const VkClearValue*	pClearValues
2760 		};
2761 
2762 		RenderpassSubpass::cmdBeginRenderPass(vkd, *commandBuffer, &beginInfo, &subpassBeginInfo);
2763 	}
2764 
2765 	const VkDeviceSize bindingOffset = 0;
2766 
2767 	vkd.cmdBindVertexBuffers(*commandBuffer, 0u, 1u, &vertexBuffer.get(), &bindingOffset);
2768 	vkd.cmdBindPipeline(*commandBuffer, VK_PIPELINE_BIND_POINT_GRAPHICS, *renderPipeline);
2769 	vkd.cmdDraw(*commandBuffer, 4u, 1u, 0u, 0u);
2770 	RenderpassSubpass::cmdEndRenderPass(vkd, *commandBuffer, &subpassEndInfo);
2771 
2772 	// Copy results to a buffer.
2773 	if (isDSFormat)
2774 	{
2775 		copyDepthStencilImageToBuffers(vkd, *commandBuffer, *dsImage, *resultBuffer0, *resultBuffer1, tcu::IVec2(m_width, m_height), VK_ACCESS_DEPTH_STENCIL_ATTACHMENT_WRITE_BIT, VK_IMAGE_LAYOUT_DEPTH_STENCIL_ATTACHMENT_OPTIMAL);
2776 	}
2777 	else
2778 	{
2779 		copyImageToBuffer(vkd, *commandBuffer, *colorImage, *resultBuffer0, tcu::IVec2(m_width, m_height), VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT, VK_IMAGE_LAYOUT_GENERAL);
2780 	}
2781 
2782 	endCommandBuffer(vkd, *commandBuffer);
2783 	submitCommandsAndWait(vkd, m_context.getDevice(), m_context.getUniversalQueue(), *commandBuffer);
2784 	invalidateMappedMemoryRange(vkd, m_context.getDevice(), resultBuffer0Memory->getMemory(), resultBuffer0Memory->getOffset(), VK_WHOLE_SIZE);
2785 	invalidateMappedMemoryRange(vkd, m_context.getDevice(), resultBuffer1Memory->getMemory(), resultBuffer1Memory->getOffset(), VK_WHOLE_SIZE);
2786 
2787 	// Verify result.
2788 	{
2789 		const tcu::TextureFormat	format		(mapVkFormat(m_format));
2790 		tcu::TextureLevel			reference	(format, m_width, m_height);
2791 
2792 		if (isDSFormat)
2793 		{
2794 			const void* const					ptrDepth				(resultBuffer0Memory->getHostPtr());
2795 			const void* const					ptrStencil				(resultBuffer1Memory->getHostPtr());
2796 			const tcu::ConstPixelBufferAccess	resultDepthAccess		(getDepthCopyFormat(m_format), m_width, m_height, 1, ptrDepth);
2797 			const tcu::ConstPixelBufferAccess	resultStencilAccess		(getStencilCopyFormat(m_format), m_width, m_height, 1, ptrStencil);
2798 			const PixelBufferAccess				referenceDepthAccess	(tcu::getEffectiveDepthStencilAccess(reference.getAccess(), tcu::Sampler::MODE_DEPTH));
2799 			const PixelBufferAccess				referenceStencilAccess	(tcu::getEffectiveDepthStencilAccess(reference.getAccess(), tcu::Sampler::MODE_STENCIL));
2800 			const float							depthThreshold			(1.0f / ((UVec4(1u) << tcu::getTextureFormatMantissaBitDepth(resultDepthAccess.getFormat()).cast<deUint32>()) - 1u).cast<float>().x());
2801 
2802 			for (deUint32 x = 0; x < m_width; x++)
2803 				for (deUint32 y = 0; y < m_height; y++)
2804 				{
2805 					float depthValue = ((x / tileSize) % 2 != (y / tileSize) % 2) ? depthInitValues[0] : depthInitValues[1];
2806 					referenceDepthAccess.setPixDepth(depthValue, x, y, 0);
2807 					referenceStencilAccess.setPixel(tcu::IVec4(0.5f < depthValue ? stencilRefValue : 0), x, y, 0);
2808 				}
2809 
2810 			if (!verifyDepth(m_context, reference.getAccess(), resultDepthAccess, depthThreshold))
2811 				m_resultCollector.fail("Depth compare failed.");
2812 
2813 			if (!verifyStencil(m_context, referenceStencilAccess, resultStencilAccess))
2814 				m_resultCollector.fail("Stencil compare failed.");
2815 		}
2816 		else
2817 		{
2818 			const void* const					ptrResult		(resultBuffer0Memory->getHostPtr());
2819 			const tcu::ConstPixelBufferAccess	resultAccess	(format, m_width, m_height, 1, ptrResult);
2820 			const PixelBufferAccess				referenceAccess	(reference.getAccess());
2821 
2822 			for (deUint32 x = 0; x < m_width; x++)
2823 				for (deUint32 y = 0; y < m_height; y++)
2824 				{
2825 					const tcu::Vec4	initValue	= ((x / tileSize) % 2 != (y / tileSize) % 2) ? colorInitValues[0] : colorInitValues[1];
2826 					const tcu::Vec4	refValue	= tcu::Vec4(initValue.x(), initValue.y(), initValue.x() + initValue.y(), 1.0f);
2827 
2828 					referenceAccess.setPixel(refValue, x, y, 0);
2829 				}
2830 
2831 			if (!tcu::floatThresholdCompare(m_context.getTestContext().getLog(),	// log
2832 											"Rendered result",						// imageSetName
2833 											"",										// imageSetDesc
2834 											referenceAccess,						// reference
2835 											resultAccess,							// result
2836 											Vec4(0.01f),							// threshold
2837 											tcu::COMPARE_LOG_RESULT))				// logMode
2838 			{
2839 				m_resultCollector.fail("Image compare failed.");
2840 			}
2841 		}
2842 
2843 	}
2844 
2845 	return tcu::TestStatus(m_resultCollector.getResult(), m_resultCollector.getMessage());
2846 }
2847 
2848 struct SingleAttachmentTestConfig
2849 {
SingleAttachmentTestConfigvkt::__anon104c10a40111::SingleAttachmentTestConfig2850 		SingleAttachmentTestConfig	(VkFormat		format_,
2851 									 RenderPassType	renderPassType_)
2852 		: format			(format_)
2853 		, renderPassType	(renderPassType_)
2854 	{
2855 	}
2856 
2857 	VkFormat		format;
2858 	RenderPassType	renderPassType;
2859 };
2860 
2861 class SingleAttachmentTestInstance : public TestInstance
2862 {
2863 public:
2864 							SingleAttachmentTestInstance	(Context&					context,
2865 															 SingleAttachmentTestConfig	testConfig);
2866 
2867 							~SingleAttachmentTestInstance	(void);
2868 
2869 	tcu::TestStatus			iterate							(void);
2870 
2871 	template<typename RenderpassSubpass>
2872 	tcu::TestStatus			iterateInternal					(void);
2873 
2874 private:
2875 	const bool				m_extensionSupported;
2876 	const RenderPassType	m_renderPassType;
2877 
2878 	const deUint32			m_width;
2879 	const deUint32			m_height;
2880 	const VkFormat			m_format;
2881 	tcu::ResultCollector	m_resultCollector;
2882 };
2883 
SingleAttachmentTestInstance(Context & context,SingleAttachmentTestConfig testConfig)2884 SingleAttachmentTestInstance::SingleAttachmentTestInstance (Context& context, SingleAttachmentTestConfig testConfig)
2885 	: TestInstance			(context)
2886 	, m_extensionSupported	((testConfig.renderPassType == RENDERPASS_TYPE_RENDERPASS2) && context.requireDeviceFunctionality("VK_KHR_create_renderpass2"))
2887 	, m_renderPassType		(testConfig.renderPassType)
2888 	, m_width				(256u)
2889 	, m_height				(256u)
2890 	, m_format				(testConfig.format)
2891 {
2892 }
2893 
~SingleAttachmentTestInstance(void)2894 SingleAttachmentTestInstance::~SingleAttachmentTestInstance (void)
2895 {
2896 }
2897 
iterate(void)2898 tcu::TestStatus SingleAttachmentTestInstance::iterate (void)
2899 {
2900 	switch (m_renderPassType)
2901 	{
2902 		case RENDERPASS_TYPE_LEGACY:
2903 			return iterateInternal<RenderpassSubpass1>();
2904 		case RENDERPASS_TYPE_RENDERPASS2:
2905 			return iterateInternal<RenderpassSubpass2>();
2906 		default:
2907 			TCU_THROW(InternalError, "Impossible");
2908 	}
2909 }
2910 
2911 template<typename RenderpassSubpass>
iterateInternal(void)2912 tcu::TestStatus SingleAttachmentTestInstance::iterateInternal (void)
2913 {
2914 	const DeviceInterface&								vkd					(m_context.getDeviceInterface());
2915 	const VkDevice										device				= m_context.getDevice();
2916 	const VkQueue										queue				= m_context.getUniversalQueue();
2917 	const deUint32										queueFamilyIndex	= m_context.getUniversalQueueFamilyIndex();
2918 	const Unique<VkCommandPool>							commandPool			(createCommandPool(vkd, m_context.getDevice(), VK_COMMAND_POOL_CREATE_TRANSIENT_BIT, queueFamilyIndex));
2919 	const Unique<VkCommandBuffer>						commandBuffer		(allocateCommandBuffer(vkd, m_context.getDevice(), *commandPool, VK_COMMAND_BUFFER_LEVEL_PRIMARY));
2920 	const typename RenderpassSubpass::SubpassBeginInfo	subpassBeginInfo	(DE_NULL, VK_SUBPASS_CONTENTS_INLINE);
2921 	const typename RenderpassSubpass::SubpassEndInfo	subpassEndInfo		(DE_NULL);
2922 	const tcu::Vec4										colorInitValues[2]	= { tcu::Vec4(0.2f, 0.4f, 0.1f, 1.0f), tcu::Vec4(0.5f, 0.4f, 0.7f, 1.0f) };
2923 	const VkExtent3D									imageExtent			= { m_width, m_height, 1u };
2924 	vector<Vec4>										vertexData;
2925 	Move<VkImage>										colorImage;
2926 	Move<VkImage>										resultImage;
2927 	de::MovePtr<Allocation>								colorImageAllocation;
2928 	de::MovePtr<Allocation>								resultImageAllocation;
2929 	Move<VkImageView>									imageViewInput;
2930 	Move<VkImageView>									imageViewResult;
2931 	Move<VkPipelineLayout>								pipelineLayoutInput;
2932 	Move<VkPipelineLayout>								pipelineLayoutImageSampler;
2933 	Move<VkPipeline>									pipelineSolidColor;
2934 	Move<VkPipeline>									pipelineInputAtt;
2935 	Move<VkPipeline>									pipelineImageSampler;
2936 	Move<VkFramebuffer>									framebuffer1;
2937 	Move<VkFramebuffer>									framebuffer0;
2938 	Move<VkRenderPass>									renderPass0;
2939 	Move<VkRenderPass>									renderPass1;
2940 	Move<VkBuffer>										resultBuffer;
2941 	de::MovePtr<Allocation>								resultBufferMemory;
2942 	Move<VkBuffer>										vertexBuffer;
2943 	de::MovePtr<Allocation>								vertexBufferMemory;
2944 	Move<VkSampler>										sampler;
2945 
2946 	// Create image used for both input and output.
2947 	{
2948 		VkImageUsageFlags		usage			= VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT | VK_IMAGE_USAGE_INPUT_ATTACHMENT_BIT
2949 												  | VK_IMAGE_USAGE_TRANSFER_SRC_BIT | VK_IMAGE_USAGE_TRANSFER_DST_BIT
2950 												  | VK_IMAGE_USAGE_SAMPLED_BIT;
2951 
2952 		const VkImageCreateInfo	imageCreateInfo	=
2953 		{
2954 			VK_STRUCTURE_TYPE_IMAGE_CREATE_INFO,	// VkStructureType			sType
2955 			DE_NULL,								// const void*				pNext
2956 			0u,										// VkImageCreateFlags		flags
2957 			VK_IMAGE_TYPE_2D,						// VkImageType				imageType
2958 			m_format,								// VkFormat					format
2959 			imageExtent,							// VkExtent3D				extent
2960 			1u,										// uint32_t					mipLevels
2961 			1u,										// uint32_t					arrayLayers
2962 			VK_SAMPLE_COUNT_1_BIT,					// VkSampleCountFlagBits	samples
2963 			VK_IMAGE_TILING_OPTIMAL,				// VkImageTiling			tiling
2964 			usage,									// VkImageUsageFlags		usage
2965 			VK_SHARING_MODE_EXCLUSIVE,				// VkSharingMode			sharingMode
2966 			1u,										// uint32_t					queueFamilyIndexCount
2967 			&queueFamilyIndex,						// const uint32_t*			pQueueFamilyIndices
2968 			VK_IMAGE_LAYOUT_UNDEFINED				// VkImageLayout			initialLayout
2969 		};
2970 
2971 		checkImageSupport(m_context.getInstanceInterface(), m_context.getPhysicalDevice(), imageCreateInfo);
2972 
2973 		colorImage = createImage(vkd, device, &imageCreateInfo, DE_NULL);
2974 		colorImageAllocation = m_context.getDefaultAllocator().allocate(getImageMemoryRequirements(vkd, device, *colorImage), MemoryRequirement::Any);
2975 		VK_CHECK(vkd.bindImageMemory(device, *colorImage, colorImageAllocation->getMemory(), colorImageAllocation->getOffset()));
2976 	}
2977 
2978 	// Create image used for final result.
2979 	{
2980 		VkImageUsageFlags		usage			= VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT | VK_IMAGE_USAGE_TRANSFER_SRC_BIT | VK_IMAGE_USAGE_TRANSFER_DST_BIT;
2981 
2982 		const VkImageCreateInfo	imageCreateInfo	=
2983 		{
2984 			VK_STRUCTURE_TYPE_IMAGE_CREATE_INFO,	// VkStructureType			sType
2985 			DE_NULL,								// const void*				pNext
2986 			0u,										// VkImageCreateFlags		flags
2987 			VK_IMAGE_TYPE_2D,						// VkImageType				imageType
2988 			m_format,								// VkFormat					format
2989 			imageExtent,							// VkExtent3D				extent
2990 			1u,										// uint32_t					mipLevels
2991 			1u,										// uint32_t					arrayLayers
2992 			VK_SAMPLE_COUNT_1_BIT,					// VkSampleCountFlagBits	samples
2993 			VK_IMAGE_TILING_OPTIMAL,				// VkImageTiling			tiling
2994 			usage,									// VkImageUsageFlags		usage
2995 			VK_SHARING_MODE_EXCLUSIVE,				// VkSharingMode			sharingMode
2996 			1u,										// uint32_t					queueFamilyIndexCount
2997 			&queueFamilyIndex,						// const uint32_t*			pQueueFamilyIndices
2998 			VK_IMAGE_LAYOUT_UNDEFINED				// VkImageLayout			initialLayout
2999 		};
3000 
3001 		checkImageSupport(m_context.getInstanceInterface(), m_context.getPhysicalDevice(), imageCreateInfo);
3002 
3003 		resultImage = createImage(vkd, device, &imageCreateInfo, DE_NULL);
3004 		resultImageAllocation = m_context.getDefaultAllocator().allocate(getImageMemoryRequirements(vkd, device, *resultImage), MemoryRequirement::Any);
3005 		VK_CHECK(vkd.bindImageMemory(device, *resultImage, resultImageAllocation->getMemory(), resultImageAllocation->getOffset()));
3006 	}
3007 
3008 	// Initialize color image. This is expected to be cleared later.
3009 	initColorImageChessboardPattern(vkd, device, queue, queueFamilyIndex, m_context.getDefaultAllocator(), *colorImage, m_format, colorInitValues[0], colorInitValues[1], m_width, m_height, 32u, VK_IMAGE_LAYOUT_UNDEFINED, VK_IMAGE_LAYOUT_GENERAL, VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT);
3010 	// Initialize result image. This will be overwritten later.
3011 	initColorImageChessboardPattern(vkd, device, queue, queueFamilyIndex, m_context.getDefaultAllocator(), *resultImage, m_format, colorInitValues[0], colorInitValues[1], m_width, m_height, 32u, VK_IMAGE_LAYOUT_UNDEFINED, VK_IMAGE_LAYOUT_COLOR_ATTACHMENT_OPTIMAL, VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT);
3012 
3013 	// Create image views.
3014 	{
3015 		const VkImageViewCreateInfo imageViewCreateInfo =
3016 		{
3017 			VK_STRUCTURE_TYPE_IMAGE_VIEW_CREATE_INFO,	// VkStructureType			sType
3018 			DE_NULL,									// const void*				pNext
3019 			0u,											// VkImageViewCreateFlags	flags
3020 			*colorImage,								// VkImage					image
3021 			VK_IMAGE_VIEW_TYPE_2D,						// VkImageViewType			viewType
3022 			m_format,									// VkFormat					format
3023 			makeComponentMappingRGBA(),					// VkComponentMapping		components
3024 			{											// VkImageSubresourceRange	subresourceRange
3025 				VK_IMAGE_ASPECT_COLOR_BIT,
3026 				0u,
3027 				1u,
3028 				0u,
3029 				1u
3030 			}
3031 		};
3032 
3033 		imageViewInput = createImageView(vkd, device, &imageViewCreateInfo);
3034 	}
3035 
3036 	{
3037 		const VkImageViewCreateInfo imageViewCreateInfo =
3038 		{
3039 			VK_STRUCTURE_TYPE_IMAGE_VIEW_CREATE_INFO,	// VkStructureType			sType
3040 			DE_NULL,									// const void*				pNext
3041 			0u,											// VkImageViewCreateFlags	flags
3042 			*resultImage,								// VkImage					image
3043 			VK_IMAGE_VIEW_TYPE_2D,						// VkImageViewType			viewType
3044 			m_format,									// VkFormat					format
3045 			makeComponentMappingRGBA(),					// VkComponentMapping		components
3046 			{											// VkImageSubresourceRange	subresourceRange
3047 				VK_IMAGE_ASPECT_COLOR_BIT,
3048 				0u,
3049 				1u,
3050 				0u,
3051 				1u
3052 			}
3053 		};
3054 
3055 		imageViewResult = createImageView(vkd, device, &imageViewCreateInfo);
3056 	}
3057 
3058 	// Create result buffer.
3059 	{
3060 		resultBuffer		= createBuffer(vkd, device, m_format, m_width, m_height);
3061 		resultBufferMemory	= createBufferMemory(vkd, device, m_context.getDefaultAllocator(), *resultBuffer);
3062 	}
3063 
3064 	// Create sampler.
3065 	{
3066 		const VkSamplerCreateInfo samplerInfo =
3067 		{
3068 			VK_STRUCTURE_TYPE_SAMPLER_CREATE_INFO,		// VkStructureType			sType
3069 			DE_NULL,									// const void*				pNext
3070 			0u,											// VkSamplerCreateFlags		flags
3071 			VK_FILTER_NEAREST,							// VkFilter					magFilter
3072 			VK_FILTER_NEAREST,							// VkFilter					minFilter
3073 			VK_SAMPLER_MIPMAP_MODE_NEAREST,				// VkSamplerMipmapMode		mipmapMode
3074 			VK_SAMPLER_ADDRESS_MODE_CLAMP_TO_EDGE,		// VkSamplerAddressMode		addressModeU
3075 			VK_SAMPLER_ADDRESS_MODE_CLAMP_TO_EDGE,		// VkSamplerAddressMode		addressModeV
3076 			VK_SAMPLER_ADDRESS_MODE_CLAMP_TO_EDGE,		// VkSamplerAddressMode		addressModeW
3077 			0.0f,										// float					mipLodBias
3078 			VK_FALSE,									// VkBool32					anisotropyEnable
3079 			1.0f,										// float					maxAnisotropy
3080 			VK_FALSE,									// VkBool32					compareEnable
3081 			VK_COMPARE_OP_ALWAYS,						// VkCompareOp				compareOp
3082 			0.0f,										// float					minLod
3083 			0.0f,										// float					maxLod
3084 			VK_BORDER_COLOR_FLOAT_TRANSPARENT_BLACK,	// VkBorderColor			borderColor
3085 			VK_FALSE,									// VkBool32					unnormalizedCoordinates
3086 		};
3087 
3088 		sampler = createSampler(vkd, device, &samplerInfo);
3089 	}
3090 
3091 	// Create descriptor set layouts.
3092 	Unique<VkDescriptorSetLayout>	descriptorSetLayoutInput	(DescriptorSetLayoutBuilder()
3093 			.addSingleBinding(VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT, VK_SHADER_STAGE_FRAGMENT_BIT)
3094 			.build(vkd, device));
3095 
3096 	Unique<VkDescriptorSetLayout>	descriptorSetLayoutImageSampler	(DescriptorSetLayoutBuilder()
3097 			.addSingleBinding(VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER, VK_SHADER_STAGE_FRAGMENT_BIT)
3098 			.build(vkd, device));
3099 
3100 	// Create descriptor pool.
3101 	Unique<VkDescriptorPool>		descriptorPool		(DescriptorPoolBuilder()
3102 			.addType(VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT, 1u)
3103 			.addType(VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER, 1u)
3104 			.build(vkd, device, VK_DESCRIPTOR_POOL_CREATE_FREE_DESCRIPTOR_SET_BIT, 2u));
3105 
3106 	// Create desriptor sets.
3107 	Unique<VkDescriptorSet>			descriptorSetInput	(makeDescriptorSet(vkd, device, *descriptorPool, *descriptorSetLayoutInput));
3108 	Unique<VkDescriptorSet>			descriptorSetImageSampler	(makeDescriptorSet(vkd, device, *descriptorPool, *descriptorSetLayoutImageSampler));
3109 
3110 	// Update descriptor set information.
3111 	VkDescriptorImageInfo			descIOAttachment	= makeDescriptorImageInfo(DE_NULL, *imageViewInput, VK_IMAGE_LAYOUT_GENERAL);
3112 	VkDescriptorImageInfo			descImageSampler	= makeDescriptorImageInfo(*sampler, *imageViewInput, VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL);
3113 
3114 	DescriptorSetUpdateBuilder()
3115 		.writeSingle(*descriptorSetInput, DescriptorSetUpdateBuilder::Location::binding(0u), VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT, &descIOAttachment)
3116 		.update(vkd, device);
3117 
3118 	DescriptorSetUpdateBuilder()
3119 		.writeSingle(*descriptorSetImageSampler, DescriptorSetUpdateBuilder::Location::binding(0u), VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER, &descImageSampler)
3120 		.update(vkd, device);
3121 
3122 	// Create pipeline layouts.
3123 	{
3124 		const VkPipelineLayoutCreateInfo pipelineLayoutCreateInfo =
3125 		{
3126 			VK_STRUCTURE_TYPE_PIPELINE_LAYOUT_CREATE_INFO,	// VkStructureType				sType
3127 			DE_NULL,										// const void*					pNext
3128 			(vk::VkPipelineLayoutCreateFlags)0,				// VkPipelineLayoutCreateFlags	flags
3129 			1u,												// deUint32						setLayoutCount
3130 			&descriptorSetLayoutInput.get(),				// const VkDescriptorSetLayout*	pSetLayouts
3131 			0u,												// deUint32						pushConstantRangeCount
3132 			DE_NULL											// const VkPushConstantRange*	pPushConstantRanges
3133 		};
3134 
3135 		pipelineLayoutInput = createPipelineLayout(vkd, device, &pipelineLayoutCreateInfo);
3136 	}
3137 	{
3138 		const VkPipelineLayoutCreateInfo pipelineLayoutCreateInfo =
3139 		{
3140 			VK_STRUCTURE_TYPE_PIPELINE_LAYOUT_CREATE_INFO,	// VkStructureType				sType
3141 			DE_NULL,										// const void*					pNext
3142 			(vk::VkPipelineLayoutCreateFlags)0,				// VkPipelineLayoutCreateFlags	flags
3143 			1u,												// deUint32						setLayoutCount
3144 			&descriptorSetLayoutImageSampler.get(),			// const VkDescriptorSetLayout*	pSetLayouts
3145 			0u,												// deUint32						pushConstantRangeCount
3146 			DE_NULL											// const VkPushConstantRange*	pPushConstantRanges
3147 		};
3148 
3149 		pipelineLayoutImageSampler = createPipelineLayout(vkd, device, &pipelineLayoutCreateInfo);
3150 	}
3151 
3152 	// Create render passes.
3153 	{
3154 		vector<Attachment>			attachments;
3155 		vector<AttachmentReference>	colorAttachmentReferences;
3156 
3157 		attachments.push_back(Attachment(m_format, VK_SAMPLE_COUNT_1_BIT, VK_ATTACHMENT_LOAD_OP_LOAD, VK_ATTACHMENT_STORE_OP_STORE,
3158 										 VK_ATTACHMENT_LOAD_OP_DONT_CARE, VK_ATTACHMENT_STORE_OP_DONT_CARE,
3159 										 VK_IMAGE_LAYOUT_COLOR_ATTACHMENT_OPTIMAL, VK_IMAGE_LAYOUT_COLOR_ATTACHMENT_OPTIMAL));
3160 
3161 		colorAttachmentReferences.push_back(AttachmentReference(0u, VK_IMAGE_LAYOUT_COLOR_ATTACHMENT_OPTIMAL));
3162 
3163 		const vector<Subpass>			subpasses	(1, Subpass(VK_PIPELINE_BIND_POINT_GRAPHICS, 0u, vector<AttachmentReference>(),
3164 													 colorAttachmentReferences, vector<AttachmentReference>(),
3165 													 AttachmentReference(VK_ATTACHMENT_UNUSED, VK_IMAGE_LAYOUT_GENERAL), vector<deUint32>()));
3166 
3167 		renderPass1 = createRenderPass(vkd, device, RenderPass(attachments, subpasses, vector<SubpassDependency>()), m_renderPassType);
3168 	}
3169 	{
3170 		vector<Attachment>			attachments;
3171 		vector<AttachmentReference>	colorAttachmentReferences;
3172 		vector<AttachmentReference>	inputAttachmentReferences;
3173 
3174 		const VkImageAspectFlags	inputAttachmentAspectMask	((m_renderPassType == RENDERPASS_TYPE_RENDERPASS2)
3175 																? static_cast<VkImageAspectFlags>(VK_IMAGE_ASPECT_COLOR_BIT)
3176 																: static_cast<VkImageAspectFlags>(0));
3177 
3178 		attachments.push_back(Attachment(m_format, VK_SAMPLE_COUNT_1_BIT, VK_ATTACHMENT_LOAD_OP_CLEAR, VK_ATTACHMENT_STORE_OP_STORE,
3179 										 VK_ATTACHMENT_LOAD_OP_DONT_CARE, VK_ATTACHMENT_STORE_OP_DONT_CARE, VK_IMAGE_LAYOUT_GENERAL, VK_IMAGE_LAYOUT_GENERAL));
3180 
3181 		colorAttachmentReferences.push_back(AttachmentReference(0u, VK_IMAGE_LAYOUT_GENERAL));
3182 		inputAttachmentReferences.push_back(AttachmentReference(0u, VK_IMAGE_LAYOUT_GENERAL, inputAttachmentAspectMask));
3183 
3184 		const vector<Subpass>			subpasses		(1, Subpass(VK_PIPELINE_BIND_POINT_GRAPHICS, 0u, inputAttachmentReferences,
3185 														 colorAttachmentReferences, vector<AttachmentReference>(),
3186 														 AttachmentReference(VK_ATTACHMENT_UNUSED, VK_IMAGE_LAYOUT_GENERAL), vector<deUint32>()));
3187 
3188 		const vector<SubpassDependency>	dependencies	(1, SubpassDependency(0u, 0u, VK_PIPELINE_STAGE_COLOR_ATTACHMENT_OUTPUT_BIT,
3189 														 VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT, VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT,
3190 														 VK_ACCESS_INPUT_ATTACHMENT_READ_BIT, VK_DEPENDENCY_BY_REGION_BIT));
3191 
3192 		renderPass0 = createRenderPass(vkd, device, RenderPass(attachments, subpasses, dependencies), m_renderPassType);
3193 	}
3194 
3195 	// Create pipelines.
3196 	{
3197 		const Unique<VkShaderModule>				vertexShaderModule				(createShaderModule(vkd, device, m_context.getBinaryCollection().get("vert"), 0u));
3198 		const Unique<VkShaderModule>				fragmentShaderModuleInputAtt	(createShaderModule(vkd, device, m_context.getBinaryCollection().get("frag_input_attachment"), 0u));
3199 		const Unique<VkShaderModule>				fragmentShaderModuleSolidColor	(createShaderModule(vkd, device, m_context.getBinaryCollection().get("frag_solid_color"), 0u));
3200 		const Unique<VkShaderModule>				fragmentShaderModuleSampler		(createShaderModule(vkd, device, m_context.getBinaryCollection().get("frag_combined_image_sampler"), 0u));
3201 
3202 		const VkVertexInputBindingDescription		vertexBinding0					=
3203 		{
3204 			0u,							// deUint32					binding
3205 			sizeof(Vec4),				// deUint32					strideInBytes
3206 			VK_VERTEX_INPUT_RATE_VERTEX	// VkVertexInputStepRate	stepRate
3207 		};
3208 
3209 		const VkVertexInputAttributeDescription		attr0							=
3210 		{
3211 			0u,								// deUint32	location
3212 			0u,								// deUint32	binding
3213 			VK_FORMAT_R32G32B32A32_SFLOAT,	// VkFormat	format
3214 			0u								// deUint32	offsetInBytes
3215 		};
3216 
3217 		const VkPipelineVertexInputStateCreateInfo	vertexInputState				=
3218 		{
3219 			VK_STRUCTURE_TYPE_PIPELINE_VERTEX_INPUT_STATE_CREATE_INFO,	// VkStructureType							sType
3220 			DE_NULL,													// const void*								pNext
3221 			(VkPipelineVertexInputStateCreateFlags)0u,					// VkPipelineVertexInputStateCreateFlags	flags
3222 			1u,															// deUint32									vertexBindingDescriptionCount
3223 			&vertexBinding0,											// const VkVertexInputBindingDescription*	pVertexBindingDescriptions
3224 			1u,															// deUint32									vertexAttributeDescriptionCount
3225 			&attr0														// const VkVertexInputAttributeDescription*	pVertexAttributeDescriptions
3226 		};
3227 
3228 		const std::vector<VkViewport>				viewports						(1, makeViewport(tcu::UVec2(m_width, m_height)));
3229 		const std::vector<VkRect2D>					scissors						(1, makeRect2D(tcu::UVec2(m_width, m_height)));
3230 
3231 		const VkPipelineColorBlendAttachmentState		colorBlendAttachmentState	=
3232 		{
3233 			VK_TRUE,								// VkBool32					blendEnable
3234 			VK_BLEND_FACTOR_ONE,					// VkBlendFactor			srcColorBlendFactor
3235 			VK_BLEND_FACTOR_ONE_MINUS_SRC_ALPHA,	// VkBlendFactor			dstColorBlendFactor
3236 			VK_BLEND_OP_ADD,						// VkBlendOp				colorBlendOp
3237 			VK_BLEND_FACTOR_ONE,					// VkBlendFactor			srcAlphaBlendFactor
3238 			VK_BLEND_FACTOR_ONE_MINUS_SRC_ALPHA,	// VkBlendFactor			dstAlphaBlendFactor
3239 			VK_BLEND_OP_ADD,						// VkBlendOp				alphaBlendOp
3240 			VK_COLOR_COMPONENT_R_BIT				// VkColorComponentFlags	colorWriteMask
3241 				| VK_COLOR_COMPONENT_G_BIT
3242 				| VK_COLOR_COMPONENT_B_BIT
3243 				| VK_COLOR_COMPONENT_A_BIT
3244 		};
3245 
3246 		const VkPipelineColorBlendStateCreateInfo		colorBlendState				=
3247 		{
3248 			VK_STRUCTURE_TYPE_PIPELINE_COLOR_BLEND_STATE_CREATE_INFO,	// VkStructureType								sType
3249 			DE_NULL,													// const void*									pNext
3250 			0u,															// VkPipelineColorBlendStateCreateFlags			flags
3251 			VK_FALSE,													// VkBool32										logicOpEnable
3252 			VK_LOGIC_OP_CLEAR,											// VkLogicOp									logicOp
3253 			1u,															// deUint32										attachmentCount
3254 			&colorBlendAttachmentState,									// const VkPipelineColorBlendAttachmentState*	pAttachments
3255 			{ 0.0f, 0.0f, 0.0f, 0.0f }									// float										blendConstants[4]
3256 		};
3257 
3258 		pipelineSolidColor = makeGraphicsPipeline(vkd,		// const DeviceInterface&							vk
3259 				device,										// const VkDevice									device
3260 				*pipelineLayoutInput,						// const VkPipelineLayout							pipelineLayout
3261 				*vertexShaderModule,						// const VkShaderModule								vertexShaderModule
3262 				DE_NULL,									// const VkShaderModule								tessellationControlShaderModule
3263 				DE_NULL,									// const VkShaderModule								tessellationEvalShaderModule
3264 				DE_NULL,									// const VkShaderModule								geometryShaderModule
3265 				*fragmentShaderModuleSolidColor,			// const VkShaderModule								fragmentShaderModule
3266 				*renderPass0,								// const VkRenderPass								renderPass
3267 				viewports,									// const std::vector<VkViewport>&					viewports
3268 				scissors,									// const std::vector<VkRect2D>&						scissors
3269 				VK_PRIMITIVE_TOPOLOGY_TRIANGLE_STRIP,		// const VkPrimitiveTopology						topology
3270 				0u,											// const deUint32									subpass
3271 				0u,											// const deUint32									patchControlPoints
3272 				&vertexInputState,							// const VkPipelineVertexInputStateCreateInfo*		vertexInputStateCreateInfo
3273 				DE_NULL,									// const VkPipelineRasterizationStateCreateInfo*	rasterizationStateCreateInfo
3274 				DE_NULL,									// const VkPipelineMultisampleStateCreateInfo*		multisampleStateCreateInfo
3275 				DE_NULL,									// const VkPipelineDepthStencilStateCreateInfo*		depthStencilStateCreateInfo
3276 				&colorBlendState);							// const VkPipelineColorBlendStateCreateInfo*		colorBlendStateCreateInfo
3277 
3278 		pipelineInputAtt = makeGraphicsPipeline(vkd,		// const DeviceInterface&							vk
3279 				device,										// const VkDevice									device
3280 				*pipelineLayoutInput,						// const VkPipelineLayout							pipelineLayout
3281 				*vertexShaderModule,						// const VkShaderModule								vertexShaderModule
3282 				DE_NULL,									// const VkShaderModule								tessellationControlShaderModule
3283 				DE_NULL,									// const VkShaderModule								tessellationEvalShaderModule
3284 				DE_NULL,									// const VkShaderModule								geometryShaderModule
3285 				*fragmentShaderModuleInputAtt,				// const VkShaderModule								fragmentShaderModule
3286 				*renderPass0,								// const VkRenderPass								renderPass
3287 				viewports,									// const std::vector<VkViewport>&					viewports
3288 				scissors,									// const std::vector<VkRect2D>&						scissors
3289 				VK_PRIMITIVE_TOPOLOGY_TRIANGLE_STRIP,		// const VkPrimitiveTopology						topology
3290 				0u,											// const deUint32									subpass
3291 				0u,											// const deUint32									patchControlPoints
3292 				&vertexInputState,							// const VkPipelineVertexInputStateCreateInfo*		vertexInputStateCreateInfo
3293 				DE_NULL,									// const VkPipelineRasterizationStateCreateInfo*	rasterizationStateCreateInfo
3294 				DE_NULL,									// const VkPipelineMultisampleStateCreateInfo*		multisampleStateCreateInfo
3295 				DE_NULL,									// const VkPipelineDepthStencilStateCreateInfo*		depthStencilStateCreateInfo
3296 				&colorBlendState);							// const VkPipelineColorBlendStateCreateInfo*		colorBlendStateCreateInfo
3297 
3298 		pipelineImageSampler = makeGraphicsPipeline(vkd,	// const DeviceInterface&							vk
3299 				device,										// const VkDevice									device
3300 				*pipelineLayoutImageSampler,				// const VkPipelineLayout							pipelineLayout
3301 				*vertexShaderModule,						// const VkShaderModule								vertexShaderModule
3302 				DE_NULL,									// const VkShaderModule								tessellationControlShaderModule
3303 				DE_NULL,									// const VkShaderModule								tessellationEvalShaderModule
3304 				DE_NULL,									// const VkShaderModule								geometryShaderModule
3305 				*fragmentShaderModuleSampler,				// const VkShaderModule								fragmentShaderModule
3306 				*renderPass1,								// const VkRenderPass								renderPass
3307 				viewports,									// const std::vector<VkViewport>&					viewports
3308 				scissors,									// const std::vector<VkRect2D>&						scissors
3309 				VK_PRIMITIVE_TOPOLOGY_TRIANGLE_STRIP,		// const VkPrimitiveTopology						topology
3310 				0u,											// const deUint32									subpass
3311 				0u,											// const deUint32									patchControlPoints
3312 				&vertexInputState,							// const VkPipelineVertexInputStateCreateInfo*		vertexInputStateCreateInfo
3313 				DE_NULL,									// const VkPipelineRasterizationStateCreateInfo*	rasterizationStateCreateInfo
3314 				DE_NULL,									// const VkPipelineMultisampleStateCreateInfo*		multisampleStateCreateInfo
3315 				DE_NULL,									// const VkPipelineDepthStencilStateCreateInfo*		depthStencilStateCreateInfo
3316 				&colorBlendState);							// const VkPipelineColorBlendStateCreateInfo*		colorBlendStateCreateInfo
3317 	}
3318 
3319 	// Create framebuffers.
3320 	{
3321 		const VkFramebufferCreateInfo	framebufferCreateInfo	=
3322 		{
3323 			VK_STRUCTURE_TYPE_FRAMEBUFFER_CREATE_INFO,	// VkStructureType			sType
3324 			DE_NULL,									// const void*				pNext
3325 			0u,											// VkFramebufferCreateFlags	flags
3326 			*renderPass0,								// VkRenderPass				renderPass
3327 			1u,											// uint32_t					attachmentCount
3328 			&imageViewInput.get(),						// const VkImageView*		pAttachments
3329 			256u,										// uint32_t					width
3330 			256u,										// uint32_t					height
3331 			1u											// uint32_t					layers
3332 		};
3333 
3334 		framebuffer0 = vk::createFramebuffer(vkd, device, &framebufferCreateInfo);
3335 	}
3336 	{
3337 		const VkFramebufferCreateInfo	framebufferCreateInfo	=
3338 		{
3339 			VK_STRUCTURE_TYPE_FRAMEBUFFER_CREATE_INFO,	// VkStructureType			sType
3340 			DE_NULL,									// const void*				pNext
3341 			0u,											// VkFramebufferCreateFlags	flags
3342 			*renderPass1,								// VkRenderPass				renderPass
3343 			1u,											// uint32_t					attachmentCount
3344 			&imageViewResult.get(),						// const VkImageView*		pAttachments
3345 			m_width,									// uint32_t					width
3346 			m_height,									// uint32_t					height
3347 			1u											// uint32_t					layers
3348 		};
3349 
3350 		framebuffer1 = vk::createFramebuffer(vkd, device, &framebufferCreateInfo);
3351 	}
3352 
3353 	// Generate quad vertices.
3354 	{
3355 		const tcu::Vec4	lowerLeftVertex		(-1.0f, -1.0f, 0.5f, 1.0f);
3356 		const tcu::Vec4	lowerRightVertex	(1.0f, -1.0f, 0.5f, 1.0f);
3357 		const tcu::Vec4	upperLeftVertex		(-1.0f, 1.0f, 0.5f, 1.0f);
3358 		const tcu::Vec4	upperRightVertex	(1.0f, 1.0f, 0.5f, 1.0f);
3359 
3360 		vertexData.push_back(lowerLeftVertex);
3361 		vertexData.push_back(upperLeftVertex);
3362 		vertexData.push_back(lowerRightVertex);
3363 		vertexData.push_back(upperRightVertex);
3364 	}
3365 
3366 	// Upload vertex data.
3367 	{
3368 		const size_t				vertexDataSize		= vertexData.size() * sizeof(Vec4);
3369 
3370 		const VkBufferCreateInfo	vertexBufferParams	=
3371 		{
3372 			VK_STRUCTURE_TYPE_BUFFER_CREATE_INFO,	//	VkStructureType		sType
3373 			DE_NULL,								//	const void*			pNext
3374 			0u,										//	VkBufferCreateFlags	flags
3375 			(VkDeviceSize)vertexDataSize,			//	VkDeviceSize		size
3376 			VK_BUFFER_USAGE_VERTEX_BUFFER_BIT,		//	VkBufferUsageFlags	usage
3377 			VK_SHARING_MODE_EXCLUSIVE,				//	VkSharingMode		sharingMode
3378 			1u,										//	deUint32			queueFamilyCount
3379 			&queueFamilyIndex,						//	const deUint32*		pQueueFamilyIndices
3380 		};
3381 
3382 		vertexBuffer		= createBuffer(vkd, m_context.getDevice(), &vertexBufferParams);
3383 		vertexBufferMemory	= createBufferMemory(vkd, device, m_context.getDefaultAllocator(), *vertexBuffer);
3384 
3385 		deMemcpy(vertexBufferMemory->getHostPtr(), vertexData.data(), vertexDataSize);
3386 		flushAlloc(vkd, device, *vertexBufferMemory);
3387 	}
3388 
3389 	beginCommandBuffer(vkd, *commandBuffer);
3390 
3391 	// Begin render pass.
3392 	{
3393 		const VkRect2D				renderArea	=
3394 		{
3395 			{ 0u, 0u },				// VkOffset2D	offset
3396 			{ m_width, m_height }	// VkExtent2D	extent
3397 		};
3398 
3399 		const VkClearValue			clearValue	= makeClearValueColor(Vec4(0.0f, 0.0f, 0.0f, 0.0f));
3400 
3401 		const VkRenderPassBeginInfo	beginInfo	=
3402 		{
3403 			VK_STRUCTURE_TYPE_RENDER_PASS_BEGIN_INFO,	// VkStructureType		sType
3404 			DE_NULL,									// const void*			pNext
3405 			*renderPass0,								// VkRenderPass			renderPass
3406 			*framebuffer0,								// VkFramebuffer		framebuffer
3407 			renderArea,									// VkRect2D				renderArea
3408 			1u,											// uint32_t				clearValueCount
3409 			&clearValue									// const VkClearValue*	pClearValues
3410 		};
3411 
3412 		RenderpassSubpass::cmdBeginRenderPass(vkd, *commandBuffer, &beginInfo, &subpassBeginInfo);
3413 	}
3414 
3415 	// Bind pipeline.
3416 	vkd.cmdBindPipeline(*commandBuffer, VK_PIPELINE_BIND_POINT_GRAPHICS, *pipelineSolidColor);
3417 
3418 	// Bind vertex buffer.
3419 	const VkDeviceSize bindingOffset = 0;
3420 	vkd.cmdBindVertexBuffers(*commandBuffer, 0u, 1u, &vertexBuffer.get(), &bindingOffset);
3421 
3422 	// Bind descriptor set.
3423 	vkd.cmdBindDescriptorSets(*commandBuffer, VK_PIPELINE_BIND_POINT_GRAPHICS, *pipelineLayoutInput, 0u, 1u, &*descriptorSetInput, 0u, DE_NULL);
3424 
3425 	// Draw solid color.
3426 	vkd.cmdDraw(*commandBuffer, 4u, 1u, 0u, 0u);
3427 
3428 	// Bind pipeline.
3429 	vkd.cmdBindPipeline(*commandBuffer, VK_PIPELINE_BIND_POINT_GRAPHICS, *pipelineInputAtt);
3430 
3431 	// Bind descriptor set.
3432 	vkd.cmdBindDescriptorSets(*commandBuffer, VK_PIPELINE_BIND_POINT_GRAPHICS, *pipelineLayoutInput, 0u, 1u, &*descriptorSetInput, 0u, DE_NULL);
3433 
3434 	// Pipeline barrier to handle self dependency.
3435 	{
3436 		const VkImageMemoryBarrier imageBarrier =
3437 		{
3438 			VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER,			// VkStructureType			sType
3439 			DE_NULL,										// const void*				pNext
3440 			VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT,			// VkAccessFlags			srcAccessMask
3441 			VK_ACCESS_INPUT_ATTACHMENT_READ_BIT,			// VkAccessFlags			dstAccessMask
3442 			VK_IMAGE_LAYOUT_GENERAL,						// VkImageLayout			oldLayout
3443 			VK_IMAGE_LAYOUT_GENERAL,						// VkImageLayout			newLayout
3444 			VK_QUEUE_FAMILY_IGNORED,						// uint32_t					srcQueueFamilyIndex
3445 			VK_QUEUE_FAMILY_IGNORED,						// uint32_t					dstQueueFamilyIndex
3446 			*colorImage,									// VkImage					image
3447 			{ VK_IMAGE_ASPECT_COLOR_BIT, 0u, 1u, 0u, 1u }	// VkImageSubresourceRange	subresourceRange
3448 		};
3449 
3450 		vkd.cmdPipelineBarrier(*commandBuffer, VK_PIPELINE_STAGE_COLOR_ATTACHMENT_OUTPUT_BIT, VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT, VK_DEPENDENCY_BY_REGION_BIT, 0u, DE_NULL, 0u, DE_NULL, 1u, &imageBarrier);
3451 	}
3452 
3453 	// Draw. Adds (0.1, 0.2, 0.0, 0.0) to the previous result.
3454 	vkd.cmdDraw(*commandBuffer, 4u, 1u, 0u, 0u);
3455 
3456 	// End render pass.
3457 	RenderpassSubpass::cmdEndRenderPass(vkd, *commandBuffer, &subpassEndInfo);
3458 
3459 	// Pipeline barrier.
3460 	{
3461 		const VkImageMemoryBarrier imageBarriers[] =
3462 		{
3463 			{
3464 				VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER,			// VkStructureType			sType
3465 				DE_NULL,										// const void*				pNext
3466 				VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT
3467 				| VK_ACCESS_TRANSFER_WRITE_BIT
3468 				| VK_ACCESS_HOST_WRITE_BIT,						// VkAccessFlags			srcAccessMask
3469 				VK_ACCESS_SHADER_READ_BIT,						// VkAccessFlags			dstAccessMask
3470 				VK_IMAGE_LAYOUT_GENERAL,						// VkImageLayout			oldLayout
3471 				VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL,		// VkImageLayout			newLayout
3472 				VK_QUEUE_FAMILY_IGNORED,						// uint32_t					srcQueueFamilyIndex
3473 				VK_QUEUE_FAMILY_IGNORED,						// uint32_t					dstQueueFamilyIndex
3474 				*colorImage,									// VkImage					image
3475 				{ VK_IMAGE_ASPECT_COLOR_BIT, 0u, 1u, 0u, 1u }	// VkImageSubresourceRange	subresourceRange
3476 			},
3477 			{
3478 				VK_STRUCTURE_TYPE_IMAGE_MEMORY_BARRIER,			// VkStructureType			sType
3479 				DE_NULL,										// const void*				pNext
3480 				VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT,			// VkAccessFlags			srcAccessMask
3481 				VK_ACCESS_COLOR_ATTACHMENT_READ_BIT
3482 				| VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT,			// VkAccessFlags			dstAccessMask
3483 				VK_IMAGE_LAYOUT_COLOR_ATTACHMENT_OPTIMAL,		// VkImageLayout			oldLayout
3484 				VK_IMAGE_LAYOUT_COLOR_ATTACHMENT_OPTIMAL,		// VkImageLayout			newLayout
3485 				VK_QUEUE_FAMILY_IGNORED,						// uint32_t					srcQueueFamilyIndex
3486 				VK_QUEUE_FAMILY_IGNORED,						// uint32_t					dstQueueFamilyIndex
3487 				*resultImage,									// VkImage					image
3488 				{ VK_IMAGE_ASPECT_COLOR_BIT, 0u, 1u, 0u, 1u }	// VkImageSubresourceRange	subresourceRange
3489 			}
3490 		};
3491 
3492 		vkd.cmdPipelineBarrier(*commandBuffer, VK_PIPELINE_STAGE_COLOR_ATTACHMENT_OUTPUT_BIT | VK_PIPELINE_STAGE_ALL_COMMANDS_BIT, VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT | VK_PIPELINE_STAGE_COLOR_ATTACHMENT_OUTPUT_BIT, 0u, 0u, DE_NULL, 0u, DE_NULL, 2u, imageBarriers);
3493 	}
3494 
3495 	// Begin render pass.
3496 	{
3497 		const VkRect2D				renderArea	=
3498 		{
3499 			{ 0, 0 },	            // VkOffset2D	offset
3500 			{ m_width, m_height }	// VkExtent2D	extent
3501 		};
3502 
3503 		const VkRenderPassBeginInfo	beginInfo	=
3504 		{
3505 			VK_STRUCTURE_TYPE_RENDER_PASS_BEGIN_INFO,	// VkStructureType		sType
3506 			DE_NULL,									// const void*			pNext
3507 			*renderPass1,								// VkRenderPass			renderPass
3508 			*framebuffer1,								// VkFramebuffer		framebuffer
3509 			renderArea,									// VkRect2D				renderArea
3510 			0u,											// uint32_t				clearValueCount
3511 			DE_NULL										// const VkClearValue*	pClearValues
3512 		};
3513 
3514 		RenderpassSubpass::cmdBeginRenderPass(vkd, *commandBuffer, &beginInfo, &subpassBeginInfo);
3515 	}
3516 
3517 	// Bind pipeline.
3518 	vkd.cmdBindPipeline(*commandBuffer, VK_PIPELINE_BIND_POINT_GRAPHICS, *pipelineImageSampler);
3519 
3520 	// Bind descriptor set.
3521 	vkd.cmdBindDescriptorSets(*commandBuffer, VK_PIPELINE_BIND_POINT_GRAPHICS, *pipelineLayoutImageSampler, 0u, 1u, &*descriptorSetImageSampler, 0u, DE_NULL);
3522 
3523 	// Draw. Samples the previous results and adds (0.1, 0.2, 0.0, 0.0).
3524 	vkd.cmdDraw(*commandBuffer, 4u, 1u, 0u, 0u);
3525 
3526 	// End render pass.
3527 	RenderpassSubpass::cmdEndRenderPass(vkd, *commandBuffer, &subpassEndInfo);
3528 
3529 	// Copy results to a buffer.
3530 	copyImageToBuffer(vkd, *commandBuffer, *resultImage, *resultBuffer, tcu::IVec2(m_width, m_height), VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT, VK_IMAGE_LAYOUT_COLOR_ATTACHMENT_OPTIMAL);
3531 
3532 	endCommandBuffer(vkd, *commandBuffer);
3533 	submitCommandsAndWait(vkd, m_context.getDevice(), m_context.getUniversalQueue(), *commandBuffer);
3534 	invalidateMappedMemoryRange(vkd, m_context.getDevice(), resultBufferMemory->getMemory(), resultBufferMemory->getOffset(), VK_WHOLE_SIZE);
3535 
3536 	// Verify results.
3537 	{
3538 		const tcu::TextureFormat			format			(mapVkFormat(m_format));
3539 		tcu::TextureLevel					reference		(format, m_width, m_height);
3540 		const void* const					ptrResult		(resultBufferMemory->getHostPtr());
3541 		const tcu::ConstPixelBufferAccess	resultAccess	(format, m_width, m_height, 1, ptrResult);
3542 		const PixelBufferAccess				referenceAccess	(reference.getAccess());
3543 
3544 		for (deUint32 x = 0; x < m_width; x++)
3545 			for (deUint32 y = 0; y < m_height; y++)
3546 			{
3547 				referenceAccess.setPixel(tcu::Vec4(0.3f, 0.6f, 0.0f, 1.0f), x, y, 0);
3548 			}
3549 
3550 		if (!tcu::floatThresholdCompare(m_context.getTestContext().getLog(),	// log
3551 										"Rendered result",						// imageSetName
3552 										"",										// imageSetDesc
3553 										referenceAccess,						// reference
3554 										resultAccess,							// result
3555 										Vec4(0.05f),							// threshold
3556 										tcu::COMPARE_LOG_RESULT))				// logMode
3557 		{
3558 			m_resultCollector.fail("Image compare failed.");
3559 		}
3560 	}
3561 
3562 	return tcu::TestStatus(m_resultCollector.getResult(), m_resultCollector.getMessage());
3563 }
3564 
3565 // Shader programs for testing dependencies between render pass instances
3566 struct ExternalPrograms
3567 {
initvkt::__anon104c10a40111::ExternalPrograms3568 	void init (vk::SourceCollections& dst, ExternalTestConfig testConfig) const
3569 	{
3570 		for (size_t renderPassNdx = 0; renderPassNdx < testConfig.renderPasses.size(); renderPassNdx++)
3571 		{
3572 			dst.glslSources.add("quad-vert-" + de::toString(renderPassNdx)) << glu::VertexSource(
3573 				"#version 450\n"
3574 				"layout(location = 0) out highp vec2 vtxTexCoords;\n"
3575 				"highp float;\n"
3576 				"void main (void)\n"
3577 				"{\n"
3578 				"    vec4 position;"
3579 				"    position = vec4(((gl_VertexIndex + 2) / 3) % 2 == 0 ? -1.0 : 1.0,\n"
3580 				"                    ((gl_VertexIndex + 1) / 3) % 2 == 0 ? -1.0 : 1.0, 0.0, 1.0);\n"
3581 				"    gl_Position = position;\n"
3582 				"	vtxTexCoords = position.xy / 2.0 + vec2(0.5);"
3583 				"}\n");
3584 
3585 			// First pass renders four quads of different color
3586 			if (renderPassNdx == 0)
3587 			{
3588 				dst.glslSources.add("quad-frag-" + de::toString(renderPassNdx)) << glu::FragmentSource(
3589 					"#version 450\n"
3590 					"layout(location = 0) in highp vec2 vtxTexCoords;\n"
3591 					"layout(location = 0) out highp vec4 o_color;\n"
3592 					"void main (void)\n"
3593 					"{\n"
3594 					"    if (gl_FragCoord.x <= " + de::toString(testConfig.imageSize.x() / 2) + " && gl_FragCoord.y <= " + de::toString(testConfig.imageSize.y() / 2) + ")\n"
3595 					"        o_color = vec4(1.0, 0.0, 0.0, 1.0);\n"
3596 					"    else if (gl_FragCoord.x > " + de::toString(testConfig.imageSize.x() / 2) + " && gl_FragCoord.y <= " + de::toString(testConfig.imageSize.y() / 2) + ")\n"
3597 					"        o_color = vec4(0.0, 1.0, 0.0, 1.0);\n"
3598 					"    else if (gl_FragCoord.x <= " + de::toString(testConfig.imageSize.x() / 2) + " && gl_FragCoord.y > " + de::toString(testConfig.imageSize.y() / 2) + ")\n"
3599 					"        o_color = vec4(0.0, 0.0, 1.0, 1.0);\n"
3600 					"    else\n"
3601 					"        o_color = vec4(0.0, 0.0, 0.0, 1.0);\n"
3602 					""
3603 					"}\n");
3604 			}
3605 			else
3606 			{
3607 				if (renderPassNdx % 2 == 0)
3608 				{
3609 					// Blur previous pass horizontally
3610 					dst.glslSources.add("quad-frag-" + de::toString(renderPassNdx)) << glu::FragmentSource(
3611 						"#version 450\n"
3612 						"layout(binding = 0) uniform sampler2D previousPass;\n"
3613 						"layout(location = 0) in highp vec2 vtxTexCoords;\n"
3614 						"layout(location = 0) out highp vec4 o_color;\n"
3615 						"void main (void)\n"
3616 						"{\n"
3617 						"    vec2 step = vec2(1.0 / " + de::toString(testConfig.imageSize.x()) + ", 1.0 / " + de::toString(testConfig.imageSize.y()) + ");\n"
3618 						"    vec2 minCoord = vec2(0.0, 0.0);\n"
3619 						"    vec2 maxCoord = vec2(1.0, 1.0);\n"
3620 						"    vec4 blurColor = vec4(0.0);\n"
3621 						"    for(int sampleNdx = 0; sampleNdx < " + de::toString(testConfig.blurKernel + 1) + "; sampleNdx++)\n"
3622 						"    {\n"
3623 						"        vec2 sampleCoord = vec2((vtxTexCoords.x - " + de::toString(testConfig.blurKernel / 2) + " * step.x) + step.x * sampleNdx, vtxTexCoords.y);\n"
3624 						"        blurColor += 0.12 * texture(previousPass, clamp(sampleCoord, minCoord, maxCoord));\n"
3625 						"    }\n"
3626 						"    o_color = blurColor;\n"
3627 						"}\n");
3628 				}
3629 				else
3630 				{
3631 					// Blur previous pass vertically
3632 					dst.glslSources.add("quad-frag-" + de::toString(renderPassNdx)) << glu::FragmentSource(
3633 						"#version 450\n"
3634 						"layout(binding = 0) uniform highp sampler2D previousPass;\n"
3635 						"layout(location = 0) in highp vec2 vtxTexCoords;\n"
3636 						"layout(location = 0) out highp vec4 o_color;\n"
3637 						"void main (void)\n"
3638 						"{\n"
3639 						"    vec2 step = vec2(1.0 / " + de::toString(testConfig.imageSize.x()) + ", 1.0 / " + de::toString(testConfig.imageSize.y()) + ");\n"
3640 						"    vec2 minCoord = vec2(0.0, 0.0);\n"
3641 						"    vec2 maxCoord = vec2(1.0, 1.0);\n"
3642 						"    vec4 blurColor = vec4(0.0);\n"
3643 						"    for(int sampleNdx = 0; sampleNdx < " + de::toString(testConfig.blurKernel + 1) + "; sampleNdx++)\n"
3644 						"    {\n"
3645 						"        vec2 sampleCoord = vec2(vtxTexCoords.x, (vtxTexCoords.y - " + de::toString(testConfig.blurKernel / 2) + " * step.y) + step.y * sampleNdx);\n"
3646 						"        blurColor += 0.12 * texture(previousPass, clamp(sampleCoord, minCoord, maxCoord));\n"
3647 						"    }\n"
3648 						"    o_color = blurColor;\n"
3649 						"}\n");
3650 				}
3651 			}
3652 		}
3653 	}
3654 };
3655 
3656 // Shader programs for testing dependencies between subpasses
3657 struct SubpassPrograms
3658 {
initvkt::__anon104c10a40111::SubpassPrograms3659 	void init (vk::SourceCollections& dst, SubpassTestConfig testConfig) const
3660 	{
3661 		size_t subpassCount = testConfig.renderPass.getSubpasses().size();
3662 
3663 		for (size_t subpassNdx = 0; subpassNdx < subpassCount; subpassNdx++)
3664 		{
3665 			if (subpassNdx == 0)
3666 			{
3667 				dst.glslSources.add("subpass-vert-" + de::toString(subpassNdx)) << glu::VertexSource(
3668 				"#version 450\n"
3669 				"highp float;\n"
3670 				"layout(location = 0) in highp vec4 position;\n"
3671 				"void main (void)\n"
3672 				"{\n"
3673 				"    gl_Position = position;\n"
3674 				"}\n");
3675 			}
3676 			else
3677 			{
3678 				dst.glslSources.add("subpass-vert-" + de::toString(subpassNdx)) << glu::VertexSource(
3679 					"#version 450\n"
3680 					"highp float;\n"
3681 					"void main (void)\n"
3682 					"{\n"
3683 					"    vec4 position;"
3684 					"    position = vec4(((gl_VertexIndex + 2) / 3) % 2 == 0 ? -1.0 : 1.0,\n"
3685 					"                    ((gl_VertexIndex + 1) / 3) % 2 == 0 ? -1.0 : 1.0, 0.0, 1.0);\n"
3686 					"    gl_Position = position;\n"
3687 					"}\n");
3688 			}
3689 
3690 			if (isDepthStencilFormat(testConfig.format))
3691 			{
3692 				if (subpassNdx == 0)
3693 				{
3694 					// Empty fragment shader: Fragment depth unmodified.
3695 					dst.glslSources.add("subpass-frag-" + de::toString(subpassNdx)) << glu::FragmentSource(
3696 						"#version 450\n"
3697 						"void main (void)\n"
3698 						"{\n"
3699 						"}\n");
3700 				}
3701 				else
3702 				{
3703 					// Use fragment depth from previous depth rendering result.
3704 					dst.glslSources.add("subpass-frag-" + de::toString(subpassNdx)) << glu::FragmentSource(
3705 						"#version 450\n"
3706 						"layout (input_attachment_index = 0, binding = 0) uniform subpassInput depthStencil;\n"
3707 						"void main (void)\n"
3708 						"{\n"
3709 						"    float inputDepth = subpassLoad(depthStencil).x;\n"
3710 						"    gl_FragDepth = inputDepth - 0.02;\n"
3711 						"}\n");
3712 				}
3713 			}
3714 			else
3715 				DE_FATAL("Unimplemented");
3716 		}
3717 	}
3718 };
3719 
3720 // Shader programs for testing backwards subpass self dependency from geometry stage to indirect draw
3721 struct SubpassSelfDependencyBackwardsPrograms
3722 {
initvkt::__anon104c10a40111::SubpassSelfDependencyBackwardsPrograms3723 	void init (vk::SourceCollections& dst, SubpassSelfDependencyBackwardsTestConfig testConfig) const
3724 	{
3725 		DE_UNREF(testConfig);
3726 
3727 		dst.glslSources.add("vert") << glu::VertexSource(
3728 				"#version 450\n"
3729 				"layout(location = 0) in highp vec4 position;\n"
3730 				"out gl_PerVertex {\n"
3731 				"    vec4 gl_Position;\n"
3732 				"};\n"
3733 				"void main (void)\n"
3734 				"{\n"
3735 				"    gl_Position = position;\n"
3736 				"}\n");
3737 
3738 		dst.glslSources.add("geom") << glu::GeometrySource(
3739 				"#version 450\n"
3740 				"layout(points) in;\n"
3741 				"layout(triangle_strip, max_vertices = 4) out;\n"
3742 				"\n"
3743 				"in gl_PerVertex {\n"
3744 				"    vec4 gl_Position;\n"
3745 				"} gl_in[];\n"
3746 				"\n"
3747 				"out gl_PerVertex {\n"
3748 				"    vec4 gl_Position;\n"
3749 				"};\n"
3750 				"layout (binding = 0) buffer IndirectBuffer\n"
3751 				"{\n"
3752 				"    uint vertexCount;\n"
3753 				"    uint instanceCount;\n"
3754 				"    uint firstVertex;\n"
3755 				"    uint firstInstance;\n"
3756 				"} indirectBuffer;\n"
3757 				"\n"
3758 				"void main (void) {\n"
3759 				"    vec4 p = gl_in[0].gl_Position;\n"
3760 				"    float offset = 0.03f;\n"
3761 				"    gl_Position = p + vec4(-offset, offset, 0, 0);\n"
3762 				"    EmitVertex();\n"
3763 				"    gl_Position = p + vec4(-offset, -offset, 0, 0);\n"
3764 				"    EmitVertex();\n"
3765 				"    gl_Position = p + vec4(offset, offset, 0, 0);\n"
3766 				"    EmitVertex();\n"
3767 				"    gl_Position = p + vec4(offset, -offset, 0, 0);\n"
3768 				"    EmitVertex();\n"
3769 				"    EndPrimitive();\n"
3770 				"    indirectBuffer.vertexCount = 64;\n"
3771 				"    indirectBuffer.instanceCount = 1;\n"
3772 				"    indirectBuffer.firstVertex = 64;\n"
3773 				"    indirectBuffer.firstInstance = 0;\n"
3774 				"}\n");
3775 
3776 		dst.glslSources.add("frag") << glu::FragmentSource(
3777 				"#version 450\n"
3778 				"layout(location = 0) out highp vec4 fragColor;\n"
3779 				"void main (void)\n"
3780 				"{\n"
3781 				"    fragColor = vec4(1, 0, 0, 1);\n"
3782 				"}\n");
3783 	}
3784 };
3785 
3786 struct SeparateChannelsPrograms
3787 {
initvkt::__anon104c10a40111::SeparateChannelsPrograms3788 	void init (vk::SourceCollections& dst, SeparateChannelsTestConfig testConfig) const
3789 	{
3790 		dst.glslSources.add("vert") << glu::VertexSource(
3791 				"#version 450\n"
3792 				"layout(location = 0) in highp vec4 position;\n"
3793 				"void main (void)\n"
3794 				"{\n"
3795 				"    gl_Position = position;\n"
3796 				"}\n");
3797 
3798 		if (isDepthStencilFormat(testConfig.format))
3799 		{
3800 			dst.glslSources.add("frag") << glu::FragmentSource(
3801 					"#version 450\n"
3802 					"layout(location = 0) out highp vec4 fragColor;\n"
3803 					"void main (void)\n"
3804 					"{\n"
3805 					"    fragColor = vec4(1);\n"
3806 					"}\n");
3807 		}
3808 		else
3809 		{
3810 			dst.glslSources.add("frag") << glu::FragmentSource(
3811 					"#version 450\n"
3812 					"layout(set = 0, binding = 0, input_attachment_index = 0) uniform subpassInput inputAtt;\n"
3813 					"layout(location = 0) out highp vec4 fragColor;\n"
3814 					"void main (void)\n"
3815 					"{\n"
3816 					"    vec4 inputColor = subpassLoad(inputAtt);\n"
3817 					"    fragColor = vec4(1, 1, inputColor.r + inputColor.g, 1);\n"
3818 					"}\n");
3819 		}
3820 	}
3821 };
3822 
3823 struct SingleAttachmentPrograms
3824 {
initvkt::__anon104c10a40111::SingleAttachmentPrograms3825 	void init (vk::SourceCollections& dst, SingleAttachmentTestConfig testConfig) const
3826 	{
3827 		DE_UNREF(testConfig);
3828 
3829 		dst.glslSources.add("vert") << glu::VertexSource(
3830 				"#version 450\n"
3831 				"layout(location = 0) in highp vec4 position;\n"
3832 				"void main (void)\n"
3833 				"{\n"
3834 				"    gl_Position = position;\n"
3835 				"}\n");
3836 
3837 		dst.glslSources.add("frag_solid_color") << glu::FragmentSource(
3838 				"#version 450\n"
3839 				"layout(location = 0) out highp vec4 fragColor;\n"
3840 				"void main (void)\n"
3841 				"{\n"
3842 				"    fragColor = vec4(0.1, 0.2, 0.0, 1.0);\n"
3843 				"}\n");
3844 
3845 		dst.glslSources.add("frag_input_attachment") << glu::FragmentSource(
3846 				"#version 450\n"
3847 				"layout(set = 0, binding = 0, input_attachment_index = 0) uniform subpassInput inputAtt;\n"
3848 				"layout(location = 0) out highp vec4 fragColor;\n"
3849 				"void main (void)\n"
3850 				"{\n"
3851 				"    vec4 inputColor = subpassLoad(inputAtt);\n"
3852 				"    fragColor = inputColor + vec4(0.1, 0.2, 0.0, 0.0);\n"
3853 				"}\n");
3854 
3855 		dst.glslSources.add("frag_combined_image_sampler") << glu::FragmentSource(
3856 				"#version 450\n"
3857 				"layout(set = 0, binding = 0) uniform highp sampler2D tex;\n"
3858 				"layout(location = 0) out highp vec4 fragColor;\n"
3859 				"void main (void)\n"
3860 				"{\n"
3861 				"    vec2 uv = vec2(gl_FragCoord) / 255.0;\n"
3862 				"    vec4 inputColor = texture(tex, uv);\n"
3863 				"    fragColor = inputColor + vec4(0.1, 0.2, 0.0, 0.0);\n"
3864 				"}\n");
3865 	}
3866 };
3867 
formatToName(VkFormat format)3868 std::string formatToName (VkFormat format)
3869 {
3870 	const std::string	formatStr	= de::toString(format);
3871 	const std::string	prefix		= "VK_FORMAT_";
3872 
3873 	DE_ASSERT(formatStr.substr(0, prefix.length()) == prefix);
3874 
3875 	return de::toLower(formatStr.substr(prefix.length()));
3876 }
3877 
initTests(tcu::TestCaseGroup * group,const RenderPassType renderPassType)3878 void initTests (tcu::TestCaseGroup* group, const RenderPassType renderPassType)
3879 {
3880 	tcu::TestContext& testCtx(group->getTestContext());
3881 
3882 	// Test external subpass dependencies
3883 	{
3884 		const deUint32	renderPassCounts[]	= { 2u, 3u, 5u};
3885 
3886 		const UVec2		renderSizes[]		=
3887 		{
3888 			UVec2(64, 64),
3889 			UVec2(128, 128),
3890 			UVec2(512, 512)
3891 		};
3892 
3893 		de::MovePtr<tcu::TestCaseGroup>	externalGroup	(new tcu::TestCaseGroup(testCtx, "external_subpass", "external_subpass"));
3894 
3895 		for (size_t renderSizeNdx = 0; renderSizeNdx < DE_LENGTH_OF_ARRAY(renderSizes); renderSizeNdx++)
3896 		{
3897 			string groupName ("render_size_" + de::toString(renderSizes[renderSizeNdx].x()) + "_" + de::toString(renderSizes[renderSizeNdx].y()));
3898 			de::MovePtr<tcu::TestCaseGroup> renderSizeGroup	(new tcu::TestCaseGroup(testCtx, groupName.c_str(), groupName.c_str()));
3899 
3900 			for (size_t renderPassCountNdx = 0; renderPassCountNdx < DE_LENGTH_OF_ARRAY(renderPassCounts); renderPassCountNdx++)
3901 			{
3902 				vector<RenderPass>	renderPasses;
3903 
3904 				for (size_t renderPassNdx = 0; renderPassNdx < renderPassCounts[renderPassCountNdx]; renderPassNdx++)
3905 				{
3906 					vector<Attachment>			attachments;
3907 					vector<AttachmentReference>	colorAttachmentReferences;
3908 
3909 					const VkFormat				format				(VK_FORMAT_R8G8B8A8_UNORM);
3910 					const VkSampleCountFlagBits	sampleCount			(VK_SAMPLE_COUNT_1_BIT);
3911 					const VkAttachmentLoadOp	loadOp				(VK_ATTACHMENT_LOAD_OP_DONT_CARE);
3912 					const VkAttachmentStoreOp	storeOp				(VK_ATTACHMENT_STORE_OP_STORE);
3913 					const VkAttachmentLoadOp	stencilLoadOp		(VK_ATTACHMENT_LOAD_OP_DONT_CARE);
3914 					const VkAttachmentStoreOp	stencilStoreOp		(VK_ATTACHMENT_STORE_OP_DONT_CARE);
3915 					const VkImageLayout			initialLayout		(VK_IMAGE_LAYOUT_UNDEFINED);
3916 					const VkImageLayout			finalLayout			(VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL);
3917 					const VkImageLayout			subpassLayout		(VK_IMAGE_LAYOUT_COLOR_ATTACHMENT_OPTIMAL);
3918 
3919 					attachments.push_back(Attachment(format, sampleCount, loadOp, storeOp, stencilLoadOp, stencilStoreOp, initialLayout, finalLayout));
3920 					colorAttachmentReferences.push_back(AttachmentReference((deUint32)0, subpassLayout));
3921 
3922 					const VkImageLayout			depthStencilLayout	(VK_IMAGE_LAYOUT_GENERAL);
3923 					const vector<Subpass>		subpasses			(1, Subpass(VK_PIPELINE_BIND_POINT_GRAPHICS, 0u, vector<AttachmentReference>(), colorAttachmentReferences, vector<AttachmentReference>(),
3924 																		AttachmentReference(VK_ATTACHMENT_UNUSED, depthStencilLayout), vector<deUint32>()));
3925 					vector<SubpassDependency>	deps;
3926 
3927 					deps.push_back(SubpassDependency(VK_SUBPASS_EXTERNAL,										// deUint32				srcPass
3928 													 0,															// deUint32				dstPass
3929 													 VK_PIPELINE_STAGE_COLOR_ATTACHMENT_OUTPUT_BIT,				// VkPipelineStageFlags	srcStageMask
3930 													 VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT | VK_PIPELINE_STAGE_COLOR_ATTACHMENT_OUTPUT_BIT,						// VkPipelineStageFlags	dstStageMask
3931 													 VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT,						// VkAccessFlags		srcAccessMask
3932 													 VK_ACCESS_SHADER_READ_BIT | VK_ACCESS_SHADER_WRITE_BIT | VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT,	// VkAccessFlags		dstAccessMask
3933 													 0));														// VkDependencyFlags	flags
3934 
3935 					deps.push_back(SubpassDependency(0,															// deUint32				srcPass
3936 													 VK_SUBPASS_EXTERNAL,										// deUint32				dstPass
3937 													 VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT | VK_PIPELINE_STAGE_COLOR_ATTACHMENT_OUTPUT_BIT,						// VkPipelineStageFlags	srcStageMask
3938 													 VK_PIPELINE_STAGE_COLOR_ATTACHMENT_OUTPUT_BIT,				// VkPipelineStageFlags	dstStageMask
3939 													 VK_ACCESS_SHADER_READ_BIT | VK_ACCESS_SHADER_WRITE_BIT | VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT,	// VkAccessFlags		srcAccessMask
3940 													 VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT,						// VkAccessFlags		dstAccessMask
3941 													 0));														// VkDependencyFlags	flags
3942 
3943 					RenderPass					renderPass			(attachments, subpasses, deps);
3944 
3945 					renderPasses.push_back(renderPass);
3946 				}
3947 
3948 				const deUint32		blurKernel	(12u);
3949 				string				testName	("render_passes_" + de::toString(renderPassCounts[renderPassCountNdx]));
3950 				ExternalTestConfig	testConfig
3951 				{
3952 					VK_FORMAT_R8G8B8A8_UNORM,
3953 					renderSizes[renderSizeNdx],
3954 					renderPasses,
3955 					renderPassType,
3956 					SYNCHRONIZATION_TYPE_LEGACY,
3957 					blurKernel
3958 				};
3959 
3960 				renderSizeGroup->addChild(new InstanceFactory1<ExternalDependencyTestInstance, ExternalTestConfig, ExternalPrograms>(testCtx, tcu::NODETYPE_SELF_VALIDATE, testName.c_str(), testName.c_str(), testConfig));
3961 				if (renderPassType == RENDERPASS_TYPE_RENDERPASS2)
3962 				{
3963 					testName += "_sync_2";
3964 					testConfig.synchronizationType = SYNCHRONIZATION_TYPE_SYNCHRONIZATION2;
3965 					renderSizeGroup->addChild(new InstanceFactory1<ExternalDependencyTestInstance, ExternalTestConfig, ExternalPrograms>(testCtx, tcu::NODETYPE_SELF_VALIDATE, testName.c_str(), testName.c_str(), testConfig));
3966 				}
3967 			}
3968 
3969 			externalGroup->addChild(renderSizeGroup.release());
3970 		}
3971 
3972 		group->addChild(externalGroup.release());
3973 	}
3974 
3975 	// Test implicit subpass dependencies
3976 	{
3977 		const deUint32					renderPassCounts[]		= { 2u, 3u, 5u };
3978 
3979 		de::MovePtr<tcu::TestCaseGroup>	implicitGroup			(new tcu::TestCaseGroup(testCtx, "implicit_dependencies", "implicit_dependencies"));
3980 
3981 		for (size_t renderPassCountNdx = 0; renderPassCountNdx < DE_LENGTH_OF_ARRAY(renderPassCounts); renderPassCountNdx++)
3982 		{
3983 			vector<RenderPass> renderPasses;
3984 
3985 			for (size_t renderPassNdx = 0; renderPassNdx < renderPassCounts[renderPassCountNdx]; renderPassNdx++)
3986 			{
3987 				vector<Attachment>			attachments;
3988 				vector<AttachmentReference>	colorAttachmentReferences;
3989 
3990 				const VkFormat				format					(VK_FORMAT_R8G8B8A8_UNORM);
3991 				const VkSampleCountFlagBits	sampleCount				(VK_SAMPLE_COUNT_1_BIT);
3992 				const VkAttachmentLoadOp	loadOp					(VK_ATTACHMENT_LOAD_OP_DONT_CARE);
3993 				const VkAttachmentStoreOp	storeOp					(VK_ATTACHMENT_STORE_OP_STORE);
3994 				const VkAttachmentLoadOp	stencilLoadOp			(VK_ATTACHMENT_LOAD_OP_DONT_CARE);
3995 				const VkAttachmentStoreOp	stencilStoreOp			(VK_ATTACHMENT_STORE_OP_DONT_CARE);
3996 				const VkImageLayout			initialLayout			(VK_IMAGE_LAYOUT_UNDEFINED);
3997 				const VkImageLayout			finalLayout				(VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL);
3998 				const VkImageLayout			subpassLayout			(VK_IMAGE_LAYOUT_COLOR_ATTACHMENT_OPTIMAL);
3999 
4000 				attachments.push_back(Attachment(format, sampleCount, loadOp, storeOp, stencilLoadOp, stencilStoreOp, initialLayout, finalLayout));
4001 				colorAttachmentReferences.push_back(AttachmentReference((deUint32)0, subpassLayout));
4002 
4003 				const VkImageLayout			depthStencilLayout		(VK_IMAGE_LAYOUT_GENERAL);
4004 				const vector<Subpass>		subpasses				(1, Subpass(VK_PIPELINE_BIND_POINT_GRAPHICS, 0u, vector<AttachmentReference>(), colorAttachmentReferences, vector<AttachmentReference>(), AttachmentReference(VK_ATTACHMENT_UNUSED, depthStencilLayout), vector<deUint32>()));
4005 				vector<SubpassDependency>	deps;
4006 
4007 				// The first render pass lets the implementation add all subpass dependencies implicitly.
4008 				// On the following passes only the dependency from external to first subpass is defined as
4009 				// we need to make sure we have the image ready from previous render pass. In this case
4010 				// the dependency from subpass 0 to external is added implicitly by the implementation.
4011 				if (renderPassNdx > 0)
4012 				{
4013 					deps.push_back(SubpassDependency(VK_SUBPASS_EXTERNAL,										// deUint32				srcPass
4014 													 0,															// deUint32				dstPass
4015 													 VK_PIPELINE_STAGE_BOTTOM_OF_PIPE_BIT,				// VkPipelineStageFlags	srcStageMask
4016 													 VK_PIPELINE_STAGE_COLOR_ATTACHMENT_OUTPUT_BIT | VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT,						// VkPipelineStageFlags	dstStageMask
4017 													 0,						// VkAccessFlags		srcAccessMask
4018 													 VK_ACCESS_COLOR_ATTACHMENT_WRITE_BIT | VK_ACCESS_SHADER_READ_BIT | VK_ACCESS_SHADER_WRITE_BIT,	// VkAccessFlags		dstAccessMask
4019 													 0));														// VkDependencyFlags	flags
4020 				}
4021 
4022 				RenderPass					renderPass				(attachments, subpasses, deps);
4023 
4024 				renderPasses.push_back(renderPass);
4025 			}
4026 
4027 			const deUint32				blurKernel	(12u);
4028 			const ExternalTestConfig	testConfig	(VK_FORMAT_R8G8B8A8_UNORM, UVec2(128, 128), renderPasses, renderPassType, SYNCHRONIZATION_TYPE_LEGACY, blurKernel);
4029 			const string				testName	("render_passes_" + de::toString(renderPassCounts[renderPassCountNdx]));
4030 
4031 			implicitGroup->addChild(new InstanceFactory1<ExternalDependencyTestInstance, ExternalTestConfig, ExternalPrograms>(testCtx, tcu::NODETYPE_SELF_VALIDATE, testName.c_str(), testName.c_str(), testConfig));
4032 		}
4033 
4034 		group->addChild(implicitGroup.release());
4035 	}
4036 
4037 	// Test late fragment operations using depth_stencil attachments in multipass rendering
4038 	{
4039 		const UVec2		renderSizes[]		=
4040 		{
4041 			UVec2(32, 32),
4042 			UVec2(64, 64),
4043 			UVec2(128, 128)
4044 		};
4045 
4046 		const deUint32	subpassCounts[]		= { 2u, 3u, 5u };
4047 
4048 		// Implementations must support at least one of the following formats
4049 		// for depth_stencil attachments
4050 		const VkFormat formats[]			=
4051 		{
4052 			VK_FORMAT_D24_UNORM_S8_UINT,
4053 			VK_FORMAT_D32_SFLOAT_S8_UINT
4054 		};
4055 
4056 		de::MovePtr<tcu::TestCaseGroup>	lateFragmentTestsGroup (new tcu::TestCaseGroup(testCtx, "late_fragment_tests", "wait for late fragment tests"));
4057 
4058 		for (size_t renderSizeNdx = 0; renderSizeNdx < DE_LENGTH_OF_ARRAY(renderSizes); renderSizeNdx++)
4059 		{
4060 			string							renderSizeGroupName	("render_size_" + de::toString(renderSizes[renderSizeNdx].x()) + "_" + de::toString(renderSizes[renderSizeNdx].y()));
4061 			de::MovePtr<tcu::TestCaseGroup>	renderSizeGroup		(new tcu::TestCaseGroup(testCtx, renderSizeGroupName.c_str(), renderSizeGroupName.c_str()));
4062 
4063 			for (size_t subpassCountNdx = 0; subpassCountNdx < DE_LENGTH_OF_ARRAY(subpassCounts); subpassCountNdx++)
4064 			{
4065 				string							subpassGroupName	("subpass_count_" + de::toString(subpassCounts[subpassCountNdx]));
4066 				de::MovePtr<tcu::TestCaseGroup>	subpassCountGroup	(new tcu::TestCaseGroup(testCtx, subpassGroupName.c_str(), subpassGroupName.c_str()));
4067 
4068 				for (size_t formatNdx = 0; formatNdx < DE_LENGTH_OF_ARRAY(formats); formatNdx++)
4069 				{
4070 					const deUint32				subpassCount	(subpassCounts[subpassCountNdx]);
4071 					const deUint32				attachmentCount	(subpassCount);
4072 					vector<Subpass>				subpasses;
4073 					vector<Attachment>			attachments;
4074 					vector<SubpassDependency>	deps;
4075 
4076 					// Attachments
4077 					for (size_t attachmentNdx = 0; attachmentNdx < attachmentCount; attachmentNdx++)
4078 					{
4079 						const VkFormat				format						(formats[formatNdx]);
4080 						const VkSampleCountFlagBits	sampleCount					(VK_SAMPLE_COUNT_1_BIT);
4081 						const VkAttachmentLoadOp	loadOp						(VK_ATTACHMENT_LOAD_OP_CLEAR);
4082 						const VkAttachmentStoreOp	storeOp						((attachmentNdx == attachmentCount - 1)
4083 																					? VK_ATTACHMENT_STORE_OP_STORE
4084 																					: VK_ATTACHMENT_STORE_OP_DONT_CARE);
4085 						const VkAttachmentLoadOp	stencilLoadOp				(VK_ATTACHMENT_LOAD_OP_CLEAR);
4086 						const VkAttachmentStoreOp	stencilStoreOp				((attachmentNdx == attachmentCount - 1)
4087 																					? VK_ATTACHMENT_STORE_OP_STORE
4088 																					: VK_ATTACHMENT_STORE_OP_DONT_CARE);
4089 						const VkImageLayout			initialLayout				(VK_IMAGE_LAYOUT_UNDEFINED);
4090 						const VkImageLayout			finalLayout					(VK_IMAGE_LAYOUT_DEPTH_STENCIL_READ_ONLY_OPTIMAL);
4091 
4092 						attachments.push_back(Attachment(format, sampleCount, loadOp, storeOp, stencilLoadOp, stencilStoreOp, initialLayout, finalLayout));
4093 					}
4094 
4095 					// Subpasses
4096 					for (size_t subpassNdx = 0; subpassNdx < subpassCount; subpassNdx++)
4097 					{
4098 						vector<AttachmentReference>	inputAttachmentReferences;
4099 						const VkImageAspectFlags	inputAttachmentAspectMask	((renderPassType == RENDERPASS_TYPE_RENDERPASS2)
4100 																					? static_cast<VkImageAspectFlags>(VK_IMAGE_ASPECT_DEPTH_BIT)
4101 																					: static_cast<VkImageAspectFlags>(0));
4102 
4103 						// Input attachment references
4104 						if (subpassNdx > 0)
4105 							inputAttachmentReferences.push_back(AttachmentReference((deUint32)subpassNdx - 1, VK_IMAGE_LAYOUT_DEPTH_STENCIL_READ_ONLY_OPTIMAL, inputAttachmentAspectMask));
4106 
4107 						subpasses.push_back(Subpass(VK_PIPELINE_BIND_POINT_GRAPHICS, 0u, inputAttachmentReferences, vector<AttachmentReference>(), vector<AttachmentReference>(), AttachmentReference((deUint32)subpassNdx, VK_IMAGE_LAYOUT_DEPTH_STENCIL_ATTACHMENT_OPTIMAL), vector<deUint32>()));
4108 
4109 						// Subpass dependencies from current subpass to previous subpass.
4110 						// Subpasses will wait for the late fragment operations before reading the contents
4111 						// of previous subpass.
4112 						if (subpassNdx > 0)
4113 						{
4114 							deps.push_back(SubpassDependency((deUint32)subpassNdx - 1,							// deUint32				srcPass
4115 															 (deUint32)subpassNdx,								// deUint32				dstPass
4116 															 VK_PIPELINE_STAGE_LATE_FRAGMENT_TESTS_BIT,			// VkPipelineStageFlags	srcStageMask
4117 															 VK_PIPELINE_STAGE_FRAGMENT_SHADER_BIT
4118 																| VK_PIPELINE_STAGE_LATE_FRAGMENT_TESTS_BIT,	// VkPipelineStageFlags	dstStageMask
4119 															 VK_ACCESS_DEPTH_STENCIL_ATTACHMENT_WRITE_BIT,		// VkAccessFlags		srcAccessMask
4120 															 VK_ACCESS_INPUT_ATTACHMENT_READ_BIT,				// VkAccessFlags		dstAccessMask
4121 															 VK_DEPENDENCY_BY_REGION_BIT));						// VkDependencyFlags	flags
4122 						}
4123 					}
4124 					deps.push_back(SubpassDependency((deUint32)subpassCount - 1,								// deUint32				srcPass
4125 													 VK_SUBPASS_EXTERNAL,										// deUint32				dstPass
4126 													 VK_PIPELINE_STAGE_LATE_FRAGMENT_TESTS_BIT,					// VkPipelineStageFlags	srcStageMask
4127 													 VK_PIPELINE_STAGE_LATE_FRAGMENT_TESTS_BIT,					// VkPipelineStageFlags	dstStageMask
4128 													 VK_ACCESS_DEPTH_STENCIL_ATTACHMENT_WRITE_BIT,				// VkAccessFlags		srcAccessMask
4129 													 VK_ACCESS_DEPTH_STENCIL_ATTACHMENT_READ_BIT | VK_ACCESS_DEPTH_STENCIL_ATTACHMENT_WRITE_BIT, // VkAccessFlags		dstAccessMask
4130 													 VK_DEPENDENCY_BY_REGION_BIT));								// VkDependencyFlags	flags
4131 
4132 					const RenderPass		renderPass	(attachments, subpasses, deps);
4133 					const SubpassTestConfig	testConfig	(formats[formatNdx], renderSizes[renderSizeNdx], renderPass, renderPassType);
4134 					const string			format		(formatToName(formats[formatNdx]).c_str());
4135 
4136 					subpassCountGroup->addChild(new InstanceFactory1<SubpassDependencyTestInstance, SubpassTestConfig, SubpassPrograms>(testCtx, tcu::NODETYPE_SELF_VALIDATE, format, format, testConfig));
4137 				}
4138 
4139 				renderSizeGroup->addChild(subpassCountGroup.release());
4140 			}
4141 
4142 			lateFragmentTestsGroup->addChild(renderSizeGroup.release());
4143 		}
4144 
4145 		group->addChild(lateFragmentTestsGroup.release());
4146 	}
4147 
4148 	// Test subpass self dependency
4149 	{
4150 		const UVec2		renderSizes[]		=
4151 		{
4152 			UVec2(64, 64),
4153 			UVec2(128, 128),
4154 			UVec2(512, 512)
4155 		};
4156 
4157 		de::MovePtr<tcu::TestCaseGroup>	selfDependencyGroup	(new tcu::TestCaseGroup(testCtx, "self_dependency", "self_dependency"));
4158 
4159 		for (size_t renderSizeNdx = 0; renderSizeNdx < DE_LENGTH_OF_ARRAY(renderSizes); renderSizeNdx++)
4160 		{
4161 			string groupName	("render_size_" + de::toString(renderSizes[renderSizeNdx].x()) + "_" + de::toString(renderSizes[renderSizeNdx].y()));
4162 			de::MovePtr<tcu::TestCaseGroup>	renderSizeGroup	(new tcu::TestCaseGroup(testCtx, groupName.c_str(), groupName.c_str()));
4163 
4164 			const SubpassSelfDependencyBackwardsTestConfig	testConfig	(VK_FORMAT_R8G8B8A8_UNORM, renderSizes[renderSizeNdx], renderPassType);
4165 			renderSizeGroup->addChild(new InstanceFactory1<SubpassSelfDependencyBackwardsTestInstance, SubpassSelfDependencyBackwardsTestConfig, SubpassSelfDependencyBackwardsPrograms>(testCtx, tcu::NODETYPE_SELF_VALIDATE, "geometry_to_indirectdraw", "", testConfig));
4166 
4167 			selfDependencyGroup->addChild(renderSizeGroup.release());
4168 		}
4169 
4170 		group->addChild(selfDependencyGroup.release());
4171 	}
4172 
4173 	// Test using a single attachment with reads and writes using separate channels. This should work without subpass self-dependency.
4174 	{
4175 		de::MovePtr<tcu::TestCaseGroup>	separateChannelsGroup	(new tcu::TestCaseGroup(testCtx, "separate_channels", "separate_channels"));
4176 
4177 		struct TestConfig
4178 		{
4179 			string		name;
4180 			VkFormat	format;
4181 		} configs[] =
4182 		{
4183 			{	"r8g8b8a8_unorm",		VK_FORMAT_R8G8B8A8_UNORM		},
4184 			{	"r16g16b16a16_sfloat",	VK_FORMAT_R16G16B16A16_SFLOAT	},
4185 			{	"d24_unorm_s8_uint",	VK_FORMAT_D24_UNORM_S8_UINT		},
4186 			{	"d32_sfloat_s8_uint",	VK_FORMAT_D32_SFLOAT_S8_UINT	}
4187 		};
4188 
4189 		for (deUint32 configIdx = 0; configIdx < DE_LENGTH_OF_ARRAY(configs); configIdx++)
4190 		{
4191 			const SeparateChannelsTestConfig testConfig(configs[configIdx].format, renderPassType);
4192 
4193 			separateChannelsGroup->addChild(new InstanceFactory1<SeparateChannelsTestInstance, SeparateChannelsTestConfig, SeparateChannelsPrograms>(testCtx, tcu::NODETYPE_SELF_VALIDATE, configs[configIdx].name, "", testConfig));
4194 		}
4195 
4196 		group->addChild(separateChannelsGroup.release());
4197 	}
4198 
4199 	// Test using a single attachment for input and output.
4200 	{
4201 		de::MovePtr<tcu::TestCaseGroup>	singleAttachmentGroup	(new tcu::TestCaseGroup(testCtx, "single_attachment", "single_attachment"));
4202 
4203 		struct TestConfig
4204 		{
4205 			string		name;
4206 			VkFormat	format;
4207 		} configs[] =
4208 		{
4209 			{	"r8g8b8a8_unorm",			VK_FORMAT_R8G8B8A8_UNORM		},
4210 			{	"b8g8r8a8_unorm",			VK_FORMAT_B8G8R8A8_UNORM		},
4211 			{	"r16g16b16a16_sfloat",		VK_FORMAT_R16G16B16A16_SFLOAT	},
4212 			{	"r5g6b5_unorm_pack16",		VK_FORMAT_R5G6B5_UNORM_PACK16	},
4213 			{	"a1r5g5b5_unorm_pack16",	VK_FORMAT_A1R5G5B5_UNORM_PACK16	}
4214 		};
4215 
4216 		for (deUint32 configIdx = 0; configIdx < DE_LENGTH_OF_ARRAY(configs); configIdx++)
4217 		{
4218 			const SingleAttachmentTestConfig testConfig(configs[configIdx].format, renderPassType);
4219 
4220 			singleAttachmentGroup->addChild(new InstanceFactory1<SingleAttachmentTestInstance, SingleAttachmentTestConfig, SingleAttachmentPrograms>(testCtx, tcu::NODETYPE_SELF_VALIDATE, configs[configIdx].name, "", testConfig));
4221 		}
4222 
4223 		group->addChild(singleAttachmentGroup.release());
4224 	}
4225 }
4226 } // anonymous
4227 
createRenderPassSubpassDependencyTests(tcu::TestContext & testCtx)4228 tcu::TestCaseGroup* createRenderPassSubpassDependencyTests (tcu::TestContext& testCtx)
4229 {
4230 	return createTestGroup(testCtx, "subpass_dependencies", "Subpass dependency tests", initTests, RENDERPASS_TYPE_LEGACY);
4231 }
4232 
createRenderPass2SubpassDependencyTests(tcu::TestContext & testCtx)4233 tcu::TestCaseGroup* createRenderPass2SubpassDependencyTests (tcu::TestContext& testCtx)
4234 {
4235 	return createTestGroup(testCtx, "subpass_dependencies", "Subpass dependency tests", initTests, RENDERPASS_TYPE_RENDERPASS2);
4236 }
4237 } // vkt
4238