/* Copyright (c) 2015-2020 The Khronos Group Inc.
 * Copyright (c) 2015-2020 Valve Corporation
 * Copyright (c) 2015-2020 LunarG, Inc.
 * Copyright (C) 2015-2020 Google Inc.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 * Author: Chris Forbes <chrisf@ijw.co.nz>
 * Author: Dave Houlton <daveh@lunarg.com>
 */
21
Petr Kraus25810d02019-08-27 17:41:15 +020022#include "shader_validation.h"
23
Chris Forbes47567b72017-06-09 12:09:45 -070024#include <cassert>
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +020025#include <chrono>
Petr Kraus25810d02019-08-27 17:41:15 +020026#include <cinttypes>
Jeff Bolzf234bf82019-11-04 14:07:15 -060027#include <cmath>
Petr Kraus25810d02019-08-27 17:41:15 +020028#include <map>
Chris Forbes47567b72017-06-09 12:09:45 -070029#include <sstream>
Petr Kraus25810d02019-08-27 17:41:15 +020030#include <string>
31#include <unordered_map>
32#include <vector>
33
Mark Lobodzinski102687e2020-04-28 11:03:28 -060034#include <spirv/unified1/spirv.hpp>
Chris Forbes47567b72017-06-09 12:09:45 -070035#include "vk_loader_platform.h"
36#include "vk_enum_string_helper.h"
Chris Forbes47567b72017-06-09 12:09:45 -070037#include "vk_layer_data.h"
38#include "vk_layer_extension_utils.h"
39#include "vk_layer_utils.h"
Mark Lobodzinskib56bbb92019-02-18 11:49:59 -070040#include "chassis.h"
Chris Forbes47567b72017-06-09 12:09:45 -070041#include "core_validation.h"
Petr Kraus25810d02019-08-27 17:41:15 +020042
Chris Forbes4ae55b32017-06-09 14:42:56 -070043#include "spirv-tools/libspirv.h"
Chris Forbes9a61e082017-07-24 15:35:29 -070044#include "xxhash.h"
Chris Forbes47567b72017-06-09 12:09:45 -070045
Chris Forbes8a6d8cb2019-02-14 14:33:08 -080046void decoration_set::add(uint32_t decoration, uint32_t value) {
47 switch (decoration) {
48 case spv::DecorationLocation:
49 flags |= location_bit;
50 location = value;
51 break;
52 case spv::DecorationPatch:
53 flags |= patch_bit;
54 break;
55 case spv::DecorationRelaxedPrecision:
56 flags |= relaxed_precision_bit;
57 break;
58 case spv::DecorationBlock:
59 flags |= block_bit;
60 break;
61 case spv::DecorationBufferBlock:
62 flags |= buffer_block_bit;
63 break;
64 case spv::DecorationComponent:
65 flags |= component_bit;
66 component = value;
67 break;
68 case spv::DecorationInputAttachmentIndex:
69 flags |= input_attachment_index_bit;
70 input_attachment_index = value;
71 break;
72 case spv::DecorationDescriptorSet:
73 flags |= descriptor_set_bit;
74 descriptor_set = value;
75 break;
76 case spv::DecorationBinding:
77 flags |= binding_bit;
78 binding = value;
79 break;
80 case spv::DecorationNonWritable:
81 flags |= nonwritable_bit;
82 break;
83 case spv::DecorationBuiltIn:
84 flags |= builtin_bit;
85 builtin = value;
86 break;
87 }
88}
89
// Numeric class of a format or shader type. Each value is a distinct bit so that classes can be OR'd together
// (GetFormatType does this for combined depth/stencil formats).
enum FORMAT_TYPE {
    FORMAT_TYPE_FLOAT = 1 << 0,  // UNORM, SNORM, FLOAT, USCALED, SSCALED, SRGB -- anything we consider float in the shader
    FORMAT_TYPE_SINT = 1 << 1,
    FORMAT_TYPE_UINT = 1 << 2,
};
95
// Key for interface-variable maps: (location, component).
using location_t = std::pair<unsigned, unsigned>;
97
Chris Forbes47567b72017-06-09 12:09:45 -070098static shader_stage_attributes shader_stage_attribs[] = {
Ari Suonpaa696b3432019-03-11 14:02:57 +020099 {"vertex shader", false, false, VK_SHADER_STAGE_VERTEX_BIT},
100 {"tessellation control shader", true, true, VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT},
101 {"tessellation evaluation shader", true, false, VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT},
102 {"geometry shader", true, false, VK_SHADER_STAGE_GEOMETRY_BIT},
103 {"fragment shader", false, false, VK_SHADER_STAGE_FRAGMENT_BIT},
Chris Forbes47567b72017-06-09 12:09:45 -0700104};
105
John Zulauf14c355b2019-06-27 16:09:37 -0600106unsigned ExecutionModelToShaderStageFlagBits(unsigned mode);
107
Chris Forbes47567b72017-06-09 12:09:45 -0700108// SPIRV utility functions
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600109void SHADER_MODULE_STATE::BuildDefIndex() {
locke-lunargde3f0fa2020-09-10 11:55:31 -0600110 function_set func_set = {};
111 EntryPoint *entry_point = nullptr;
112
Chris Forbes47567b72017-06-09 12:09:45 -0700113 for (auto insn : *this) {
locke-lunargde3f0fa2020-09-10 11:55:31 -0600114 // offset is not 0, it means it's updated and the offset is in a Function.
115 if (func_set.offset)
116 func_set.op_lists.insert({insn.opcode(), insn.offset()});
117 else if (entry_point) {
118 entry_point->decorate_list.insert({insn.opcode(), insn.offset()});
119 }
120
Chris Forbes47567b72017-06-09 12:09:45 -0700121 switch (insn.opcode()) {
122 // Types
123 case spv::OpTypeVoid:
124 case spv::OpTypeBool:
125 case spv::OpTypeInt:
126 case spv::OpTypeFloat:
127 case spv::OpTypeVector:
128 case spv::OpTypeMatrix:
129 case spv::OpTypeImage:
130 case spv::OpTypeSampler:
131 case spv::OpTypeSampledImage:
132 case spv::OpTypeArray:
133 case spv::OpTypeRuntimeArray:
134 case spv::OpTypeStruct:
135 case spv::OpTypeOpaque:
136 case spv::OpTypePointer:
137 case spv::OpTypeFunction:
138 case spv::OpTypeEvent:
139 case spv::OpTypeDeviceEvent:
140 case spv::OpTypeReserveId:
141 case spv::OpTypeQueue:
142 case spv::OpTypePipe:
Shannon McPherson0fa28232018-11-01 11:59:02 -0600143 case spv::OpTypeAccelerationStructureNV:
Jeff Bolze4356752019-03-07 11:23:46 -0600144 case spv::OpTypeCooperativeMatrixNV:
Chris Forbes47567b72017-06-09 12:09:45 -0700145 def_index[insn.word(1)] = insn.offset();
146 break;
147
148 // Fixed constants
149 case spv::OpConstantTrue:
150 case spv::OpConstantFalse:
151 case spv::OpConstant:
152 case spv::OpConstantComposite:
153 case spv::OpConstantSampler:
154 case spv::OpConstantNull:
155 def_index[insn.word(2)] = insn.offset();
156 break;
157
158 // Specialization constants
159 case spv::OpSpecConstantTrue:
160 case spv::OpSpecConstantFalse:
161 case spv::OpSpecConstant:
162 case spv::OpSpecConstantComposite:
163 case spv::OpSpecConstantOp:
164 def_index[insn.word(2)] = insn.offset();
165 break;
166
167 // Variables
168 case spv::OpVariable:
169 def_index[insn.word(2)] = insn.offset();
170 break;
171
172 // Functions
173 case spv::OpFunction:
174 def_index[insn.word(2)] = insn.offset();
locke-lunargde3f0fa2020-09-10 11:55:31 -0600175 func_set.id = insn.word(2);
176 func_set.offset = insn.offset();
177 func_set.op_lists.clear();
Chris Forbes47567b72017-06-09 12:09:45 -0700178 break;
179
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800180 // Decorations
181 case spv::OpDecorate: {
182 auto targetId = insn.word(1);
183 decorations[targetId].add(insn.word(2), insn.len() > 3u ? insn.word(3) : 0u);
184 } break;
185 case spv::OpGroupDecorate: {
186 auto const &src = decorations[insn.word(1)];
187 for (auto i = 2u; i < insn.len(); i++) decorations[insn.word(i)].merge(src);
188 } break;
189
John Zulauf14c355b2019-06-27 16:09:37 -0600190 // Entry points ... add to the entrypoint table
191 case spv::OpEntryPoint: {
192 // Entry points do not have an id (the id is the function id) and thus need their own table
193 auto entrypoint_name = (char const *)&insn.word(3);
194 auto execution_model = insn.word(1);
195 auto entrypoint_stage = ExecutionModelToShaderStageFlagBits(execution_model);
locke-lunargde3f0fa2020-09-10 11:55:31 -0600196 entry_points.emplace(entrypoint_name,
197 EntryPoint{insn.offset(), static_cast<VkShaderStageFlagBits>(entrypoint_stage)});
198
199 auto range = entry_points.equal_range(entrypoint_name);
200 for (auto it = range.first; it != range.second; ++it) {
201 if (it->second.offset == insn.offset()) {
202 entry_point = &(it->second);
203 break;
204 }
205 }
206 assert(entry_point != nullptr);
207 break;
208 }
209 case spv::OpFunctionEnd: {
210 assert(entry_point != nullptr);
211 func_set.length = insn.offset() - func_set.offset;
212 entry_point->function_set_list.emplace_back(func_set);
John Zulauf14c355b2019-06-27 16:09:37 -0600213 break;
214 }
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800215
Chris Forbes47567b72017-06-09 12:09:45 -0700216 default:
217 // We don't care about any other defs for now.
218 break;
219 }
220 }
221}
222
Jeff Bolz105d6492018-09-29 15:46:44 -0500223unsigned ExecutionModelToShaderStageFlagBits(unsigned mode) {
224 switch (mode) {
225 case spv::ExecutionModelVertex:
226 return VK_SHADER_STAGE_VERTEX_BIT;
227 case spv::ExecutionModelTessellationControl:
228 return VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT;
229 case spv::ExecutionModelTessellationEvaluation:
230 return VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT;
231 case spv::ExecutionModelGeometry:
232 return VK_SHADER_STAGE_GEOMETRY_BIT;
233 case spv::ExecutionModelFragment:
234 return VK_SHADER_STAGE_FRAGMENT_BIT;
235 case spv::ExecutionModelGLCompute:
236 return VK_SHADER_STAGE_COMPUTE_BIT;
Shannon McPherson0fa28232018-11-01 11:59:02 -0600237 case spv::ExecutionModelRayGenerationNV:
Eric Werness30127fd2018-10-31 21:01:03 -0700238 return VK_SHADER_STAGE_RAYGEN_BIT_NV;
Shannon McPherson0fa28232018-11-01 11:59:02 -0600239 case spv::ExecutionModelAnyHitNV:
Eric Werness30127fd2018-10-31 21:01:03 -0700240 return VK_SHADER_STAGE_ANY_HIT_BIT_NV;
Shannon McPherson0fa28232018-11-01 11:59:02 -0600241 case spv::ExecutionModelClosestHitNV:
Eric Werness30127fd2018-10-31 21:01:03 -0700242 return VK_SHADER_STAGE_CLOSEST_HIT_BIT_NV;
Shannon McPherson0fa28232018-11-01 11:59:02 -0600243 case spv::ExecutionModelMissNV:
Eric Werness30127fd2018-10-31 21:01:03 -0700244 return VK_SHADER_STAGE_MISS_BIT_NV;
Shannon McPherson0fa28232018-11-01 11:59:02 -0600245 case spv::ExecutionModelIntersectionNV:
Eric Werness30127fd2018-10-31 21:01:03 -0700246 return VK_SHADER_STAGE_INTERSECTION_BIT_NV;
Shannon McPherson0fa28232018-11-01 11:59:02 -0600247 case spv::ExecutionModelCallableNV:
Eric Werness30127fd2018-10-31 21:01:03 -0700248 return VK_SHADER_STAGE_CALLABLE_BIT_NV;
Jeff Bolz105d6492018-09-29 15:46:44 -0500249 case spv::ExecutionModelTaskNV:
250 return VK_SHADER_STAGE_TASK_BIT_NV;
251 case spv::ExecutionModelMeshNV:
252 return VK_SHADER_STAGE_MESH_BIT_NV;
253 default:
254 return 0;
255 }
256}
257
locke-lunargde3f0fa2020-09-10 11:55:31 -0600258const SHADER_MODULE_STATE::EntryPoint *FindEntrypointStruct(SHADER_MODULE_STATE const *src, char const *name,
259 VkShaderStageFlagBits stageBits) {
260 auto range = src->entry_points.equal_range(name);
261 for (auto it = range.first; it != range.second; ++it) {
262 if (it->second.stage == stageBits) {
263 return &(it->second);
264 }
265 }
266 return nullptr;
267}
268
locke-lunargd9a069d2019-09-17 01:50:19 -0600269spirv_inst_iter FindEntrypoint(SHADER_MODULE_STATE const *src, char const *name, VkShaderStageFlagBits stageBits) {
John Zulauf14c355b2019-06-27 16:09:37 -0600270 auto range = src->entry_points.equal_range(name);
271 for (auto it = range.first; it != range.second; ++it) {
272 if (it->second.stage == stageBits) {
273 return src->at(it->second.offset);
Chris Forbes47567b72017-06-09 12:09:45 -0700274 }
275 }
Chris Forbes47567b72017-06-09 12:09:45 -0700276 return src->end();
277}
278
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600279static char const *StorageClassName(unsigned sc) {
Chris Forbes47567b72017-06-09 12:09:45 -0700280 switch (sc) {
281 case spv::StorageClassInput:
282 return "input";
283 case spv::StorageClassOutput:
284 return "output";
285 case spv::StorageClassUniformConstant:
286 return "const uniform";
287 case spv::StorageClassUniform:
288 return "uniform";
289 case spv::StorageClassWorkgroup:
290 return "workgroup local";
291 case spv::StorageClassCrossWorkgroup:
292 return "workgroup global";
293 case spv::StorageClassPrivate:
294 return "private global";
295 case spv::StorageClassFunction:
296 return "function";
297 case spv::StorageClassGeneric:
298 return "generic";
299 case spv::StorageClassAtomicCounter:
300 return "atomic counter";
301 case spv::StorageClassImage:
302 return "image";
303 case spv::StorageClassPushConstant:
304 return "push constant";
Chris Forbes9f89d752018-03-07 12:57:48 -0800305 case spv::StorageClassStorageBuffer:
306 return "storage buffer";
Chris Forbes47567b72017-06-09 12:09:45 -0700307 default:
308 return "unknown";
309 }
310}
311
312// Get the value of an integral constant
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600313unsigned GetConstantValue(SHADER_MODULE_STATE const *src, unsigned id) {
Chris Forbes47567b72017-06-09 12:09:45 -0700314 auto value = src->get_def(id);
315 assert(value != src->end());
316
317 if (value.opcode() != spv::OpConstant) {
318 // TODO: Either ensure that the specialization transform is already performed on a module we're
319 // considering here, OR -- specialize on the fly now.
320 return 1;
321 }
322
323 return value.word(3);
324}
325
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600326static void DescribeTypeInner(std::ostringstream &ss, SHADER_MODULE_STATE const *src, unsigned type) {
Chris Forbes47567b72017-06-09 12:09:45 -0700327 auto insn = src->get_def(type);
328 assert(insn != src->end());
329
330 switch (insn.opcode()) {
331 case spv::OpTypeBool:
332 ss << "bool";
333 break;
334 case spv::OpTypeInt:
335 ss << (insn.word(3) ? 's' : 'u') << "int" << insn.word(2);
336 break;
337 case spv::OpTypeFloat:
338 ss << "float" << insn.word(2);
339 break;
340 case spv::OpTypeVector:
341 ss << "vec" << insn.word(3) << " of ";
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600342 DescribeTypeInner(ss, src, insn.word(2));
Chris Forbes47567b72017-06-09 12:09:45 -0700343 break;
344 case spv::OpTypeMatrix:
345 ss << "mat" << insn.word(3) << " of ";
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600346 DescribeTypeInner(ss, src, insn.word(2));
Chris Forbes47567b72017-06-09 12:09:45 -0700347 break;
348 case spv::OpTypeArray:
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600349 ss << "arr[" << GetConstantValue(src, insn.word(3)) << "] of ";
350 DescribeTypeInner(ss, src, insn.word(2));
Chris Forbes47567b72017-06-09 12:09:45 -0700351 break;
Chris Forbes062f1222018-08-21 15:34:15 -0700352 case spv::OpTypeRuntimeArray:
353 ss << "runtime arr[] of ";
354 DescribeTypeInner(ss, src, insn.word(2));
355 break;
Chris Forbes47567b72017-06-09 12:09:45 -0700356 case spv::OpTypePointer:
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600357 ss << "ptr to " << StorageClassName(insn.word(2)) << " ";
358 DescribeTypeInner(ss, src, insn.word(3));
Chris Forbes47567b72017-06-09 12:09:45 -0700359 break;
360 case spv::OpTypeStruct: {
361 ss << "struct of (";
362 for (unsigned i = 2; i < insn.len(); i++) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600363 DescribeTypeInner(ss, src, insn.word(i));
Chris Forbes47567b72017-06-09 12:09:45 -0700364 if (i == insn.len() - 1) {
365 ss << ")";
366 } else {
367 ss << ", ";
368 }
369 }
370 break;
371 }
372 case spv::OpTypeSampler:
373 ss << "sampler";
374 break;
375 case spv::OpTypeSampledImage:
376 ss << "sampler+";
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600377 DescribeTypeInner(ss, src, insn.word(2));
Chris Forbes47567b72017-06-09 12:09:45 -0700378 break;
379 case spv::OpTypeImage:
380 ss << "image(dim=" << insn.word(3) << ", sampled=" << insn.word(7) << ")";
381 break;
Shannon McPherson0fa28232018-11-01 11:59:02 -0600382 case spv::OpTypeAccelerationStructureNV:
Jeff Bolz105d6492018-09-29 15:46:44 -0500383 ss << "accelerationStruture";
384 break;
Chris Forbes47567b72017-06-09 12:09:45 -0700385 default:
386 ss << "oddtype";
387 break;
388 }
389}
390
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600391static std::string DescribeType(SHADER_MODULE_STATE const *src, unsigned type) {
Chris Forbes47567b72017-06-09 12:09:45 -0700392 std::ostringstream ss;
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600393 DescribeTypeInner(ss, src, type);
Chris Forbes47567b72017-06-09 12:09:45 -0700394 return ss.str();
395}
396
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600397static bool IsNarrowNumericType(spirv_inst_iter type) {
Chris Forbes47567b72017-06-09 12:09:45 -0700398 if (type.opcode() != spv::OpTypeInt && type.opcode() != spv::OpTypeFloat) return false;
399 return type.word(2) < 64;
400}
401
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600402static bool TypesMatch(SHADER_MODULE_STATE const *a, SHADER_MODULE_STATE const *b, unsigned a_type, unsigned b_type, bool a_arrayed,
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600403 bool b_arrayed, bool relaxed) {
Chris Forbes47567b72017-06-09 12:09:45 -0700404 // Walk two type trees together, and complain about differences
405 auto a_insn = a->get_def(a_type);
406 auto b_insn = b->get_def(b_type);
407 assert(a_insn != a->end());
408 assert(b_insn != b->end());
409
Chris Forbes062f1222018-08-21 15:34:15 -0700410 // Ignore runtime-sized arrays-- they cannot appear in these interfaces.
411
Chris Forbes47567b72017-06-09 12:09:45 -0700412 if (a_arrayed && a_insn.opcode() == spv::OpTypeArray) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600413 return TypesMatch(a, b, a_insn.word(2), b_type, false, b_arrayed, relaxed);
Chris Forbes47567b72017-06-09 12:09:45 -0700414 }
415
416 if (b_arrayed && b_insn.opcode() == spv::OpTypeArray) {
417 // We probably just found the extra level of arrayness in b_type: compare the type inside it to a_type
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600418 return TypesMatch(a, b, a_type, b_insn.word(2), a_arrayed, false, relaxed);
Chris Forbes47567b72017-06-09 12:09:45 -0700419 }
420
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600421 if (a_insn.opcode() == spv::OpTypeVector && relaxed && IsNarrowNumericType(b_insn)) {
422 return TypesMatch(a, b, a_insn.word(2), b_type, a_arrayed, b_arrayed, false);
Chris Forbes47567b72017-06-09 12:09:45 -0700423 }
424
425 if (a_insn.opcode() != b_insn.opcode()) {
426 return false;
427 }
428
429 if (a_insn.opcode() == spv::OpTypePointer) {
430 // Match on pointee type. storage class is expected to differ
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600431 return TypesMatch(a, b, a_insn.word(3), b_insn.word(3), a_arrayed, b_arrayed, relaxed);
Chris Forbes47567b72017-06-09 12:09:45 -0700432 }
433
434 if (a_arrayed || b_arrayed) {
435 // If we havent resolved array-of-verts by here, we're not going to.
436 return false;
437 }
438
439 switch (a_insn.opcode()) {
440 case spv::OpTypeBool:
441 return true;
442 case spv::OpTypeInt:
443 // Match on width, signedness
444 return a_insn.word(2) == b_insn.word(2) && a_insn.word(3) == b_insn.word(3);
445 case spv::OpTypeFloat:
446 // Match on width
447 return a_insn.word(2) == b_insn.word(2);
448 case spv::OpTypeVector:
449 // Match on element type, count.
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600450 if (!TypesMatch(a, b, a_insn.word(2), b_insn.word(2), a_arrayed, b_arrayed, false)) return false;
451 if (relaxed && IsNarrowNumericType(a->get_def(a_insn.word(2)))) {
Chris Forbes47567b72017-06-09 12:09:45 -0700452 return a_insn.word(3) >= b_insn.word(3);
453 } else {
454 return a_insn.word(3) == b_insn.word(3);
455 }
456 case spv::OpTypeMatrix:
457 // Match on element type, count.
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600458 return TypesMatch(a, b, a_insn.word(2), b_insn.word(2), a_arrayed, b_arrayed, false) &&
Dave Houltona9df0ce2018-02-07 10:51:23 -0700459 a_insn.word(3) == b_insn.word(3);
Chris Forbes47567b72017-06-09 12:09:45 -0700460 case spv::OpTypeArray:
461 // Match on element type, count. these all have the same layout. we don't get here if b_arrayed. This differs from
462 // vector & matrix types in that the array size is the id of a constant instruction, * not a literal within OpTypeArray
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600463 return TypesMatch(a, b, a_insn.word(2), b_insn.word(2), a_arrayed, b_arrayed, false) &&
464 GetConstantValue(a, a_insn.word(3)) == GetConstantValue(b, b_insn.word(3));
Chris Forbes47567b72017-06-09 12:09:45 -0700465 case spv::OpTypeStruct:
466 // Match on all element types
Dave Houltona9df0ce2018-02-07 10:51:23 -0700467 {
468 if (a_insn.len() != b_insn.len()) {
469 return false; // Structs cannot match if member counts differ
Chris Forbes47567b72017-06-09 12:09:45 -0700470 }
Chris Forbes47567b72017-06-09 12:09:45 -0700471
Dave Houltona9df0ce2018-02-07 10:51:23 -0700472 for (unsigned i = 2; i < a_insn.len(); i++) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600473 if (!TypesMatch(a, b, a_insn.word(i), b_insn.word(i), a_arrayed, b_arrayed, false)) {
Dave Houltona9df0ce2018-02-07 10:51:23 -0700474 return false;
475 }
476 }
477
478 return true;
479 }
Chris Forbes47567b72017-06-09 12:09:45 -0700480 default:
481 // Remaining types are CLisms, or may not appear in the interfaces we are interested in. Just claim no match.
482 return false;
483 }
484}
485
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600486static unsigned GetLocationsConsumedByType(SHADER_MODULE_STATE const *src, unsigned type, bool strip_array_level) {
Chris Forbes47567b72017-06-09 12:09:45 -0700487 auto insn = src->get_def(type);
488 assert(insn != src->end());
489
490 switch (insn.opcode()) {
491 case spv::OpTypePointer:
492 // See through the ptr -- this is only ever at the toplevel for graphics shaders we're never actually passing
493 // pointers around.
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600494 return GetLocationsConsumedByType(src, insn.word(3), strip_array_level);
Chris Forbes47567b72017-06-09 12:09:45 -0700495 case spv::OpTypeArray:
496 if (strip_array_level) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600497 return GetLocationsConsumedByType(src, insn.word(2), false);
Chris Forbes47567b72017-06-09 12:09:45 -0700498 } else {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600499 return GetConstantValue(src, insn.word(3)) * GetLocationsConsumedByType(src, insn.word(2), false);
Chris Forbes47567b72017-06-09 12:09:45 -0700500 }
501 case spv::OpTypeMatrix:
502 // Num locations is the dimension * element size
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600503 return insn.word(3) * GetLocationsConsumedByType(src, insn.word(2), false);
Chris Forbes47567b72017-06-09 12:09:45 -0700504 case spv::OpTypeVector: {
505 auto scalar_type = src->get_def(insn.word(2));
506 auto bit_width =
507 (scalar_type.opcode() == spv::OpTypeInt || scalar_type.opcode() == spv::OpTypeFloat) ? scalar_type.word(2) : 32;
508
509 // Locations are 128-bit wide; 3- and 4-component vectors of 64 bit types require two.
510 return (bit_width * insn.word(3) + 127) / 128;
511 }
512 default:
513 // Everything else is just 1.
514 return 1;
515
516 // TODO: extend to handle 64bit scalar types, whose vectors may need multiple locations.
517 }
518}
519
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600520static unsigned GetComponentsConsumedByType(SHADER_MODULE_STATE const *src, unsigned type, bool strip_array_level) {
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +0200521 auto insn = src->get_def(type);
522 assert(insn != src->end());
523
524 switch (insn.opcode()) {
525 case spv::OpTypePointer:
526 // See through the ptr -- this is only ever at the toplevel for graphics shaders we're never actually passing
527 // pointers around.
528 return GetComponentsConsumedByType(src, insn.word(3), strip_array_level);
529 case spv::OpTypeStruct: {
530 uint32_t sum = 0;
531 for (uint32_t i = 2; i < insn.len(); i++) { // i=2 to skip word(0) and word(1)=ID of struct
532 sum += GetComponentsConsumedByType(src, insn.word(i), false);
533 }
534 return sum;
535 }
Jeff Bolze9ee3d82019-05-29 13:45:13 -0500536 case spv::OpTypeArray:
537 if (strip_array_level) {
538 return GetComponentsConsumedByType(src, insn.word(2), false);
539 } else {
540 return GetConstantValue(src, insn.word(3)) * GetComponentsConsumedByType(src, insn.word(2), false);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +0200541 }
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +0200542 case spv::OpTypeMatrix:
543 // Num locations is the dimension * element size
544 return insn.word(3) * GetComponentsConsumedByType(src, insn.word(2), false);
545 case spv::OpTypeVector: {
546 auto scalar_type = src->get_def(insn.word(2));
547 auto bit_width =
548 (scalar_type.opcode() == spv::OpTypeInt || scalar_type.opcode() == spv::OpTypeFloat) ? scalar_type.word(2) : 32;
549 // One component is 32-bit
550 return (bit_width * insn.word(3) + 31) / 32;
551 }
552 case spv::OpTypeFloat: {
553 auto bit_width = insn.word(2);
554 return (bit_width + 31) / 32;
555 }
556 case spv::OpTypeInt: {
557 auto bit_width = insn.word(2);
558 return (bit_width + 31) / 32;
559 }
560 case spv::OpConstant:
561 return GetComponentsConsumedByType(src, insn.word(1), false);
562 default:
563 return 0;
564 }
565}
566
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600567static unsigned GetLocationsConsumedByFormat(VkFormat format) {
Chris Forbes47567b72017-06-09 12:09:45 -0700568 switch (format) {
569 case VK_FORMAT_R64G64B64A64_SFLOAT:
570 case VK_FORMAT_R64G64B64A64_SINT:
571 case VK_FORMAT_R64G64B64A64_UINT:
572 case VK_FORMAT_R64G64B64_SFLOAT:
573 case VK_FORMAT_R64G64B64_SINT:
574 case VK_FORMAT_R64G64B64_UINT:
575 return 2;
576 default:
577 return 1;
578 }
579}
580
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600581static unsigned GetFormatType(VkFormat fmt) {
Dave Houltona9df0ce2018-02-07 10:51:23 -0700582 if (FormatIsSInt(fmt)) return FORMAT_TYPE_SINT;
583 if (FormatIsUInt(fmt)) return FORMAT_TYPE_UINT;
584 if (FormatIsDepthAndStencil(fmt)) return FORMAT_TYPE_FLOAT | FORMAT_TYPE_UINT;
585 if (fmt == VK_FORMAT_UNDEFINED) return 0;
Chris Forbes47567b72017-06-09 12:09:45 -0700586 // everything else -- UNORM/SNORM/FLOAT/USCALED/SSCALED is all float in the shader.
587 return FORMAT_TYPE_FLOAT;
588}
589
590// characterizes a SPIR-V type appearing in an interface to a FF stage, for comparison to a VkFormat's characterization above.
Chris Forbes062f1222018-08-21 15:34:15 -0700591// also used for input attachments, as we statically know their format.
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600592static unsigned GetFundamentalType(SHADER_MODULE_STATE const *src, unsigned type) {
Chris Forbes47567b72017-06-09 12:09:45 -0700593 auto insn = src->get_def(type);
594 assert(insn != src->end());
595
596 switch (insn.opcode()) {
597 case spv::OpTypeInt:
598 return insn.word(3) ? FORMAT_TYPE_SINT : FORMAT_TYPE_UINT;
599 case spv::OpTypeFloat:
600 return FORMAT_TYPE_FLOAT;
601 case spv::OpTypeVector:
Chris Forbes47567b72017-06-09 12:09:45 -0700602 case spv::OpTypeMatrix:
Chris Forbes47567b72017-06-09 12:09:45 -0700603 case spv::OpTypeArray:
Chris Forbes062f1222018-08-21 15:34:15 -0700604 case spv::OpTypeRuntimeArray:
605 case spv::OpTypeImage:
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600606 return GetFundamentalType(src, insn.word(2));
Chris Forbes47567b72017-06-09 12:09:45 -0700607 case spv::OpTypePointer:
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600608 return GetFundamentalType(src, insn.word(3));
Chris Forbes47567b72017-06-09 12:09:45 -0700609
610 default:
611 return 0;
612 }
613}
614
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600615static uint32_t GetShaderStageId(VkShaderStageFlagBits stage) {
Chris Forbes47567b72017-06-09 12:09:45 -0700616 uint32_t bit_pos = uint32_t(u_ffs(stage));
617 return bit_pos - 1;
618}
619
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600620static spirv_inst_iter GetStructType(SHADER_MODULE_STATE const *src, spirv_inst_iter def, bool is_array_of_verts) {
Chris Forbes47567b72017-06-09 12:09:45 -0700621 while (true) {
622 if (def.opcode() == spv::OpTypePointer) {
623 def = src->get_def(def.word(3));
624 } else if (def.opcode() == spv::OpTypeArray && is_array_of_verts) {
625 def = src->get_def(def.word(2));
626 is_array_of_verts = false;
627 } else if (def.opcode() == spv::OpTypeStruct) {
628 return def;
629 } else {
630 return src->end();
631 }
632 }
633}
634
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600635static bool CollectInterfaceBlockMembers(SHADER_MODULE_STATE const *src, std::map<location_t, interface_var> *out,
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800636 bool is_array_of_verts, uint32_t id, uint32_t type_id, bool is_patch,
637 int /*first_location*/) {
Chris Forbes47567b72017-06-09 12:09:45 -0700638 // Walk down the type_id presented, trying to determine whether it's actually an interface block.
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600639 auto type = GetStructType(src, src->get_def(type_id), is_array_of_verts && !is_patch);
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800640 if (type == src->end() || !(src->get_decorations(type.word(1)).flags & decoration_set::block_bit)) {
Chris Forbes47567b72017-06-09 12:09:45 -0700641 // This isn't an interface block.
Chris Forbesa313d772017-06-13 13:59:41 -0700642 return false;
Chris Forbes47567b72017-06-09 12:09:45 -0700643 }
644
645 std::unordered_map<unsigned, unsigned> member_components;
646 std::unordered_map<unsigned, unsigned> member_relaxed_precision;
Chris Forbesa313d772017-06-13 13:59:41 -0700647 std::unordered_map<unsigned, unsigned> member_patch;
Chris Forbes47567b72017-06-09 12:09:45 -0700648
649 // Walk all the OpMemberDecorate for type's result id -- first pass, collect components.
650 for (auto insn : *src) {
651 if (insn.opcode() == spv::OpMemberDecorate && insn.word(1) == type.word(1)) {
652 unsigned member_index = insn.word(2);
653
654 if (insn.word(3) == spv::DecorationComponent) {
655 unsigned component = insn.word(4);
656 member_components[member_index] = component;
657 }
658
659 if (insn.word(3) == spv::DecorationRelaxedPrecision) {
660 member_relaxed_precision[member_index] = 1;
661 }
Chris Forbesa313d772017-06-13 13:59:41 -0700662
663 if (insn.word(3) == spv::DecorationPatch) {
664 member_patch[member_index] = 1;
665 }
Chris Forbes47567b72017-06-09 12:09:45 -0700666 }
667 }
668
Chris Forbesa313d772017-06-13 13:59:41 -0700669 // TODO: correctly handle location assignment from outside
670
Chris Forbes47567b72017-06-09 12:09:45 -0700671 // Second pass -- produce the output, from Location decorations
672 for (auto insn : *src) {
673 if (insn.opcode() == spv::OpMemberDecorate && insn.word(1) == type.word(1)) {
674 unsigned member_index = insn.word(2);
675 unsigned member_type_id = type.word(2 + member_index);
676
677 if (insn.word(3) == spv::DecorationLocation) {
678 unsigned location = insn.word(4);
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600679 unsigned num_locations = GetLocationsConsumedByType(src, member_type_id, false);
Chris Forbes47567b72017-06-09 12:09:45 -0700680 auto component_it = member_components.find(member_index);
681 unsigned component = component_it == member_components.end() ? 0 : component_it->second;
682 bool is_relaxed_precision = member_relaxed_precision.find(member_index) != member_relaxed_precision.end();
Dave Houltona9df0ce2018-02-07 10:51:23 -0700683 bool member_is_patch = is_patch || member_patch.count(member_index) > 0;
Chris Forbes47567b72017-06-09 12:09:45 -0700684
685 for (unsigned int offset = 0; offset < num_locations; offset++) {
686 interface_var v = {};
687 v.id = id;
688 // TODO: member index in interface_var too?
689 v.type_id = member_type_id;
690 v.offset = offset;
Chris Forbesa313d772017-06-13 13:59:41 -0700691 v.is_patch = member_is_patch;
Chris Forbes47567b72017-06-09 12:09:45 -0700692 v.is_block_member = true;
693 v.is_relaxed_precision = is_relaxed_precision;
694 (*out)[std::make_pair(location + offset, component)] = v;
695 }
696 }
697 }
698 }
Chris Forbesa313d772017-06-13 13:59:41 -0700699
700 return true;
Chris Forbes47567b72017-06-09 12:09:45 -0700701}
702
Ari Suonpaa696b3432019-03-11 14:02:57 +0200703static std::vector<uint32_t> FindEntrypointInterfaces(spirv_inst_iter entrypoint) {
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800704 assert(entrypoint.opcode() == spv::OpEntryPoint);
705
Ari Suonpaa696b3432019-03-11 14:02:57 +0200706 std::vector<uint32_t> interfaces;
707 // Find the end of the entrypoint's name string. additional zero bytes follow the actual null terminator, to fill out the
708 // rest of the word - so we only need to look at the last byte in the word to determine which word contains the terminator.
709 uint32_t word = 3;
710 while (entrypoint.word(word) & 0xff000000u) {
711 ++word;
712 }
713 ++word;
714
715 for (; word < entrypoint.len(); word++) interfaces.push_back(entrypoint.word(word));
716
717 return interfaces;
718}
719
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600720static std::map<location_t, interface_var> CollectInterfaceByLocation(SHADER_MODULE_STATE const *src, spirv_inst_iter entrypoint,
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600721 spv::StorageClass sinterface, bool is_array_of_verts) {
Chris Forbes47567b72017-06-09 12:09:45 -0700722 // TODO: handle index=1 dual source outputs from FS -- two vars will have the same location, and we DON'T want to clobber.
723
Chris Forbes47567b72017-06-09 12:09:45 -0700724 std::map<location_t, interface_var> out;
725
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800726 for (uint32_t iid : FindEntrypointInterfaces(entrypoint)) {
727 auto insn = src->get_def(iid);
Chris Forbes47567b72017-06-09 12:09:45 -0700728 assert(insn != src->end());
729 assert(insn.opcode() == spv::OpVariable);
730
731 if (insn.word(3) == static_cast<uint32_t>(sinterface)) {
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800732 auto d = src->get_decorations(iid);
Chris Forbes47567b72017-06-09 12:09:45 -0700733 unsigned id = insn.word(2);
734 unsigned type = insn.word(1);
735
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800736 int location = d.location;
737 int builtin = d.builtin;
738 unsigned component = d.component;
739 bool is_patch = (d.flags & decoration_set::patch_bit) != 0;
740 bool is_relaxed_precision = (d.flags & decoration_set::relaxed_precision_bit) != 0;
Chris Forbes47567b72017-06-09 12:09:45 -0700741
Dave Houltona9df0ce2018-02-07 10:51:23 -0700742 if (builtin != -1)
743 continue;
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800744 else if (!CollectInterfaceBlockMembers(src, &out, is_array_of_verts, id, type, is_patch, location)) {
Chris Forbes47567b72017-06-09 12:09:45 -0700745 // A user-defined interface variable, with a location. Where a variable occupied multiple locations, emit
746 // one result for each.
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600747 unsigned num_locations = GetLocationsConsumedByType(src, type, is_array_of_verts && !is_patch);
Chris Forbes47567b72017-06-09 12:09:45 -0700748 for (unsigned int offset = 0; offset < num_locations; offset++) {
749 interface_var v = {};
750 v.id = id;
751 v.type_id = type;
752 v.offset = offset;
753 v.is_patch = is_patch;
754 v.is_relaxed_precision = is_relaxed_precision;
755 out[std::make_pair(location + offset, component)] = v;
756 }
Chris Forbes47567b72017-06-09 12:09:45 -0700757 }
758 }
759 }
760
761 return out;
762}
763
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600764static std::vector<uint32_t> CollectBuiltinBlockMembers(SHADER_MODULE_STATE const *src, spirv_inst_iter entrypoint,
Ari Suonpaa696b3432019-03-11 14:02:57 +0200765 uint32_t storageClass) {
766 std::vector<uint32_t> variables;
767 std::vector<uint32_t> builtinStructMembers;
768 std::vector<uint32_t> builtinDecorations;
769
770 for (auto insn : *src) {
771 switch (insn.opcode()) {
772 // Find all built-in member decorations
773 case spv::OpMemberDecorate:
774 if (insn.word(3) == spv::DecorationBuiltIn) {
775 builtinStructMembers.push_back(insn.word(1));
776 }
777 break;
778 // Find all built-in decorations
779 case spv::OpDecorate:
780 switch (insn.word(2)) {
781 case spv::DecorationBlock: {
782 uint32_t blockID = insn.word(1);
783 for (auto builtInBlockID : builtinStructMembers) {
784 // Check if one of the members of the block are built-in -> the block is built-in
785 if (blockID == builtInBlockID) {
786 builtinDecorations.push_back(blockID);
787 break;
788 }
789 }
790 break;
791 }
792 case spv::DecorationBuiltIn:
793 builtinDecorations.push_back(insn.word(1));
794 break;
795 default:
796 break;
797 }
798 break;
799 default:
800 break;
801 }
802 }
803
804 // Find all interface variables belonging to the entrypoint and matching the storage class
805 for (uint32_t id : FindEntrypointInterfaces(entrypoint)) {
806 auto def = src->get_def(id);
807 assert(def != src->end());
808 assert(def.opcode() == spv::OpVariable);
809
810 if (def.word(3) == storageClass) variables.push_back(def.word(1));
811 }
812
813 // Find all members belonging to the builtin block selected
814 std::vector<uint32_t> builtinBlockMembers;
815 for (auto &var : variables) {
816 auto def = src->get_def(src->get_def(var).word(3));
817
818 // It could be an array of IO blocks. The element type should be the struct defining the block contents
819 if (def.opcode() == spv::OpTypeArray) def = src->get_def(def.word(2));
820
821 // Now find all members belonging to the struct defining the IO block
822 if (def.opcode() == spv::OpTypeStruct) {
823 for (auto builtInID : builtinDecorations) {
824 if (builtInID == def.word(1)) {
825 for (int i = 2; i < (int)def.len(); i++)
826 builtinBlockMembers.push_back(spv::BuiltInMax); // Start with undefined builtin for each struct member.
827 // These shouldn't be left after replacing.
828 for (auto insn : *src) {
829 if (insn.opcode() == spv::OpMemberDecorate && insn.word(1) == builtInID &&
830 insn.word(3) == spv::DecorationBuiltIn) {
831 auto structIndex = insn.word(2);
832 assert(structIndex < builtinBlockMembers.size());
833 builtinBlockMembers[structIndex] = insn.word(4);
834 }
835 }
836 }
837 }
838 }
839 }
840
841 return builtinBlockMembers;
842}
843
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600844static std::vector<std::pair<uint32_t, interface_var>> CollectInterfaceByInputAttachmentIndex(
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600845 SHADER_MODULE_STATE const *src, std::unordered_set<uint32_t> const &accessible_ids) {
Chris Forbes47567b72017-06-09 12:09:45 -0700846 std::vector<std::pair<uint32_t, interface_var>> out;
847
848 for (auto insn : *src) {
849 if (insn.opcode() == spv::OpDecorate) {
850 if (insn.word(2) == spv::DecorationInputAttachmentIndex) {
851 auto attachment_index = insn.word(3);
852 auto id = insn.word(1);
853
854 if (accessible_ids.count(id)) {
855 auto def = src->get_def(id);
856 assert(def != src->end());
locke-lunarg9a16ebb2020-07-30 16:56:33 -0600857 if (def.opcode() == spv::OpVariable && def.word(3) == spv::StorageClassUniformConstant) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600858 auto num_locations = GetLocationsConsumedByType(src, def.word(1), false);
Chris Forbes47567b72017-06-09 12:09:45 -0700859 for (unsigned int offset = 0; offset < num_locations; offset++) {
860 interface_var v = {};
861 v.id = id;
862 v.type_id = def.word(1);
863 v.offset = offset;
864 out.emplace_back(attachment_index + offset, v);
865 }
866 }
867 }
868 }
869 }
870 }
871
872 return out;
873}
874
locke-lunarg25b6c352020-08-06 17:44:18 -0600875static bool AtomicOperation(uint32_t opcode) {
876 switch (opcode) {
877 case spv::OpAtomicLoad:
878 case spv::OpAtomicStore:
879 case spv::OpAtomicExchange:
880 case spv::OpAtomicCompareExchange:
881 case spv::OpAtomicCompareExchangeWeak:
882 case spv::OpAtomicIIncrement:
883 case spv::OpAtomicIDecrement:
884 case spv::OpAtomicIAdd:
885 case spv::OpAtomicISub:
886 case spv::OpAtomicSMin:
887 case spv::OpAtomicUMin:
888 case spv::OpAtomicSMax:
889 case spv::OpAtomicUMax:
890 case spv::OpAtomicAnd:
891 case spv::OpAtomicOr:
892 case spv::OpAtomicXor:
893 case spv::OpAtomicFAddEXT:
894 return true;
895 default:
896 return false;
897 }
898 return false;
899}
900
locke-lunarg12d20992020-09-21 12:46:49 -0600901bool CheckObjectIDFromOpLoad(uint32_t object_id, const std::vector<unsigned> &operator_members,
902 const std::unordered_map<unsigned, unsigned> &load_members,
903 const std::unordered_map<unsigned, std::pair<unsigned, unsigned>> &accesschain_members) {
904 for (auto load_id : operator_members) {
locke-lunargd3da0422020-09-23 01:02:11 -0600905 if (object_id == load_id) return true;
locke-lunarg12d20992020-09-21 12:46:49 -0600906 auto load_it = load_members.find(load_id);
907 if (load_it == load_members.end()) {
908 continue;
909 }
910 if (load_it->second == object_id) {
911 return true;
912 }
913
914 auto accesschain_it = accesschain_members.find(load_it->second);
915 if (accesschain_it == accesschain_members.end()) {
916 continue;
917 }
918 if (accesschain_it->second.first == object_id) {
919 return true;
920 }
921 }
922 return false;
923}
924
locke-lunargae2a43c2020-09-22 17:21:57 -0600925bool CheckImageOperandsBiasOffset(uint32_t type) {
926 return type & (spv::ImageOperandsBiasMask | spv::ImageOperandsConstOffsetMask | spv::ImageOperandsOffsetMask |
927 spv::ImageOperandsConstOffsetsMask)
928 ? true
929 : false;
930}
931
locke-lunargd3da0422020-09-23 01:02:11 -0600932struct shader_module_used_operators {
933 bool updated;
934 std::vector<unsigned> imagwrite_members;
935 std::vector<unsigned> atomic_members;
936 std::vector<unsigned> store_members;
937 std::vector<unsigned> atomic_store_members;
938 std::vector<unsigned> sampler_implicitLod_dref_proj_members; // sampler Load id
939 std::vector<unsigned> sampler_bias_offset_members; // sampler Load id
940 std::vector<std::pair<unsigned, unsigned>> sampledImage_members;
941 std::unordered_map<unsigned, unsigned> load_members;
942 std::unordered_map<unsigned, std::pair<unsigned, unsigned>> accesschain_members;
943 std::unordered_map<unsigned, unsigned> image_texel_pointer_members;
944
945 shader_module_used_operators() : updated(false) {}
946
947 void update(SHADER_MODULE_STATE const *module) {
948 if (updated) return;
949 updated = true;
950
951 for (auto insn : *module) {
952 switch (insn.opcode()) {
953 case spv::OpImageSampleImplicitLod:
954 case spv::OpImageSampleProjImplicitLod:
955 case spv::OpImageSampleProjExplicitLod:
956 case spv::OpImageSparseSampleImplicitLod:
957 case spv::OpImageSparseSampleProjImplicitLod:
958 case spv::OpImageSparseSampleProjExplicitLod: {
959 sampler_implicitLod_dref_proj_members.emplace_back(insn.word(3)); // Load id
960 // ImageOperands in index: 5
961 if (insn.len() > 5 && CheckImageOperandsBiasOffset(insn.word(5))) {
962 sampler_bias_offset_members.emplace_back(insn.word(3));
963 }
964 break;
965 }
966 case spv::OpImageSampleDrefImplicitLod:
967 case spv::OpImageSampleDrefExplicitLod:
968 case spv::OpImageSampleProjDrefImplicitLod:
969 case spv::OpImageSampleProjDrefExplicitLod:
970 case spv::OpImageSparseSampleDrefImplicitLod:
971 case spv::OpImageSparseSampleDrefExplicitLod:
972 case spv::OpImageSparseSampleProjDrefImplicitLod:
973 case spv::OpImageSparseSampleProjDrefExplicitLod: {
974 sampler_implicitLod_dref_proj_members.emplace_back(insn.word(3)); // Load id
975 // ImageOperands in index: 6
976 if (insn.len() > 6 && CheckImageOperandsBiasOffset(insn.word(6))) {
977 sampler_bias_offset_members.emplace_back(insn.word(3));
978 }
979 break;
980 }
981 case spv::OpImageSampleExplicitLod:
982 case spv::OpImageSparseSampleExplicitLod: {
983 // ImageOperands in index: 5
984 if (insn.len() > 5 && CheckImageOperandsBiasOffset(insn.word(5))) {
985 sampler_bias_offset_members.emplace_back(insn.word(3));
986 }
987 break;
988 }
989 case spv::OpStore: {
990 store_members.emplace_back(insn.word(1)); // object id or AccessChain id
991 break;
992 }
993 case spv::OpImageWrite: {
994 imagwrite_members.emplace_back(insn.word(1)); // Load id
995 break;
996 }
997 case spv::OpSampledImage: {
998 // 3: image load id, 4: sampler load id
999 sampledImage_members.emplace_back(std::pair<unsigned, unsigned>(insn.word(3), insn.word(4)));
1000 break;
1001 }
1002 case spv::OpLoad: {
1003 // 2: Load id, 3: object id or AccessChain id
1004 load_members.insert(std::make_pair(insn.word(2), insn.word(3)));
1005 break;
1006 }
1007 case spv::OpAccessChain: {
locke-lunarg025daa72020-10-13 11:07:51 -06001008 if (insn.len() == 4) {
1009 // If it is for struct, the length is only 4.
1010 // 2: AccessChain id, 3: object id
1011 accesschain_members.insert(std::make_pair(insn.word(2), std::pair<unsigned, unsigned>(insn.word(3), 0)));
1012 } else {
1013 // 2: AccessChain id, 3: object id, 4: object id of array index
1014 accesschain_members.insert(
1015 std::make_pair(insn.word(2), std::pair<unsigned, unsigned>(insn.word(3), insn.word(4))));
1016 }
locke-lunargd3da0422020-09-23 01:02:11 -06001017 break;
1018 }
1019 case spv::OpImageTexelPointer: {
1020 // 2: ImageTexelPointer id, 3: object id
1021 image_texel_pointer_members.insert(std::make_pair(insn.word(2), insn.word(3)));
1022 break;
1023 }
1024 default: {
1025 if (AtomicOperation(insn.opcode())) {
1026 if (insn.opcode() == spv::OpAtomicStore) {
1027 atomic_store_members.emplace_back(insn.word(1)); // ImageTexelPointer id
1028 } else {
1029 atomic_members.emplace_back(insn.word(3)); // ImageTexelPointer id
1030 }
1031 }
1032 break;
1033 }
1034 }
1035 }
1036 }
1037};
1038
locke-lunarg25b6c352020-08-06 17:44:18 -06001039// Check writable, image atomic operation
1040static void IsSpecificDescriptorType(SHADER_MODULE_STATE const *module, const spirv_inst_iter &id_it, bool is_storage_buffer,
locke-lunargd3da0422020-09-23 01:02:11 -06001041 bool is_check_writable, interface_var &out_interface_var,
1042 shader_module_used_operators &used_operators) {
locke-lunarg6f760f12020-06-05 16:19:37 -06001043 uint32_t type_id = id_it.word(1);
locke-lunarg36045992020-08-20 16:54:37 -06001044 unsigned int id = id_it.word(2);
1045
Chris Forbes8af24522018-03-07 11:37:45 -08001046 auto type = module->get_def(type_id);
1047
1048 // Strip off any array or ptrs. Where we remove array levels, adjust the descriptor count for each dimension.
locke-lunarg12d20992020-09-21 12:46:49 -06001049 while (type.opcode() == spv::OpTypeArray || type.opcode() == spv::OpTypePointer || type.opcode() == spv::OpTypeRuntimeArray ||
1050 type.opcode() == spv::OpTypeSampledImage) {
1051 if (type.opcode() == spv::OpTypeArray || type.opcode() == spv::OpTypeRuntimeArray ||
1052 type.opcode() == spv::OpTypeSampledImage) {
Chris Forbes8d31e5d2018-10-08 17:19:15 -07001053 type = module->get_def(type.word(2)); // Element type
Chris Forbes8af24522018-03-07 11:37:45 -08001054 } else {
locke-lunarg36045992020-08-20 16:54:37 -06001055 type = module->get_def(type.word(3)); // Pointer type
Chris Forbes8af24522018-03-07 11:37:45 -08001056 }
1057 }
Chris Forbes8af24522018-03-07 11:37:45 -08001058 switch (type.opcode()) {
1059 case spv::OpTypeImage: {
1060 auto dim = type.word(3);
locke-lunarg36045992020-08-20 16:54:37 -06001061 if (dim != spv::DimSubpassData) {
locke-lunargd3da0422020-09-23 01:02:11 -06001062 used_operators.update(module);
locke-lunarg25b6c352020-08-06 17:44:18 -06001063
locke-lunargd3da0422020-09-23 01:02:11 -06001064 if (CheckObjectIDFromOpLoad(id, used_operators.imagwrite_members, used_operators.load_members,
1065 used_operators.accesschain_members)) {
locke-lunarg25b6c352020-08-06 17:44:18 -06001066 out_interface_var.is_writable = true;
locke-lunarg12d20992020-09-21 12:46:49 -06001067 }
1068 if (CheckObjectIDFromOpLoad(id, used_operators.sampler_implicitLod_dref_proj_members, used_operators.load_members,
1069 used_operators.accesschain_members)) {
1070 out_interface_var.is_sampler_implicitLod_dref_proj = true;
locke-lunarg25b6c352020-08-06 17:44:18 -06001071 }
locke-lunargd3da0422020-09-23 01:02:11 -06001072 if (CheckObjectIDFromOpLoad(id, used_operators.sampler_bias_offset_members, used_operators.load_members,
1073 used_operators.accesschain_members)) {
locke-lunargae2a43c2020-09-22 17:21:57 -06001074 out_interface_var.is_sampler_bias_offset = true;
1075 }
locke-lunargd3da0422020-09-23 01:02:11 -06001076 if (CheckObjectIDFromOpLoad(id, used_operators.atomic_members, used_operators.image_texel_pointer_members,
1077 used_operators.accesschain_members) ||
1078 CheckObjectIDFromOpLoad(id, used_operators.atomic_store_members, used_operators.image_texel_pointer_members,
1079 used_operators.accesschain_members)) {
1080 out_interface_var.is_atomic_operation = true;
1081 }
locke-lunarg25b6c352020-08-06 17:44:18 -06001082
locke-lunargd3da0422020-09-23 01:02:11 -06001083 for (auto &itp_id : used_operators.sampledImage_members) {
locke-lunarg36045992020-08-20 16:54:37 -06001084 // Find if image id match.
1085 uint32_t image_index = 0;
locke-lunargd3da0422020-09-23 01:02:11 -06001086 auto load_it = used_operators.load_members.find(itp_id.first);
1087 if (load_it == used_operators.load_members.end()) {
locke-lunarg36045992020-08-20 16:54:37 -06001088 continue;
1089 } else {
1090 if (load_it->second != id) {
locke-lunargd3da0422020-09-23 01:02:11 -06001091 auto accesschain_it = used_operators.accesschain_members.find(load_it->second);
1092 if (accesschain_it == used_operators.accesschain_members.end()) {
locke-lunarg36045992020-08-20 16:54:37 -06001093 continue;
1094 } else {
1095 if (accesschain_it->second.first != id) {
1096 continue;
1097 }
locke-lunarg025daa72020-10-13 11:07:51 -06001098 if (used_operators.load_members.end() !=
1099 used_operators.load_members.find(accesschain_it->second.second)) {
1100 // image_index isn't a constant, skip.
1101 break;
1102 }
locke-lunarg36045992020-08-20 16:54:37 -06001103 image_index = GetConstantValue(module, accesschain_it->second.second);
1104 }
1105 }
1106 }
1107 // Find sampler's set binding.
locke-lunargd3da0422020-09-23 01:02:11 -06001108 load_it = used_operators.load_members.find(itp_id.second);
1109 if (load_it == used_operators.load_members.end()) {
locke-lunarg36045992020-08-20 16:54:37 -06001110 continue;
1111 } else {
1112 uint32_t sampler_id = load_it->second;
1113 uint32_t sampler_index = 0;
locke-lunargd3da0422020-09-23 01:02:11 -06001114 auto accesschain_it = used_operators.accesschain_members.find(load_it->second);
1115 if (accesschain_it != used_operators.accesschain_members.end()) {
locke-lunarg025daa72020-10-13 11:07:51 -06001116 if (used_operators.load_members.end() !=
1117 used_operators.load_members.find(accesschain_it->second.second)) {
1118 // sampler_index isn't a constant, skip.
1119 break;
1120 }
locke-lunarg36045992020-08-20 16:54:37 -06001121 sampler_id = accesschain_it->second.first;
1122 sampler_index = GetConstantValue(module, accesschain_it->second.second);
1123 }
1124 auto sampler_dec = module->get_decorations(sampler_id);
locke-lunarg654a9052020-10-13 16:28:42 -06001125 if (image_index >= out_interface_var.samplers_used_by_image.size()) {
1126 out_interface_var.samplers_used_by_image.resize(image_index + 1);
1127 }
1128 out_interface_var.samplers_used_by_image[image_index].emplace(
1129 SamplerUsedByImage{descriptor_slot_t{sampler_dec.descriptor_set, sampler_dec.binding}, sampler_index});
locke-lunarg36045992020-08-20 16:54:37 -06001130 }
1131 }
locke-lunarg6f760f12020-06-05 16:19:37 -06001132 }
locke-lunarg25b6c352020-08-06 17:44:18 -06001133 return;
Chris Forbes8af24522018-03-07 11:37:45 -08001134 }
1135
Chris Forbes8d31e5d2018-10-08 17:19:15 -07001136 case spv::OpTypeStruct: {
1137 std::unordered_set<unsigned> nonwritable_members;
Chris Forbes8a6d8cb2019-02-14 14:33:08 -08001138 if (module->get_decorations(type.word(1)).flags & decoration_set::buffer_block_bit) is_storage_buffer = true;
Chris Forbes8af24522018-03-07 11:37:45 -08001139 for (auto insn : *module) {
Chris Forbes8a6d8cb2019-02-14 14:33:08 -08001140 if (insn.opcode() == spv::OpMemberDecorate && insn.word(1) == type.word(1) &&
1141 insn.word(3) == spv::DecorationNonWritable) {
Chris Forbes8d31e5d2018-10-08 17:19:15 -07001142 nonwritable_members.insert(insn.word(2));
Chris Forbes8af24522018-03-07 11:37:45 -08001143 }
1144 }
Chris Forbes8d31e5d2018-10-08 17:19:15 -07001145
1146 // A buffer is writable if it's either flavor of storage buffer, and has any member not decorated
1147 // as nonwritable.
locke-lunarg6f760f12020-06-05 16:19:37 -06001148 if (is_storage_buffer && nonwritable_members.size() != type.len() - 2) {
locke-lunargd3da0422020-09-23 01:02:11 -06001149 used_operators.update(module);
locke-lunarg6f760f12020-06-05 16:19:37 -06001150
locke-lunargd3da0422020-09-23 01:02:11 -06001151 for (auto oid : used_operators.store_members) {
1152 if (id == oid) {
locke-lunarg25b6c352020-08-06 17:44:18 -06001153 out_interface_var.is_writable = true;
1154 return;
1155 }
locke-lunargd3da0422020-09-23 01:02:11 -06001156 auto accesschain_it = used_operators.accesschain_members.find(oid);
1157 if (accesschain_it == used_operators.accesschain_members.end()) {
locke-lunarg25b6c352020-08-06 17:44:18 -06001158 continue;
1159 }
locke-lunargd3da0422020-09-23 01:02:11 -06001160 if (accesschain_it->second.first == id) {
1161 out_interface_var.is_writable = true;
1162 return;
1163 }
1164 }
1165 if (CheckObjectIDFromOpLoad(id, used_operators.atomic_store_members, used_operators.image_texel_pointer_members,
1166 used_operators.accesschain_members)) {
locke-lunarg25b6c352020-08-06 17:44:18 -06001167 out_interface_var.is_writable = true;
1168 return;
locke-lunarg6f760f12020-06-05 16:19:37 -06001169 }
1170 }
Chris Forbes8d31e5d2018-10-08 17:19:15 -07001171 }
Chris Forbes8af24522018-03-07 11:37:45 -08001172 }
Chris Forbes8af24522018-03-07 11:37:45 -08001173}
1174
locke-lunargd9a069d2019-09-17 01:50:19 -06001175std::vector<std::pair<descriptor_slot_t, interface_var>> CollectInterfaceByDescriptorSlot(
locke-lunarg63e4daf2020-08-17 17:53:25 -06001176 SHADER_MODULE_STATE const *src, std::unordered_set<uint32_t> const &accessible_ids, bool *has_writable_descriptor,
1177 bool *has_atomic_descriptor) {
Chris Forbes47567b72017-06-09 12:09:45 -07001178 std::vector<std::pair<descriptor_slot_t, interface_var>> out;
locke-lunargd3da0422020-09-23 01:02:11 -06001179 shader_module_used_operators operators;
1180
Chris Forbes47567b72017-06-09 12:09:45 -07001181 for (auto id : accessible_ids) {
1182 auto insn = src->get_def(id);
1183 assert(insn != src->end());
1184
1185 if (insn.opcode() == spv::OpVariable &&
Chris Forbes9f89d752018-03-07 12:57:48 -08001186 (insn.word(3) == spv::StorageClassUniform || insn.word(3) == spv::StorageClassUniformConstant ||
1187 insn.word(3) == spv::StorageClassStorageBuffer)) {
Chris Forbes8a6d8cb2019-02-14 14:33:08 -08001188 auto d = src->get_decorations(insn.word(2));
1189 unsigned set = d.descriptor_set;
1190 unsigned binding = d.binding;
Chris Forbes47567b72017-06-09 12:09:45 -07001191
1192 interface_var v = {};
1193 v.id = insn.word(2);
1194 v.type_id = insn.word(1);
Chris Forbes8af24522018-03-07 11:37:45 -08001195
locke-lunarg25b6c352020-08-06 17:44:18 -06001196 IsSpecificDescriptorType(src, insn, insn.word(3) == spv::StorageClassStorageBuffer,
locke-lunargd3da0422020-09-23 01:02:11 -06001197 !(d.flags & decoration_set::nonwritable_bit), v, operators);
locke-lunarg63e4daf2020-08-17 17:53:25 -06001198 if (v.is_writable) *has_writable_descriptor = true;
1199 if (v.is_atomic_operation) *has_atomic_descriptor = true;
locke-lunarg654e3692020-06-04 17:19:15 -06001200 out.emplace_back(std::make_pair(set, binding), v);
Chris Forbes47567b72017-06-09 12:09:45 -07001201 }
1202 }
1203
1204 return out;
1205}
1206
locke-lunargde3f0fa2020-09-10 11:55:31 -06001207void DefineStructMember(const SHADER_MODULE_STATE &src, const spirv_inst_iter &it,
1208 const std::vector<uint32_t> &memberDecorate_offsets, shader_struct_member &data) {
1209 const auto struct_it = GetStructType(&src, it, false);
1210 assert(struct_it != src.end());
1211 data.size = 0;
1212
1213 shader_struct_member data1;
1214 uint32_t i = 2;
1215 uint32_t local_offset = 0;
1216 std::vector<uint32_t> offsets;
1217 offsets.resize(struct_it.len() - i);
1218
1219 // The members of struct in SPRIV_R aren't always sort, so we need to know their order.
1220 for (const auto offset : memberDecorate_offsets) {
1221 const auto member_decorate = src.at(offset);
1222 if (member_decorate.word(1) != struct_it.word(1)) {
1223 continue;
1224 }
1225
1226 offsets[member_decorate.word(2)] = member_decorate.word(4);
1227 }
1228
1229 for (const auto offset : offsets) {
1230 local_offset = offset;
1231 data1 = {};
1232 data1.root = data.root;
1233 data1.offset = local_offset;
1234 auto def_member = src.get_def(struct_it.word(i));
1235
1236 // Array could be multi-dimensional
1237 while (def_member.opcode() == spv::OpTypeArray) {
1238 const auto len_id = def_member.word(3);
1239 const auto def_len = src.get_def(len_id);
1240 data1.array_length_hierarchy.emplace_back(def_len.word(3)); // array length
1241 def_member = src.get_def(def_member.word(2));
1242 }
1243
1244 if (def_member.opcode() == spv::OpTypeStruct || def_member.opcode() == spv::OpTypePointer) {
1245 // If it's OpTypePointer. it means the member is a buffer, the type will be TypePointer, and then struct
1246 DefineStructMember(src, def_member, memberDecorate_offsets, data1);
1247 } else {
1248 if (def_member.opcode() == spv::OpTypeMatrix) {
1249 data1.array_length_hierarchy.emplace_back(def_member.word(3)); // matrix's columns. matrix's row is vector.
1250 def_member = src.get_def(def_member.word(2));
1251 }
1252
1253 if (def_member.opcode() == spv::OpTypeVector) {
1254 data1.array_length_hierarchy.emplace_back(def_member.word(3)); // vector length
1255 def_member = src.get_def(def_member.word(2));
1256 }
1257
1258 // Get scalar type size. The value in SPRV-R is bit. It needs to translate to byte.
1259 data1.size = (def_member.word(2) / 8);
1260 }
1261 const auto array_length_hierarchy_szie = data1.array_length_hierarchy.size();
1262 if (array_length_hierarchy_szie > 0) {
1263 data1.array_block_size.resize(array_length_hierarchy_szie, 1);
1264
1265 for (int i2 = static_cast<int>(array_length_hierarchy_szie - 1); i2 > 0; --i2) {
1266 data1.array_block_size[i2 - 1] = data1.array_length_hierarchy[i2] * data1.array_block_size[i2];
1267 }
1268 }
1269 data.struct_members.emplace_back(data1);
1270 ++i;
1271 }
1272 uint32_t total_array_length = 1;
1273 for (const auto length : data1.array_length_hierarchy) {
1274 total_array_length *= length;
1275 }
1276 data.size = local_offset + data1.size * total_array_length;
1277}
1278
1279uint32_t UpdateOffset(uint32_t offset, const std::vector<uint32_t> &array_indices, const shader_struct_member &data) {
1280 int array_indices_size = static_cast<int>(array_indices.size());
1281 if (array_indices_size) {
1282 uint32_t array_index = 0;
1283 uint32_t i = 0;
1284 for (const auto index : array_indices) {
1285 array_index += (data.array_block_size[i] * index);
1286 ++i;
1287 }
1288 offset += (array_index * data.size);
1289 }
1290 return offset;
1291}
1292
1293void SetUsedBytes(uint32_t offset, const std::vector<uint32_t> &array_indices, const shader_struct_member &data) {
1294 int array_indices_size = static_cast<int>(array_indices.size());
1295 uint32_t block_memory_size = data.size;
1296 for (uint32_t i = static_cast<int>(array_indices_size); i < data.array_length_hierarchy.size(); ++i) {
1297 block_memory_size *= data.array_length_hierarchy[i];
1298 }
1299
1300 offset = UpdateOffset(offset, array_indices, data);
1301
1302 uint32_t end = offset + block_memory_size;
1303 auto used_bytes = data.GetUsedbytes();
1304 if (used_bytes->size() < end) {
1305 used_bytes->resize(end, 0);
1306 }
1307 std::memset(used_bytes->data() + offset, true, static_cast<std::size_t>(block_memory_size));
1308}
1309
1310void RunUsedArray(const SHADER_MODULE_STATE &src, uint32_t offset, std::vector<uint32_t> array_indices,
1311 uint32_t access_chain_word_index, spirv_inst_iter &access_chain_it, const shader_struct_member &data) {
1312 if (access_chain_word_index < access_chain_it.len()) {
1313 if (data.array_length_hierarchy.size() > array_indices.size()) {
1314 auto def_it = src.get_def(access_chain_it.word(access_chain_word_index));
1315 ++access_chain_word_index;
1316
1317 if (def_it != src.end() && def_it.opcode() == spv::OpConstant) {
1318 array_indices.emplace_back(def_it.word(3));
1319 RunUsedArray(src, offset, array_indices, access_chain_word_index, access_chain_it, data);
1320 } else {
1321 // If it is a variable, set the all array is used.
1322 if (access_chain_word_index < access_chain_it.len()) {
1323 uint32_t array_length = data.array_length_hierarchy[array_indices.size()];
1324 for (uint32_t i = 0; i < array_length; ++i) {
1325 auto array_indices2 = array_indices;
1326 array_indices2.emplace_back(i);
1327 RunUsedArray(src, offset, array_indices2, access_chain_word_index, access_chain_it, data);
1328 }
1329 } else {
1330 SetUsedBytes(offset, array_indices, data);
1331 }
1332 }
1333 } else {
1334 offset = UpdateOffset(offset, array_indices, data);
1335 RunUsedStruct(src, offset, access_chain_word_index, access_chain_it, data);
1336 }
1337 } else {
1338 SetUsedBytes(offset, array_indices, data);
1339 }
1340}
1341
1342void RunUsedStruct(const SHADER_MODULE_STATE &src, uint32_t offset, uint32_t access_chain_word_index,
1343 spirv_inst_iter &access_chain_it, const shader_struct_member &data) {
1344 std::vector<uint32_t> array_indices_emptry;
1345
1346 if (access_chain_word_index < access_chain_it.len()) {
1347 auto strcut_member_index = GetConstantValue(&src, access_chain_it.word(access_chain_word_index));
1348 ++access_chain_word_index;
1349
1350 auto data1 = data.struct_members[strcut_member_index];
1351 RunUsedArray(src, offset + data1.offset, array_indices_emptry, access_chain_word_index, access_chain_it, data1);
1352 }
1353}
1354
1355void SetUsedStructMember(const SHADER_MODULE_STATE &src, const uint32_t variable_id,
1356 const std::vector<function_set> &function_set_list, const shader_struct_member &data) {
1357 for (const auto &func_set : function_set_list) {
1358 auto range = func_set.op_lists.equal_range(spv::OpAccessChain);
1359 for (auto it = range.first; it != range.second; ++it) {
1360 auto access_chain = src.at(it->second);
1361 if (access_chain.word(3) == variable_id) {
1362 RunUsedStruct(src, 0, 4, access_chain, data);
1363 }
1364 }
1365 }
1366}
1367
1368void SetPushConstantUsedInShader(SHADER_MODULE_STATE &src) {
1369 for (auto &entrypoint : src.entry_points) {
1370 auto range = entrypoint.second.decorate_list.equal_range(spv::OpVariable);
1371 for (auto it = range.first; it != range.second; ++it) {
1372 const auto def_insn = src.at(it->second);
1373
1374 if (def_insn.word(3) == spv::StorageClassPushConstant) {
1375 spirv_inst_iter type = src.get_def(def_insn.word(1));
1376 const auto range2 = entrypoint.second.decorate_list.equal_range(spv::OpMemberDecorate);
1377 std::vector<uint32_t> offsets;
1378
1379 for (auto it2 = range2.first; it2 != range2.second; ++it2) {
1380 auto member_decorate = src.at(it2->second);
1381 if (member_decorate.len() == 5 && member_decorate.word(3) == spv::DecorationOffset) {
1382 offsets.emplace_back(member_decorate.offset());
1383 }
1384 }
1385 entrypoint.second.push_constant_used_in_shader.root = &entrypoint.second.push_constant_used_in_shader;
1386 DefineStructMember(src, type, offsets, entrypoint.second.push_constant_used_in_shader);
1387 SetUsedStructMember(src, def_insn.word(2), entrypoint.second.function_set_list,
1388 entrypoint.second.push_constant_used_in_shader);
1389 }
1390 }
1391 }
1392}
1393
locke-lunarg96dc9632020-06-10 17:22:18 -06001394std::unordered_set<uint32_t> CollectWritableOutputLocationinFS(const SHADER_MODULE_STATE &module,
1395 const VkPipelineShaderStageCreateInfo &stage_info) {
1396 std::unordered_set<uint32_t> location_list;
1397 if (stage_info.stage != VK_SHADER_STAGE_FRAGMENT_BIT) return location_list;
1398 const auto entrypoint = FindEntrypoint(&module, stage_info.pName, stage_info.stage);
1399 const auto outputs = CollectInterfaceByLocation(&module, entrypoint, spv::StorageClassOutput, false);
1400 std::unordered_set<unsigned> store_members;
1401 std::unordered_map<unsigned, unsigned> accesschain_members;
1402
1403 for (auto insn : module) {
1404 switch (insn.opcode()) {
1405 case spv::OpStore:
1406 case spv::OpAtomicStore: {
1407 store_members.insert(insn.word(1)); // object id or AccessChain id
1408 break;
1409 }
1410 case spv::OpAccessChain: {
1411 // 2: AccessChain id, 3: object id
1412 if (insn.word(3)) accesschain_members.insert(std::make_pair(insn.word(2), insn.word(3)));
1413 break;
1414 }
1415 default:
1416 break;
1417 }
1418 }
1419 if (store_members.empty()) {
1420 return location_list;
1421 }
1422 for (auto output : outputs) {
1423 auto store_it = store_members.find(output.second.id);
1424 if (store_it != store_members.end()) {
1425 location_list.insert(output.first.first);
1426 store_members.erase(store_it);
1427 continue;
1428 }
1429 store_it = store_members.begin();
1430 while (store_it != store_members.end()) {
1431 auto accesschain_it = accesschain_members.find(*store_it);
1432 if (accesschain_it == accesschain_members.end()) {
1433 ++store_it;
1434 continue;
1435 }
1436 if (accesschain_it->second == output.second.id) {
1437 location_list.insert(output.first.first);
1438 store_members.erase(store_it);
1439 accesschain_members.erase(accesschain_it);
1440 break;
1441 }
1442 ++store_it;
1443 }
1444 }
1445 return location_list;
1446}
1447
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001448bool CoreChecks::ValidateViConsistency(VkPipelineVertexInputStateCreateInfo const *vi) const {
Chris Forbes47567b72017-06-09 12:09:45 -07001449 // Walk the binding descriptions, which describe the step rate and stride of each vertex buffer. Each binding should
1450 // be specified only once.
1451 std::unordered_map<uint32_t, VkVertexInputBindingDescription const *> bindings;
1452 bool skip = false;
1453
1454 for (unsigned i = 0; i < vi->vertexBindingDescriptionCount; i++) {
1455 auto desc = &vi->pVertexBindingDescriptions[i];
1456 auto &binding = bindings[desc->binding];
1457 if (binding) {
Dave Houlton78d09922018-05-17 15:48:45 -06001458 // TODO: "VUID-VkGraphicsPipelineCreateInfo-pStages-00742" perhaps?
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001459 skip |= LogError(device, kVUID_Core_Shader_InconsistentVi, "Duplicate vertex input binding descriptions for binding %d",
1460 desc->binding);
Chris Forbes47567b72017-06-09 12:09:45 -07001461 } else {
1462 binding = desc;
1463 }
1464 }
1465
1466 return skip;
1467}
1468
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001469bool CoreChecks::ValidateViAgainstVsInputs(VkPipelineVertexInputStateCreateInfo const *vi, SHADER_MODULE_STATE const *vs,
1470 spirv_inst_iter entrypoint) const {
Chris Forbes47567b72017-06-09 12:09:45 -07001471 bool skip = false;
1472
Petr Kraus25810d02019-08-27 17:41:15 +02001473 const auto inputs = CollectInterfaceByLocation(vs, entrypoint, spv::StorageClassInput, false);
Chris Forbes47567b72017-06-09 12:09:45 -07001474
1475 // Build index by location
Petr Kraus25810d02019-08-27 17:41:15 +02001476 std::map<uint32_t, const VkVertexInputAttributeDescription *> attribs;
Chris Forbes47567b72017-06-09 12:09:45 -07001477 if (vi) {
Petr Kraus25810d02019-08-27 17:41:15 +02001478 for (uint32_t i = 0; i < vi->vertexAttributeDescriptionCount; ++i) {
1479 const auto num_locations = GetLocationsConsumedByFormat(vi->pVertexAttributeDescriptions[i].format);
1480 for (uint32_t j = 0; j < num_locations; ++j) {
Chris Forbes47567b72017-06-09 12:09:45 -07001481 attribs[vi->pVertexAttributeDescriptions[i].location + j] = &vi->pVertexAttributeDescriptions[i];
1482 }
1483 }
1484 }
1485
Petr Kraus25810d02019-08-27 17:41:15 +02001486 struct AttribInputPair {
1487 const VkVertexInputAttributeDescription *attrib = nullptr;
1488 const interface_var *input = nullptr;
1489 };
1490 std::map<uint32_t, AttribInputPair> location_map;
1491 for (const auto &attrib_it : attribs) location_map[attrib_it.first].attrib = attrib_it.second;
1492 for (const auto &input_it : inputs) location_map[input_it.first.first].input = &input_it.second;
Chris Forbes47567b72017-06-09 12:09:45 -07001493
Jamie Madillc1f7ca82020-03-16 17:08:26 -04001494 for (const auto &location_it : location_map) {
Petr Kraus25810d02019-08-27 17:41:15 +02001495 const auto location = location_it.first;
1496 const auto attrib = location_it.second.attrib;
1497 const auto input = location_it.second.input;
Mark Lobodzinski7caa39c2018-07-25 15:48:34 -06001498
Petr Kraus25810d02019-08-27 17:41:15 +02001499 if (attrib && !input) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001500 skip |= LogPerformanceWarning(vs->vk_shader_module, kVUID_Core_Shader_OutputNotConsumed,
1501 "Vertex attribute at location %" PRIu32 " not consumed by vertex shader", location);
Petr Kraus25810d02019-08-27 17:41:15 +02001502 } else if (!attrib && input) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001503 skip |= LogError(vs->vk_shader_module, kVUID_Core_Shader_InputNotProduced,
1504 "Vertex shader consumes input at location %" PRIu32 " but not provided", location);
Petr Kraus25810d02019-08-27 17:41:15 +02001505 } else if (attrib && input) {
1506 const auto attrib_type = GetFormatType(attrib->format);
1507 const auto input_type = GetFundamentalType(vs, input->type_id);
Chris Forbes47567b72017-06-09 12:09:45 -07001508
1509 // Type checking
1510 if (!(attrib_type & input_type)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001511 skip |= LogError(vs->vk_shader_module, kVUID_Core_Shader_InterfaceTypeMismatch,
1512 "Attribute type of `%s` at location %" PRIu32 " does not match vertex shader input type of `%s`",
1513 string_VkFormat(attrib->format), location, DescribeType(vs, input->type_id).c_str());
Chris Forbes47567b72017-06-09 12:09:45 -07001514 }
Petr Kraus25810d02019-08-27 17:41:15 +02001515 } else { // !attrib && !input
1516 assert(false); // at least one exists in the map
Chris Forbes47567b72017-06-09 12:09:45 -07001517 }
1518 }
1519
1520 return skip;
1521}
1522
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001523bool CoreChecks::ValidateFsOutputsAgainstRenderPass(SHADER_MODULE_STATE const *fs, spirv_inst_iter entrypoint,
1524 PIPELINE_STATE const *pipeline, uint32_t subpass_index) const {
Petr Kraus25810d02019-08-27 17:41:15 +02001525 bool skip = false;
Chris Forbes8bca1652017-07-20 11:10:09 -07001526
Petr Kraus25810d02019-08-27 17:41:15 +02001527 const auto rpci = pipeline->rp_state->createInfo.ptr();
1528
Jeremy Hayes3699c7c2019-10-09 12:24:55 -06001529 struct Attachment {
1530 const VkAttachmentReference2KHR *reference = nullptr;
1531 const VkAttachmentDescription2KHR *attachment = nullptr;
1532 const interface_var *output = nullptr;
1533 };
1534 std::map<uint32_t, Attachment> location_map;
1535
Petr Kraus25810d02019-08-27 17:41:15 +02001536 const auto subpass = rpci->pSubpasses[subpass_index];
1537 for (uint32_t i = 0; i < subpass.colorAttachmentCount; ++i) {
Jeremy Hayes3699c7c2019-10-09 12:24:55 -06001538 auto const &reference = subpass.pColorAttachments[i];
1539 location_map[i].reference = &reference;
1540 if (reference.attachment != VK_ATTACHMENT_UNUSED &&
1541 rpci->pAttachments[reference.attachment].format != VK_FORMAT_UNDEFINED) {
1542 location_map[i].attachment = &rpci->pAttachments[reference.attachment];
Chris Forbes47567b72017-06-09 12:09:45 -07001543 }
1544 }
1545
Chris Forbes47567b72017-06-09 12:09:45 -07001546 // TODO: dual source blend index (spv::DecIndex, zero if not provided)
1547
Petr Kraus25810d02019-08-27 17:41:15 +02001548 const auto outputs = CollectInterfaceByLocation(fs, entrypoint, spv::StorageClassOutput, false);
Jeremy Hayes3699c7c2019-10-09 12:24:55 -06001549 for (const auto &output_it : outputs) {
1550 auto const location = output_it.first.first;
1551 location_map[location].output = &output_it.second;
1552 }
Chris Forbes47567b72017-06-09 12:09:45 -07001553
Petr Kraus25810d02019-08-27 17:41:15 +02001554 const bool alphaToCoverageEnabled = pipeline->graphicsPipelineCI.pMultisampleState != NULL &&
1555 pipeline->graphicsPipelineCI.pMultisampleState->alphaToCoverageEnable == VK_TRUE;
Chris Forbes47567b72017-06-09 12:09:45 -07001556
Jamie Madillc1f7ca82020-03-16 17:08:26 -04001557 for (const auto &location_it : location_map) {
Jeremy Hayes3699c7c2019-10-09 12:24:55 -06001558 const auto reference = location_it.second.reference;
1559 if (reference != nullptr && reference->attachment == VK_ATTACHMENT_UNUSED) {
1560 continue;
1561 }
1562
Petr Kraus25810d02019-08-27 17:41:15 +02001563 const auto location = location_it.first;
1564 const auto attachment = location_it.second.attachment;
1565 const auto output = location_it.second.output;
Petr Kraus25810d02019-08-27 17:41:15 +02001566 if (attachment && !output) {
1567 if (pipeline->attachments[location].colorWriteMask != 0) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001568 skip |= LogWarning(fs->vk_shader_module, kVUID_Core_Shader_InputNotProduced,
1569 "Attachment %" PRIu32
1570 " not written by fragment shader; undefined values will be written to attachment",
1571 location);
Petr Kraus25810d02019-08-27 17:41:15 +02001572 }
1573 } else if (!attachment && output) {
1574 if (!(alphaToCoverageEnabled && location == 0)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001575 skip |= LogWarning(fs->vk_shader_module, kVUID_Core_Shader_OutputNotConsumed,
1576 "fragment shader writes to output location %" PRIu32 " with no matching attachment", location);
Ari Suonpaa412b23b2019-02-26 07:56:58 +02001577 }
Petr Kraus25810d02019-08-27 17:41:15 +02001578 } else if (attachment && output) {
1579 const auto attachment_type = GetFormatType(attachment->format);
1580 const auto output_type = GetFundamentalType(fs, output->type_id);
Chris Forbes47567b72017-06-09 12:09:45 -07001581
1582 // Type checking
Petr Kraus25810d02019-08-27 17:41:15 +02001583 if (!(output_type & attachment_type)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001584 skip |=
1585 LogWarning(fs->vk_shader_module, kVUID_Core_Shader_InterfaceTypeMismatch,
1586 "Attachment %" PRIu32
1587 " of type `%s` does not match fragment shader output type of `%s`; resulting values are undefined",
1588 location, string_VkFormat(attachment->format), DescribeType(fs, output->type_id).c_str());
Chris Forbes47567b72017-06-09 12:09:45 -07001589 }
Petr Kraus25810d02019-08-27 17:41:15 +02001590 } else { // !attachment && !output
1591 assert(false); // at least one exists in the map
Chris Forbes47567b72017-06-09 12:09:45 -07001592 }
1593 }
1594
Petr Kraus25810d02019-08-27 17:41:15 +02001595 const auto output_zero = location_map.count(0) ? location_map[0].output : nullptr;
1596 bool locationZeroHasAlpha = output_zero && fs->get_def(output_zero->type_id) != fs->end() &&
1597 GetComponentsConsumedByType(fs, output_zero->type_id, false) == 4;
Ari Suonpaa412b23b2019-02-26 07:56:58 +02001598 if (alphaToCoverageEnabled && !locationZeroHasAlpha) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001599 skip |= LogError(fs->vk_shader_module, kVUID_Core_Shader_NoAlphaAtLocation0WithAlphaToCoverage,
1600 "fragment shader doesn't declare alpha output at location 0 even though alpha to coverage is enabled.");
Ari Suonpaa412b23b2019-02-26 07:56:58 +02001601 }
1602
Chris Forbes47567b72017-06-09 12:09:45 -07001603 return skip;
1604}
1605
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06001606// For PointSize analysis we need to know if the variable decorated with the PointSize built-in was actually written to.
1607// This function examines instructions in the static call tree for a write to this variable.
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06001608static bool IsPointSizeWritten(SHADER_MODULE_STATE const *src, spirv_inst_iter builtin_instr, spirv_inst_iter entrypoint) {
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06001609 auto type = builtin_instr.opcode();
1610 uint32_t target_id = builtin_instr.word(1);
1611 bool init_complete = false;
1612
1613 if (type == spv::OpMemberDecorate) {
1614 // Built-in is part of a structure -- examine instructions up to first function body to get initial IDs
1615 auto insn = entrypoint;
1616 while (!init_complete && (insn.opcode() != spv::OpFunction)) {
1617 switch (insn.opcode()) {
1618 case spv::OpTypePointer:
1619 if ((insn.word(3) == target_id) && (insn.word(2) == spv::StorageClassOutput)) {
1620 target_id = insn.word(1);
1621 }
1622 break;
1623 case spv::OpVariable:
1624 if (insn.word(1) == target_id) {
1625 target_id = insn.word(2);
1626 init_complete = true;
1627 }
1628 break;
1629 }
1630 insn++;
1631 }
1632 }
1633
Mark Lobodzinskif84b0b42018-09-11 14:54:32 -06001634 if (!init_complete && (type == spv::OpMemberDecorate)) return false;
1635
1636 bool found_write = false;
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06001637 std::unordered_set<uint32_t> worklist;
1638 worklist.insert(entrypoint.word(2));
1639
1640 // Follow instructions in call graph looking for writes to target
1641 while (!worklist.empty() && !found_write) {
1642 auto id_iter = worklist.begin();
1643 auto id = *id_iter;
1644 worklist.erase(id_iter);
1645
1646 auto insn = src->get_def(id);
1647 if (insn == src->end()) {
1648 continue;
1649 }
1650
1651 if (insn.opcode() == spv::OpFunction) {
1652 // Scan body of function looking for other function calls or items in our ID chain
1653 while (++insn, insn.opcode() != spv::OpFunctionEnd) {
1654 switch (insn.opcode()) {
1655 case spv::OpAccessChain:
1656 if (insn.word(3) == target_id) {
1657 if (type == spv::OpMemberDecorate) {
1658 auto value = GetConstantValue(src, insn.word(4));
1659 if (value == builtin_instr.word(2)) {
1660 target_id = insn.word(2);
1661 }
1662 } else {
1663 target_id = insn.word(2);
1664 }
1665 }
1666 break;
1667 case spv::OpStore:
1668 if (insn.word(1) == target_id) {
1669 found_write = true;
1670 }
1671 break;
1672 case spv::OpFunctionCall:
1673 worklist.insert(insn.word(3));
1674 break;
1675 }
1676 }
1677 }
1678 }
1679 return found_write;
1680}
1681
Chris Forbes47567b72017-06-09 12:09:45 -07001682// For some analyses, we need to know about all ids referenced by the static call tree of a particular entrypoint. This is
1683// important for identifying the set of shader resources actually used by an entrypoint, for example.
1684// Note: we only explore parts of the image which might actually contain ids we care about for the above analyses.
1685// - NOT the shader input/output interfaces.
1686//
1687// TODO: The set of interesting opcodes here was determined by eyeballing the SPIRV spec. It might be worth
1688// converting parts of this to be generated from the machine-readable spec instead.
locke-lunargd9a069d2019-09-17 01:50:19 -06001689std::unordered_set<uint32_t> MarkAccessibleIds(SHADER_MODULE_STATE const *src, spirv_inst_iter entrypoint) {
Chris Forbes47567b72017-06-09 12:09:45 -07001690 std::unordered_set<uint32_t> ids;
1691 std::unordered_set<uint32_t> worklist;
1692 worklist.insert(entrypoint.word(2));
1693
1694 while (!worklist.empty()) {
1695 auto id_iter = worklist.begin();
1696 auto id = *id_iter;
1697 worklist.erase(id_iter);
1698
1699 auto insn = src->get_def(id);
1700 if (insn == src->end()) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06001701 // ID is something we didn't collect in BuildDefIndex. that's OK -- we'll stumble across all kinds of things here
Chris Forbes47567b72017-06-09 12:09:45 -07001702 // that we may not care about.
1703 continue;
1704 }
1705
1706 // Try to add to the output set
1707 if (!ids.insert(id).second) {
1708 continue; // If we already saw this id, we don't want to walk it again.
1709 }
1710
1711 switch (insn.opcode()) {
1712 case spv::OpFunction:
1713 // Scan whole body of the function, enlisting anything interesting
1714 while (++insn, insn.opcode() != spv::OpFunctionEnd) {
1715 switch (insn.opcode()) {
1716 case spv::OpLoad:
Chris Forbes47567b72017-06-09 12:09:45 -07001717 worklist.insert(insn.word(3)); // ptr
1718 break;
1719 case spv::OpStore:
Chris Forbes47567b72017-06-09 12:09:45 -07001720 worklist.insert(insn.word(1)); // ptr
1721 break;
1722 case spv::OpAccessChain:
1723 case spv::OpInBoundsAccessChain:
1724 worklist.insert(insn.word(3)); // base ptr
1725 break;
1726 case spv::OpSampledImage:
1727 case spv::OpImageSampleImplicitLod:
1728 case spv::OpImageSampleExplicitLod:
1729 case spv::OpImageSampleDrefImplicitLod:
1730 case spv::OpImageSampleDrefExplicitLod:
1731 case spv::OpImageSampleProjImplicitLod:
1732 case spv::OpImageSampleProjExplicitLod:
1733 case spv::OpImageSampleProjDrefImplicitLod:
1734 case spv::OpImageSampleProjDrefExplicitLod:
1735 case spv::OpImageFetch:
1736 case spv::OpImageGather:
1737 case spv::OpImageDrefGather:
1738 case spv::OpImageRead:
1739 case spv::OpImage:
1740 case spv::OpImageQueryFormat:
1741 case spv::OpImageQueryOrder:
1742 case spv::OpImageQuerySizeLod:
1743 case spv::OpImageQuerySize:
1744 case spv::OpImageQueryLod:
1745 case spv::OpImageQueryLevels:
1746 case spv::OpImageQuerySamples:
1747 case spv::OpImageSparseSampleImplicitLod:
1748 case spv::OpImageSparseSampleExplicitLod:
1749 case spv::OpImageSparseSampleDrefImplicitLod:
1750 case spv::OpImageSparseSampleDrefExplicitLod:
1751 case spv::OpImageSparseSampleProjImplicitLod:
1752 case spv::OpImageSparseSampleProjExplicitLod:
1753 case spv::OpImageSparseSampleProjDrefImplicitLod:
1754 case spv::OpImageSparseSampleProjDrefExplicitLod:
1755 case spv::OpImageSparseFetch:
1756 case spv::OpImageSparseGather:
1757 case spv::OpImageSparseDrefGather:
1758 case spv::OpImageTexelPointer:
1759 worklist.insert(insn.word(3)); // Image or sampled image
1760 break;
1761 case spv::OpImageWrite:
1762 worklist.insert(insn.word(1)); // Image -- different operand order to above
1763 break;
1764 case spv::OpFunctionCall:
1765 for (uint32_t i = 3; i < insn.len(); i++) {
1766 worklist.insert(insn.word(i)); // fn itself, and all args
1767 }
1768 break;
1769
1770 case spv::OpExtInst:
1771 for (uint32_t i = 5; i < insn.len(); i++) {
1772 worklist.insert(insn.word(i)); // Operands to ext inst
1773 }
1774 break;
locke-lunarg25b6c352020-08-06 17:44:18 -06001775
1776 default: {
1777 if (AtomicOperation(insn.opcode())) {
1778 if (insn.opcode() == spv::OpAtomicStore) {
1779 worklist.insert(insn.word(1)); // ptr
1780 } else {
1781 worklist.insert(insn.word(3)); // ptr
1782 }
1783 }
1784 break;
1785 }
Chris Forbes47567b72017-06-09 12:09:45 -07001786 }
1787 }
1788 break;
1789 }
1790 }
1791
1792 return ids;
1793}
1794
locke-lunargde3f0fa2020-09-10 11:55:31 -06001795// return: 0: pass, 1: not set, 2: not update
1796int CoreChecks::ValidatePushConstantSetUpdate(const std::vector<int8_t> &push_constant_data_update,
1797 const shader_struct_member &push_constant_used_in_shader,
1798 uint32_t &out_issue_index) const {
1799 const auto *used_bytes = push_constant_used_in_shader.GetUsedbytes();
1800 if (used_bytes->size() == 0) {
1801 return 0;
1802 }
1803 uint32_t i = 0;
1804 for (const auto used : *used_bytes) {
1805 if (used) {
1806 if (i >= push_constant_data_update.size() || push_constant_data_update[i] == -1) {
1807 out_issue_index = i;
1808 return 1; // not set
1809 } else if (push_constant_data_update[i] == 0) {
1810 out_issue_index = i;
1811 return 2; // not update
1812 }
1813 }
1814 ++i;
1815 }
1816 return 0; // pass
1817}
1818
1819bool CoreChecks::ValidatePushConstantUsage(const PIPELINE_STATE &pipeline, SHADER_MODULE_STATE const *src,
1820 VkPipelineShaderStageCreateInfo const *pStage) const {
Chris Forbes47567b72017-06-09 12:09:45 -07001821 bool skip = false;
Chris Forbes47567b72017-06-09 12:09:45 -07001822 // Validate directly off the offsets. this isn't quite correct for arrays and matrices, but is a good first step.
locke-lunargde3f0fa2020-09-10 11:55:31 -06001823 const auto *entrypoint = FindEntrypointStruct(src, pStage->pName, pStage->stage);
1824 if (!entrypoint || !entrypoint->push_constant_used_in_shader.IsUsed()) {
1825 return skip;
1826 }
1827 std::vector<VkPushConstantRange> const *push_constant_ranges = pipeline.pipeline_layout->push_constant_ranges.get();
Chris Forbes47567b72017-06-09 12:09:45 -07001828
locke-lunargde3f0fa2020-09-10 11:55:31 -06001829 bool found_stage = false;
1830 for (auto const &range : *push_constant_ranges) {
1831 if (range.stageFlags & pStage->stage) {
1832 found_stage = true;
1833 std::string location_desc;
1834 std::vector<int8_t> push_constant_bytes_set;
1835 if (range.offset > 0) {
1836 push_constant_bytes_set.resize(range.offset, -1);
1837 }
1838 push_constant_bytes_set.resize(range.offset + range.size, 1);
1839 uint32_t issue_index = 0;
1840 int ret = ValidatePushConstantSetUpdate(push_constant_bytes_set, entrypoint->push_constant_used_in_shader, issue_index);
Chris Forbes47567b72017-06-09 12:09:45 -07001841
locke-lunargde3f0fa2020-09-10 11:55:31 -06001842 // "not set" error has been printed in ValidatePushConstantUsage.
1843 if (ret == 1) {
1844 const auto loc_descr = entrypoint->push_constant_used_in_shader.GetLocationDesc(issue_index);
1845 LogObjectList objlist(src->vk_shader_module);
1846 objlist.add(pipeline.pipeline_layout->layout);
1847 skip |= LogError(objlist, kVUID_Core_Shader_PushConstantOutOfRange,
1848 "Push-constant buffer:%s in %s is out of range in %s.", loc_descr.c_str(),
1849 string_VkShaderStageFlags(pStage->stage).c_str(),
1850 report_data->FormatHandle(pipeline.pipeline_layout->layout).c_str());
1851 break;
Chris Forbes47567b72017-06-09 12:09:45 -07001852 }
1853 }
1854 }
1855
locke-lunargde3f0fa2020-09-10 11:55:31 -06001856 if (!found_stage) {
1857 LogObjectList objlist(src->vk_shader_module);
1858 objlist.add(pipeline.pipeline_layout->layout);
1859 skip |= LogError(
1860 objlist, kVUID_Core_Shader_PushConstantOutOfRange, "Push constant is used in %s of %s. But %s doesn't set %s.",
1861 string_VkShaderStageFlags(pStage->stage).c_str(), report_data->FormatHandle(src->vk_shader_module).c_str(),
1862 report_data->FormatHandle(pipeline.pipeline_layout->layout).c_str(), string_VkShaderStageFlags(pStage->stage).c_str());
Chris Forbes47567b72017-06-09 12:09:45 -07001863 }
Chris Forbes47567b72017-06-09 12:09:45 -07001864 return skip;
1865}
1866
sfricke-samsungef2a68c2020-10-26 04:22:46 -07001867bool CoreChecks::ValidateBuiltinLimits(SHADER_MODULE_STATE const *src, const std::unordered_set<uint32_t> &accessible_ids,
1868 VkShaderStageFlagBits stage) const {
1869 bool skip = false;
1870
1871 // Currently all builtin tested are only found in fragment shaders
1872 if (stage != VK_SHADER_STAGE_FRAGMENT_BIT) {
1873 return skip;
1874 }
1875
1876 for (const auto id : accessible_ids) {
1877 auto insn = src->get_def(id);
1878 const decoration_set decorations = src->get_decorations(insn.word(2));
1879
1880 // Built-ins are obtained from OpVariable
1881 if (((decorations.flags & decoration_set::builtin_bit) != 0) && (insn.opcode() == spv::OpVariable)) {
1882 auto type_pointer = src->get_def(insn.word(1));
1883 assert(type_pointer.opcode() == spv::OpTypePointer);
1884
1885 auto type = src->get_def(type_pointer.word(3));
1886 if (type.opcode() == spv::OpTypeArray) {
1887 uint32_t length = static_cast<uint32_t>(GetConstantValue(src, type.word(3)));
1888
1889 switch (decorations.builtin) {
1890 case spv::BuiltInSampleMask:
1891 // Handles both the input and output sampleMask
1892 if (length > phys_dev_props.limits.maxSampleMaskWords) {
1893 skip |= LogError(device, "VUID-VkPipelineShaderStageCreateInfo-maxSampleMaskWords-00711",
1894 "vkCreateGraphicsPipelines(): The BuiltIns SampleMask array sizes is %u which exceeds "
1895 "maxSampleMaskWords of %u in %s.",
1896 length, phys_dev_props.limits.maxSampleMaskWords,
1897 report_data->FormatHandle(src->vk_shader_module).c_str());
1898 }
1899 break;
1900 }
1901 }
1902 }
1903 }
1904
1905 return skip;
1906}
1907
Chris Forbes47567b72017-06-09 12:09:45 -07001908// Validate that data for each specialization entry is fully contained within the buffer.
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001909bool CoreChecks::ValidateSpecializationOffsets(VkPipelineShaderStageCreateInfo const *info) const {
Chris Forbes47567b72017-06-09 12:09:45 -07001910 bool skip = false;
1911
1912 VkSpecializationInfo const *spec = info->pSpecializationInfo;
1913
1914 if (spec) {
1915 for (auto i = 0u; i < spec->mapEntryCount; i++) {
Jeremy Hayes6c555c32019-09-09 17:14:09 -06001916 if (spec->pMapEntries[i].offset >= spec->dataSize) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001917 skip |= LogError(device, "VUID-VkSpecializationInfo-offset-00773",
1918 "Specialization entry %u (for constant id %u) references memory outside provided specialization "
1919 "data (bytes %u.." PRINTF_SIZE_T_SPECIFIER "; " PRINTF_SIZE_T_SPECIFIER " bytes provided)..",
1920 i, spec->pMapEntries[i].constantID, spec->pMapEntries[i].offset,
1921 spec->pMapEntries[i].offset + spec->dataSize - 1, spec->dataSize);
Jeremy Hayes6c555c32019-09-09 17:14:09 -06001922
1923 continue;
1924 }
Chris Forbes47567b72017-06-09 12:09:45 -07001925 if (spec->pMapEntries[i].offset + spec->pMapEntries[i].size > spec->dataSize) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001926 skip |= LogError(device, "VUID-VkSpecializationInfo-pMapEntries-00774",
1927 "Specialization entry %u (for constant id %u) references memory outside provided specialization "
1928 "data (bytes %u.." PRINTF_SIZE_T_SPECIFIER "; " PRINTF_SIZE_T_SPECIFIER " bytes provided)..",
1929 i, spec->pMapEntries[i].constantID, spec->pMapEntries[i].offset,
1930 spec->pMapEntries[i].offset + spec->pMapEntries[i].size - 1, spec->dataSize);
Chris Forbes47567b72017-06-09 12:09:45 -07001931 }
1932 }
1933 }
1934
1935 return skip;
1936}
1937
Jeff Bolz38b3ce72018-09-19 12:53:38 -05001938// TODO (jbolz): Can this return a const reference?
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06001939static std::set<uint32_t> TypeToDescriptorTypeSet(SHADER_MODULE_STATE const *module, uint32_t type_id, unsigned &descriptor_count) {
Chris Forbes47567b72017-06-09 12:09:45 -07001940 auto type = module->get_def(type_id);
Chris Forbes9f89d752018-03-07 12:57:48 -08001941 bool is_storage_buffer = false;
Chris Forbes47567b72017-06-09 12:09:45 -07001942 descriptor_count = 1;
Jeff Bolze54ae892018-09-08 12:16:29 -05001943 std::set<uint32_t> ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001944
1945 // Strip off any array or ptrs. Where we remove array levels, adjust the descriptor count for each dimension.
Jeff Bolzfdf96072018-04-10 14:32:18 -05001946 while (type.opcode() == spv::OpTypeArray || type.opcode() == spv::OpTypePointer || type.opcode() == spv::OpTypeRuntimeArray) {
1947 if (type.opcode() == spv::OpTypeRuntimeArray) {
1948 descriptor_count = 0;
1949 type = module->get_def(type.word(2));
1950 } else if (type.opcode() == spv::OpTypeArray) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06001951 descriptor_count *= GetConstantValue(module, type.word(3));
Chris Forbes47567b72017-06-09 12:09:45 -07001952 type = module->get_def(type.word(2));
1953 } else {
Chris Forbes9f89d752018-03-07 12:57:48 -08001954 if (type.word(2) == spv::StorageClassStorageBuffer) {
1955 is_storage_buffer = true;
1956 }
Chris Forbes47567b72017-06-09 12:09:45 -07001957 type = module->get_def(type.word(3));
1958 }
1959 }
1960
1961 switch (type.opcode()) {
1962 case spv::OpTypeStruct: {
1963 for (auto insn : *module) {
1964 if (insn.opcode() == spv::OpDecorate && insn.word(1) == type.word(1)) {
1965 if (insn.word(2) == spv::DecorationBlock) {
Chris Forbes9f89d752018-03-07 12:57:48 -08001966 if (is_storage_buffer) {
Jeff Bolze54ae892018-09-08 12:16:29 -05001967 ret.insert(VK_DESCRIPTOR_TYPE_STORAGE_BUFFER);
1968 ret.insert(VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC);
1969 return ret;
Chris Forbes9f89d752018-03-07 12:57:48 -08001970 } else {
Jeff Bolze54ae892018-09-08 12:16:29 -05001971 ret.insert(VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER);
1972 ret.insert(VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC);
1973 ret.insert(VK_DESCRIPTOR_TYPE_INLINE_UNIFORM_BLOCK_EXT);
1974 return ret;
Chris Forbes9f89d752018-03-07 12:57:48 -08001975 }
Chris Forbes47567b72017-06-09 12:09:45 -07001976 } else if (insn.word(2) == spv::DecorationBufferBlock) {
Jeff Bolze54ae892018-09-08 12:16:29 -05001977 ret.insert(VK_DESCRIPTOR_TYPE_STORAGE_BUFFER);
1978 ret.insert(VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC);
1979 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001980 }
1981 }
1982 }
1983
1984 // Invalid
Jeff Bolze54ae892018-09-08 12:16:29 -05001985 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001986 }
1987
1988 case spv::OpTypeSampler:
Jeff Bolze54ae892018-09-08 12:16:29 -05001989 ret.insert(VK_DESCRIPTOR_TYPE_SAMPLER);
1990 ret.insert(VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER);
1991 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001992
Chris Forbes73c00bf2018-06-22 16:28:06 -07001993 case spv::OpTypeSampledImage: {
1994 // Slight relaxation for some GLSL historical madness: samplerBuffer doesn't really have a sampler, and a texel
1995 // buffer descriptor doesn't really provide one. Allow this slight mismatch.
1996 auto image_type = module->get_def(type.word(2));
1997 auto dim = image_type.word(3);
1998 auto sampled = image_type.word(7);
1999 if (dim == spv::DimBuffer && sampled == 1) {
Jeff Bolze54ae892018-09-08 12:16:29 -05002000 ret.insert(VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER);
2001 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07002002 }
Chris Forbes73c00bf2018-06-22 16:28:06 -07002003 }
Jeff Bolze54ae892018-09-08 12:16:29 -05002004 ret.insert(VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER);
2005 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07002006
2007 case spv::OpTypeImage: {
2008 // Many descriptor types backing image types-- depends on dimension and whether the image will be used with a sampler.
2009 // SPIRV for Vulkan requires that sampled be 1 or 2 -- leaving the decision to runtime is unacceptable.
2010 auto dim = type.word(3);
2011 auto sampled = type.word(7);
2012
2013 if (dim == spv::DimSubpassData) {
Jeff Bolze54ae892018-09-08 12:16:29 -05002014 ret.insert(VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT);
2015 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07002016 } else if (dim == spv::DimBuffer) {
2017 if (sampled == 1) {
Jeff Bolze54ae892018-09-08 12:16:29 -05002018 ret.insert(VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER);
2019 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07002020 } else {
Jeff Bolze54ae892018-09-08 12:16:29 -05002021 ret.insert(VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER);
2022 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07002023 }
2024 } else if (sampled == 1) {
Jeff Bolze54ae892018-09-08 12:16:29 -05002025 ret.insert(VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE);
2026 ret.insert(VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER);
2027 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07002028 } else {
Jeff Bolze54ae892018-09-08 12:16:29 -05002029 ret.insert(VK_DESCRIPTOR_TYPE_STORAGE_IMAGE);
2030 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07002031 }
2032 }
Shannon McPherson0fa28232018-11-01 11:59:02 -06002033 case spv::OpTypeAccelerationStructureNV:
Eric Werness30127fd2018-10-31 21:01:03 -07002034 ret.insert(VK_DESCRIPTOR_TYPE_ACCELERATION_STRUCTURE_NV);
Jeff Bolz105d6492018-09-29 15:46:44 -05002035 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07002036
2037 // We shouldn't really see any other junk types -- but if we do, they're a mismatch.
2038 default:
Jeff Bolze54ae892018-09-08 12:16:29 -05002039 return ret; // Matches nothing
Chris Forbes47567b72017-06-09 12:09:45 -07002040 }
2041}
2042
Jeff Bolze54ae892018-09-08 12:16:29 -05002043static std::string string_descriptorTypes(const std::set<uint32_t> &descriptor_types) {
Chris Forbes73c00bf2018-06-22 16:28:06 -07002044 std::stringstream ss;
Jeff Bolze54ae892018-09-08 12:16:29 -05002045 for (auto it = descriptor_types.begin(); it != descriptor_types.end(); ++it) {
2046 if (ss.tellp()) ss << ", ";
2047 ss << string_VkDescriptorType(VkDescriptorType(*it));
Chris Forbes73c00bf2018-06-22 16:28:06 -07002048 }
2049 return ss.str();
2050}
2051
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07002052bool CoreChecks::RequirePropertyFlag(VkBool32 check, char const *flag, char const *structure) const {
Jeff Bolzee743412019-06-20 22:24:32 -05002053 if (!check) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002054 if (LogError(device, kVUID_Core_Shader_ExceedDeviceLimit,
2055 "Shader requires flag %s set in %s but it is not set on the device", flag, structure)) {
Jeff Bolzee743412019-06-20 22:24:32 -05002056 return true;
2057 }
2058 }
2059
2060 return false;
2061}
2062
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07002063bool CoreChecks::RequireFeature(VkBool32 feature, char const *feature_name) const {
Chris Forbes47567b72017-06-09 12:09:45 -07002064 if (!feature) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002065 if (LogError(device, kVUID_Core_Shader_FeatureNotEnabled, "Shader requires %s but is not enabled on the device",
2066 feature_name)) {
Chris Forbes47567b72017-06-09 12:09:45 -07002067 return true;
2068 }
2069 }
2070
2071 return false;
2072}
2073
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07002074bool CoreChecks::RequireExtension(bool extension, char const *extension_name) const {
Chris Forbes47567b72017-06-09 12:09:45 -07002075 if (!extension) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002076 if (LogError(device, kVUID_Core_Shader_FeatureNotEnabled, "Shader requires extension %s but is not enabled on the device",
2077 extension_name)) {
Chris Forbes47567b72017-06-09 12:09:45 -07002078 return true;
2079 }
2080 }
2081
2082 return false;
2083}
2084
John Zulaufac4c6e12019-07-01 16:05:58 -06002085bool CoreChecks::ValidateShaderCapabilities(SHADER_MODULE_STATE const *src, VkShaderStageFlagBits stage) const {
Chris Forbes47567b72017-06-09 12:09:45 -07002086 bool skip = false;
2087
Mike Schuchardt8ed5ea02018-07-20 18:24:17 -06002088 struct FeaturePointer {
2089 // Callable object to test if this feature is enabled in the given aggregate feature struct
2090 const std::function<VkBool32(const DeviceFeatures &)> IsEnabled;
2091
2092 // Test if feature pointer is populated
2093 explicit operator bool() const { return static_cast<bool>(IsEnabled); }
2094
2095 // Default and nullptr constructor to create an empty FeaturePointer
2096 FeaturePointer() : IsEnabled(nullptr) {}
2097 FeaturePointer(std::nullptr_t ptr) : IsEnabled(nullptr) {}
2098
2099 // Constructors to populate FeaturePointer based on given pointer to member
2100 FeaturePointer(VkBool32 VkPhysicalDeviceFeatures::*ptr)
2101 : IsEnabled([=](const DeviceFeatures &features) { return features.core.*ptr; }) {}
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002102 FeaturePointer(VkBool32 VkPhysicalDeviceVulkan11Features::*ptr)
2103 : IsEnabled([=](const DeviceFeatures &features) { return features.core11.*ptr; }) {}
2104 FeaturePointer(VkBool32 VkPhysicalDeviceVulkan12Features::*ptr)
2105 : IsEnabled([=](const DeviceFeatures &features) { return features.core12.*ptr; }) {}
Brett Lawsonbebfb6f2018-10-23 16:58:50 -07002106 FeaturePointer(VkBool32 VkPhysicalDeviceTransformFeedbackFeaturesEXT::*ptr)
2107 : IsEnabled([=](const DeviceFeatures &features) { return features.transform_feedback_features.*ptr; }) {}
Jeff Bolze4356752019-03-07 11:23:46 -06002108 FeaturePointer(VkBool32 VkPhysicalDeviceCooperativeMatrixFeaturesNV::*ptr)
2109 : IsEnabled([=](const DeviceFeatures &features) { return features.cooperative_matrix_features.*ptr; }) {}
Jason Macnakc5a621d2019-06-10 12:42:50 -07002110 FeaturePointer(VkBool32 VkPhysicalDeviceComputeShaderDerivativesFeaturesNV::*ptr)
2111 : IsEnabled([=](const DeviceFeatures &features) { return features.compute_shader_derivatives_features.*ptr; }) {}
Jason Macnak325e8b52019-06-10 13:33:10 -07002112 FeaturePointer(VkBool32 VkPhysicalDeviceFragmentShaderBarycentricFeaturesNV::*ptr)
2113 : IsEnabled([=](const DeviceFeatures &features) { return features.fragment_shader_barycentric_features.*ptr; }) {}
Jason Macnakd7fddf82019-06-13 09:52:49 -07002114 FeaturePointer(VkBool32 VkPhysicalDeviceShaderImageFootprintFeaturesNV::*ptr)
2115 : IsEnabled([=](const DeviceFeatures &features) { return features.shader_image_footprint_features.*ptr; }) {}
Jeff Bolz38f6cb52019-06-30 16:26:44 -05002116 FeaturePointer(VkBool32 VkPhysicalDeviceFragmentShaderInterlockFeaturesEXT::*ptr)
2117 : IsEnabled([=](const DeviceFeatures &features) { return features.fragment_shader_interlock_features.*ptr; }) {}
Jeff Bolza38fd3b2019-07-21 11:42:11 -05002118 FeaturePointer(VkBool32 VkPhysicalDeviceShaderDemoteToHelperInvocationFeaturesEXT::*ptr)
2119 : IsEnabled([=](const DeviceFeatures &features) { return features.demote_to_helper_invocation_features.*ptr; }) {}
Jeff Bolz443c2ca2020-03-19 12:11:51 -05002120 FeaturePointer(VkBool32 VkPhysicalDeviceRayTracingFeaturesKHR::*ptr)
2121 : IsEnabled([=](const DeviceFeatures &features) { return features.ray_tracing_features.*ptr; }) {}
Mike Schuchardt8ed5ea02018-07-20 18:24:17 -06002122 };
2123
Chris Forbes47567b72017-06-09 12:09:45 -07002124 struct CapabilityInfo {
2125 char const *name;
Mike Schuchardt8ed5ea02018-07-20 18:24:17 -06002126 FeaturePointer feature;
Tony-LunarG2ec96bb2019-11-26 13:43:02 -07002127 ExtEnabled DeviceExtensions::*extension;
Chris Forbes47567b72017-06-09 12:09:45 -07002128 };
2129
Chris Forbes47567b72017-06-09 12:09:45 -07002130 // clang-format off
Dave Houltoneb10ea82017-12-22 12:21:50 -07002131 static const std::unordered_multimap<uint32_t, CapabilityInfo> capabilities = {
Chris Forbes47567b72017-06-09 12:09:45 -07002132 // Capabilities always supported by a Vulkan 1.0 implementation -- no
2133 // feature bits.
2134 {spv::CapabilityMatrix, {nullptr}},
2135 {spv::CapabilityShader, {nullptr}},
2136 {spv::CapabilityInputAttachment, {nullptr}},
2137 {spv::CapabilitySampled1D, {nullptr}},
2138 {spv::CapabilityImage1D, {nullptr}},
2139 {spv::CapabilitySampledBuffer, {nullptr}},
Toni Merilehtib13a4a22019-05-21 12:58:44 +03002140 {spv::CapabilityStorageImageExtendedFormats, {nullptr}},
Chris Forbes47567b72017-06-09 12:09:45 -07002141 {spv::CapabilityImageQuery, {nullptr}},
2142 {spv::CapabilityDerivativeControl, {nullptr}},
2143
2144 // Capabilities that are optionally supported, but require a feature to
2145 // be enabled on the device
Mike Schuchardt8ed5ea02018-07-20 18:24:17 -06002146 {spv::CapabilityGeometry, {"VkPhysicalDeviceFeatures::geometryShader", &VkPhysicalDeviceFeatures::geometryShader}},
2147 {spv::CapabilityTessellation, {"VkPhysicalDeviceFeatures::tessellationShader", &VkPhysicalDeviceFeatures::tessellationShader}},
2148 {spv::CapabilityFloat64, {"VkPhysicalDeviceFeatures::shaderFloat64", &VkPhysicalDeviceFeatures::shaderFloat64}},
2149 {spv::CapabilityInt64, {"VkPhysicalDeviceFeatures::shaderInt64", &VkPhysicalDeviceFeatures::shaderInt64}},
2150 {spv::CapabilityTessellationPointSize, {"VkPhysicalDeviceFeatures::shaderTessellationAndGeometryPointSize", &VkPhysicalDeviceFeatures::shaderTessellationAndGeometryPointSize}},
2151 {spv::CapabilityGeometryPointSize, {"VkPhysicalDeviceFeatures::shaderTessellationAndGeometryPointSize", &VkPhysicalDeviceFeatures::shaderTessellationAndGeometryPointSize}},
2152 {spv::CapabilityImageGatherExtended, {"VkPhysicalDeviceFeatures::shaderImageGatherExtended", &VkPhysicalDeviceFeatures::shaderImageGatherExtended}},
2153 {spv::CapabilityStorageImageMultisample, {"VkPhysicalDeviceFeatures::shaderStorageImageMultisample", &VkPhysicalDeviceFeatures::shaderStorageImageMultisample}},
2154 {spv::CapabilityUniformBufferArrayDynamicIndexing, {"VkPhysicalDeviceFeatures::shaderUniformBufferArrayDynamicIndexing", &VkPhysicalDeviceFeatures::shaderUniformBufferArrayDynamicIndexing}},
2155 {spv::CapabilitySampledImageArrayDynamicIndexing, {"VkPhysicalDeviceFeatures::shaderSampledImageArrayDynamicIndexing", &VkPhysicalDeviceFeatures::shaderSampledImageArrayDynamicIndexing}},
2156 {spv::CapabilityStorageBufferArrayDynamicIndexing, {"VkPhysicalDeviceFeatures::shaderStorageBufferArrayDynamicIndexing", &VkPhysicalDeviceFeatures::shaderStorageBufferArrayDynamicIndexing}},
2157 {spv::CapabilityStorageImageArrayDynamicIndexing, {"VkPhysicalDeviceFeatures::shaderStorageImageArrayDynamicIndexing", &VkPhysicalDeviceFeatures::shaderStorageBufferArrayDynamicIndexing}},
2158 {spv::CapabilityClipDistance, {"VkPhysicalDeviceFeatures::shaderClipDistance", &VkPhysicalDeviceFeatures::shaderClipDistance}},
2159 {spv::CapabilityCullDistance, {"VkPhysicalDeviceFeatures::shaderCullDistance", &VkPhysicalDeviceFeatures::shaderCullDistance}},
2160 {spv::CapabilityImageCubeArray, {"VkPhysicalDeviceFeatures::imageCubeArray", &VkPhysicalDeviceFeatures::imageCubeArray}},
2161 {spv::CapabilitySampleRateShading, {"VkPhysicalDeviceFeatures::sampleRateShading", &VkPhysicalDeviceFeatures::sampleRateShading}},
2162 {spv::CapabilitySparseResidency, {"VkPhysicalDeviceFeatures::shaderResourceResidency", &VkPhysicalDeviceFeatures::shaderResourceResidency}},
2163 {spv::CapabilityMinLod, {"VkPhysicalDeviceFeatures::shaderResourceMinLod", &VkPhysicalDeviceFeatures::shaderResourceMinLod}},
2164 {spv::CapabilitySampledCubeArray, {"VkPhysicalDeviceFeatures::imageCubeArray", &VkPhysicalDeviceFeatures::imageCubeArray}},
2165 {spv::CapabilityImageMSArray, {"VkPhysicalDeviceFeatures::shaderStorageImageMultisample", &VkPhysicalDeviceFeatures::shaderStorageImageMultisample}},
Mike Schuchardt8ed5ea02018-07-20 18:24:17 -06002166 {spv::CapabilityInterpolationFunction, {"VkPhysicalDeviceFeatures::sampleRateShading", &VkPhysicalDeviceFeatures::sampleRateShading}},
2167 {spv::CapabilityStorageImageReadWithoutFormat, {"VkPhysicalDeviceFeatures::shaderStorageImageReadWithoutFormat", &VkPhysicalDeviceFeatures::shaderStorageImageReadWithoutFormat}},
2168 {spv::CapabilityStorageImageWriteWithoutFormat, {"VkPhysicalDeviceFeatures::shaderStorageImageWriteWithoutFormat", &VkPhysicalDeviceFeatures::shaderStorageImageWriteWithoutFormat}},
2169 {spv::CapabilityMultiViewport, {"VkPhysicalDeviceFeatures::multiViewport", &VkPhysicalDeviceFeatures::multiViewport}},
Jeff Bolzfdf96072018-04-10 14:32:18 -05002170
Mike Schuchardt8ed5ea02018-07-20 18:24:17 -06002171 {spv::CapabilityShaderNonUniformEXT, {VK_EXT_DESCRIPTOR_INDEXING_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_ext_descriptor_indexing}},
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002172 {spv::CapabilityRuntimeDescriptorArrayEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::runtimeDescriptorArray", &VkPhysicalDeviceVulkan12Features::runtimeDescriptorArray}},
2173 {spv::CapabilityInputAttachmentArrayDynamicIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderInputAttachmentArrayDynamicIndexing", &VkPhysicalDeviceVulkan12Features::shaderInputAttachmentArrayDynamicIndexing}},
2174 {spv::CapabilityUniformTexelBufferArrayDynamicIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderUniformTexelBufferArrayDynamicIndexing", &VkPhysicalDeviceVulkan12Features::shaderUniformTexelBufferArrayDynamicIndexing}},
2175 {spv::CapabilityStorageTexelBufferArrayDynamicIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderStorageTexelBufferArrayDynamicIndexing", &VkPhysicalDeviceVulkan12Features::shaderStorageTexelBufferArrayDynamicIndexing}},
2176 {spv::CapabilityUniformBufferArrayNonUniformIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderUniformBufferArrayNonUniformIndexing", &VkPhysicalDeviceVulkan12Features::shaderUniformBufferArrayNonUniformIndexing}},
2177 {spv::CapabilitySampledImageArrayNonUniformIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderSampledImageArrayNonUniformIndexing", &VkPhysicalDeviceVulkan12Features::shaderSampledImageArrayNonUniformIndexing}},
2178 {spv::CapabilityStorageBufferArrayNonUniformIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderStorageBufferArrayNonUniformIndexing", &VkPhysicalDeviceVulkan12Features::shaderStorageBufferArrayNonUniformIndexing}},
2179 {spv::CapabilityStorageImageArrayNonUniformIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderStorageImageArrayNonUniformIndexing", &VkPhysicalDeviceVulkan12Features::shaderStorageImageArrayNonUniformIndexing}},
2180 {spv::CapabilityInputAttachmentArrayNonUniformIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderInputAttachmentArrayNonUniformIndexing", &VkPhysicalDeviceVulkan12Features::shaderInputAttachmentArrayNonUniformIndexing}},
2181 {spv::CapabilityUniformTexelBufferArrayNonUniformIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderUniformTexelBufferArrayNonUniformIndexing", &VkPhysicalDeviceVulkan12Features::shaderUniformTexelBufferArrayNonUniformIndexing}},
2182 {spv::CapabilityStorageTexelBufferArrayNonUniformIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderStorageTexelBufferArrayNonUniformIndexing", &VkPhysicalDeviceVulkan12Features::shaderStorageTexelBufferArrayNonUniformIndexing}},
Chris Forbes47567b72017-06-09 12:09:45 -07002183
2184 // Capabilities that require an extension
Mike Schuchardt8ed5ea02018-07-20 18:24:17 -06002185 {spv::CapabilityDrawParameters, {VK_KHR_SHADER_DRAW_PARAMETERS_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_khr_shader_draw_parameters}},
2186 {spv::CapabilityGeometryShaderPassthroughNV, {VK_NV_GEOMETRY_SHADER_PASSTHROUGH_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_nv_geometry_shader_passthrough}},
2187 {spv::CapabilitySampleMaskOverrideCoverageNV, {VK_NV_SAMPLE_MASK_OVERRIDE_COVERAGE_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_nv_sample_mask_override_coverage}},
2188 {spv::CapabilityShaderViewportIndexLayerEXT, {VK_EXT_SHADER_VIEWPORT_INDEX_LAYER_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_ext_shader_viewport_index_layer}},
2189 {spv::CapabilityShaderViewportIndexLayerNV, {VK_NV_VIEWPORT_ARRAY2_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_nv_viewport_array2}},
2190 {spv::CapabilityShaderViewportMaskNV, {VK_NV_VIEWPORT_ARRAY2_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_nv_viewport_array2}},
2191 {spv::CapabilitySubgroupBallotKHR, {VK_EXT_SHADER_SUBGROUP_BALLOT_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_ext_shader_subgroup_ballot }},
2192 {spv::CapabilitySubgroupVoteKHR, {VK_EXT_SHADER_SUBGROUP_VOTE_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_ext_shader_subgroup_vote }},
Jason Macnakb7d091c2019-06-10 11:13:11 -07002193 {spv::CapabilityGroupNonUniformPartitionedNV, {VK_NV_SHADER_SUBGROUP_PARTITIONED_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_nv_shader_subgroup_partitioned}},
aqnuep7033c702018-09-11 18:03:29 +02002194 {spv::CapabilityInt64Atomics, {VK_KHR_SHADER_ATOMIC_INT64_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_khr_shader_atomic_int64 }},
amhaganfa0b34d2019-10-15 16:03:53 -04002195 {spv::CapabilityShaderClockKHR, {VK_KHR_SHADER_CLOCK_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_khr_shader_clock }},
Alexander Galazin3bd8e342018-06-14 15:49:07 +02002196
Jason Macnakc5a621d2019-06-10 12:42:50 -07002197 {spv::CapabilityComputeDerivativeGroupQuadsNV, {"VkPhysicalDeviceComputeShaderDerivativesFeaturesNV::computeDerivativeGroupQuads", &VkPhysicalDeviceComputeShaderDerivativesFeaturesNV::computeDerivativeGroupQuads, &DeviceExtensions::vk_nv_compute_shader_derivatives}},
2198 {spv::CapabilityComputeDerivativeGroupLinearNV, {"VkPhysicalDeviceComputeShaderDerivativesFeaturesNV::computeDerivativeGroupLinear", &VkPhysicalDeviceComputeShaderDerivativesFeaturesNV::computeDerivativeGroupLinear, &DeviceExtensions::vk_nv_compute_shader_derivatives}},
Jason Macnakf7019582019-06-13 10:07:26 -07002199 {spv::CapabilityFragmentBarycentricNV, {"VkPhysicalDeviceFragmentShaderBarycentricFeaturesNV::fragmentShaderBarycentric", &VkPhysicalDeviceFragmentShaderBarycentricFeaturesNV::fragmentShaderBarycentric, &DeviceExtensions::vk_nv_fragment_shader_barycentric}},
Jason Macnakc5a621d2019-06-10 12:42:50 -07002200
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002201 {spv::CapabilityStorageBuffer8BitAccess, {"VkPhysicalDevice8BitStorageFeaturesKHR::storageBuffer8BitAccess", &VkPhysicalDeviceVulkan12Features::storageBuffer8BitAccess, &DeviceExtensions::vk_khr_8bit_storage}},
2202 {spv::CapabilityUniformAndStorageBuffer8BitAccess, {"VkPhysicalDevice8BitStorageFeaturesKHR::uniformAndStorageBuffer8BitAccess", &VkPhysicalDeviceVulkan12Features::uniformAndStorageBuffer8BitAccess, &DeviceExtensions::vk_khr_8bit_storage}},
2203 {spv::CapabilityStoragePushConstant8, {"VkPhysicalDevice8BitStorageFeaturesKHR::storagePushConstant8", &VkPhysicalDeviceVulkan12Features::storagePushConstant8, &DeviceExtensions::vk_khr_8bit_storage}},
Brett Lawsonbebfb6f2018-10-23 16:58:50 -07002204
Jason Macnakf7019582019-06-13 10:07:26 -07002205 {spv::CapabilityTransformFeedback, { "VkPhysicalDeviceTransformFeedbackFeaturesEXT::transformFeedback", &VkPhysicalDeviceTransformFeedbackFeaturesEXT::transformFeedback, &DeviceExtensions::vk_ext_transform_feedback}},
2206 {spv::CapabilityGeometryStreams, { "VkPhysicalDeviceTransformFeedbackFeaturesEXT::geometryStreams", &VkPhysicalDeviceTransformFeedbackFeaturesEXT::geometryStreams, &DeviceExtensions::vk_ext_transform_feedback}},
Jose-Emilio Munoz-Lopez1109b452018-08-21 09:44:07 +01002207
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002208 {spv::CapabilityFloat16, {"VkPhysicalDeviceFloat16Int8FeaturesKHR::shaderFloat16", &VkPhysicalDeviceVulkan12Features::shaderFloat16, &DeviceExtensions::vk_khr_shader_float16_int8}},
2209 {spv::CapabilityInt8, {"VkPhysicalDeviceFloat16Int8FeaturesKHR::shaderInt8", &VkPhysicalDeviceVulkan12Features::shaderInt8, &DeviceExtensions::vk_khr_shader_float16_int8}},
Jeff Bolze4356752019-03-07 11:23:46 -06002210
Jason Macnakd7fddf82019-06-13 09:52:49 -07002211 {spv::CapabilityImageFootprintNV, {"VkPhysicalDeviceShaderImageFootprintFeaturesNV::imageFootprint", &VkPhysicalDeviceShaderImageFootprintFeaturesNV::imageFootprint, &DeviceExtensions::vk_nv_shader_image_footprint}},
2212
Jeff Bolze4356752019-03-07 11:23:46 -06002213 {spv::CapabilityCooperativeMatrixNV, {"VkPhysicalDeviceCooperativeMatrixFeaturesNV::cooperativeMatrix", &VkPhysicalDeviceCooperativeMatrixFeaturesNV::cooperativeMatrix, &DeviceExtensions::vk_nv_cooperative_matrix}},
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002214
Graeme Leese41e6b842019-08-02 10:49:14 +01002215 {spv::CapabilitySignedZeroInfNanPreserve, {"VkPhysicalDeviceFloatControlsPropertiesKHR::shaderSignedZeroInfNanPreserve", nullptr, &DeviceExtensions::vk_khr_shader_float_controls}},
2216 {spv::CapabilityDenormPreserve, {"VkPhysicalDeviceFloatControlsPropertiesKHR::shaderDenormPreserve", nullptr, &DeviceExtensions::vk_khr_shader_float_controls}},
2217 {spv::CapabilityDenormFlushToZero, {"VkPhysicalDeviceFloatControlsPropertiesKHR::shaderDenormFlushToZero", nullptr, &DeviceExtensions::vk_khr_shader_float_controls}},
2218 {spv::CapabilityRoundingModeRTE, {"VkPhysicalDeviceFloatControlsPropertiesKHR::shaderRoundingModeRTE", nullptr, &DeviceExtensions::vk_khr_shader_float_controls}},
2219 {spv::CapabilityRoundingModeRTZ, {"VkPhysicalDeviceFloatControlsPropertiesKHR::shaderRoundingModeRTZ", nullptr, &DeviceExtensions::vk_khr_shader_float_controls}},
Jeff Bolz38f6cb52019-06-30 16:26:44 -05002220
2221 {spv::CapabilityFragmentShaderSampleInterlockEXT, {"VkPhysicalDeviceFragmentShaderInterlockFeaturesEXT::fragmentShaderSampleInterlock", &VkPhysicalDeviceFragmentShaderInterlockFeaturesEXT::fragmentShaderSampleInterlock, &DeviceExtensions::vk_ext_fragment_shader_interlock}},
2222 {spv::CapabilityFragmentShaderPixelInterlockEXT, {"VkPhysicalDeviceFragmentShaderInterlockFeaturesEXT::fragmentShaderPixelInterlock", &VkPhysicalDeviceFragmentShaderInterlockFeaturesEXT::fragmentShaderPixelInterlock, &DeviceExtensions::vk_ext_fragment_shader_interlock}},
2223 {spv::CapabilityFragmentShaderShadingRateInterlockEXT, {"VkPhysicalDeviceFragmentShaderInterlockFeaturesEXT::fragmentShaderShadingRateInterlock", &VkPhysicalDeviceFragmentShaderInterlockFeaturesEXT::fragmentShaderShadingRateInterlock, &DeviceExtensions::vk_ext_fragment_shader_interlock}},
Jeff Bolza38fd3b2019-07-21 11:42:11 -05002224 {spv::CapabilityDemoteToHelperInvocationEXT, {"VkPhysicalDeviceShaderDemoteToHelperInvocationFeaturesEXT::shaderDemoteToHelperInvocation", &VkPhysicalDeviceShaderDemoteToHelperInvocationFeaturesEXT::shaderDemoteToHelperInvocation, &DeviceExtensions::vk_ext_shader_demote_to_helper_invocation}},
Jeff Bolz4563f2a2019-12-10 13:30:30 -06002225
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002226 {spv::CapabilityPhysicalStorageBufferAddresses, {"VkPhysicalDeviceBufferDeviceAddressFeatures::bufferDeviceAddress", &VkPhysicalDeviceVulkan12Features::bufferDeviceAddress, &DeviceExtensions::vk_ext_buffer_device_address}},
Jeff Bolz4563f2a2019-12-10 13:30:30 -06002227 // Should be non-EXT token, but Android SPIRV-Headers are out of date, and the token value is the same anyway
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002228 {spv::CapabilityPhysicalStorageBufferAddressesEXT, {"VkPhysicalDeviceBufferDeviceAddressFeaturesEXT::bufferDeviceAddress", &VkPhysicalDeviceVulkan12Features::bufferDeviceAddress, &DeviceExtensions::vk_khr_buffer_device_address}},
Jeff Bolz443c2ca2020-03-19 12:11:51 -05002229
2230 {spv::CapabilityRayTracingProvisionalKHR, {"VkPhysicalDeviceRayTracingFeaturesKHR::rayTracing", &VkPhysicalDeviceRayTracingFeaturesKHR::rayTracing, &DeviceExtensions::vk_khr_ray_tracing}},
2231 {spv::CapabilityRayQueryProvisionalKHR, {"VkPhysicalDeviceRayTracingFeaturesKHR::rayQuery", &VkPhysicalDeviceRayTracingFeaturesKHR::rayQuery, &DeviceExtensions::vk_khr_ray_tracing}},
2232 {spv::CapabilityRayTraversalPrimitiveCullingProvisionalKHR, {"VkPhysicalDeviceRayTracingFeaturesKHR::rayTracingPrimitiveCulling", &VkPhysicalDeviceRayTracingFeaturesKHR::rayTracingPrimitiveCulling, &DeviceExtensions::vk_khr_ray_tracing}},
Chris Forbes47567b72017-06-09 12:09:45 -07002233 };
2234 // clang-format on
2235
2236 for (auto insn : *src) {
2237 if (insn.opcode() == spv::OpCapability) {
Dave Houltoneb10ea82017-12-22 12:21:50 -07002238 size_t n = capabilities.count(insn.word(1));
2239 if (1 == n) { // key occurs exactly once
2240 auto it = capabilities.find(insn.word(1));
2241 if (it != capabilities.end()) {
2242 if (it->second.feature) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07002243 skip |= RequireFeature(it->second.feature.IsEnabled(enabled_features), it->second.name);
Dave Houltoneb10ea82017-12-22 12:21:50 -07002244 }
2245 if (it->second.extension) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07002246 skip |= RequireExtension(IsExtEnabled((device_extensions.*(it->second.extension))), it->second.name);
Dave Houltoneb10ea82017-12-22 12:21:50 -07002247 }
Chris Forbes47567b72017-06-09 12:09:45 -07002248 }
Dave Houltoneb10ea82017-12-22 12:21:50 -07002249 } else if (1 < n) { // key occurs multiple times, at least one must be enabled
2250 bool needs_feature = false, has_feature = false;
2251 bool needs_ext = false, has_ext = false;
2252 std::string feature_names = "(one of) [ ";
2253 std::string extension_names = feature_names;
2254 auto caps = capabilities.equal_range(insn.word(1));
2255 for (auto it = caps.first; it != caps.second; ++it) {
2256 if (it->second.feature) {
2257 needs_feature = true;
Mark Lobodzinskid7b03cc2019-04-19 14:23:10 -06002258 has_feature = has_feature || it->second.feature.IsEnabled(enabled_features);
Dave Houltoneb10ea82017-12-22 12:21:50 -07002259 feature_names += it->second.name;
2260 feature_names += " ";
2261 }
2262 if (it->second.extension) {
2263 needs_ext = true;
Mark Lobodzinskif45e45f2019-04-19 14:15:39 -06002264 has_ext = has_ext || device_extensions.*(it->second.extension);
Dave Houltoneb10ea82017-12-22 12:21:50 -07002265 extension_names += it->second.name;
2266 extension_names += " ";
2267 }
2268 }
2269 if (needs_feature) {
2270 feature_names += "]";
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07002271 skip |= RequireFeature(has_feature, feature_names.c_str());
Dave Houltoneb10ea82017-12-22 12:21:50 -07002272 }
2273 if (needs_ext) {
2274 extension_names += "]";
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07002275 skip |= RequireExtension(has_ext, extension_names.c_str());
Chris Forbes47567b72017-06-09 12:09:45 -07002276 }
Graeme Leesec82dbe02019-08-02 10:44:21 +01002277 }
2278
2279 { // Do group non-uniform checks
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002280 const VkSubgroupFeatureFlags supportedOperations = phys_dev_props_core11.subgroupSupportedOperations;
2281 const VkSubgroupFeatureFlags supportedStages = phys_dev_props_core11.subgroupSupportedStages;
Jeff Bolzee743412019-06-20 22:24:32 -05002282
2283 switch (insn.word(1)) {
2284 default:
2285 break;
2286 case spv::CapabilityGroupNonUniform:
2287 case spv::CapabilityGroupNonUniformVote:
2288 case spv::CapabilityGroupNonUniformArithmetic:
2289 case spv::CapabilityGroupNonUniformBallot:
2290 case spv::CapabilityGroupNonUniformShuffle:
2291 case spv::CapabilityGroupNonUniformShuffleRelative:
2292 case spv::CapabilityGroupNonUniformClustered:
2293 case spv::CapabilityGroupNonUniformQuad:
2294 case spv::CapabilityGroupNonUniformPartitionedNV:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07002295 RequirePropertyFlag(supportedStages & stage, string_VkShaderStageFlagBits(stage),
Jeff Bolzee743412019-06-20 22:24:32 -05002296 "VkPhysicalDeviceSubgroupProperties::supportedStages");
2297 break;
2298 }
2299
2300 switch (insn.word(1)) {
2301 default:
2302 break;
2303 case spv::CapabilityGroupNonUniform:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07002304 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_BASIC_BIT, "VK_SUBGROUP_FEATURE_BASIC_BIT",
Jeff Bolzee743412019-06-20 22:24:32 -05002305 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
2306 break;
2307 case spv::CapabilityGroupNonUniformVote:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07002308 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_VOTE_BIT, "VK_SUBGROUP_FEATURE_VOTE_BIT",
Jeff Bolzee743412019-06-20 22:24:32 -05002309 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
2310 break;
2311 case spv::CapabilityGroupNonUniformArithmetic:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07002312 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_ARITHMETIC_BIT,
Jeff Bolzee743412019-06-20 22:24:32 -05002313 "VK_SUBGROUP_FEATURE_ARITHMETIC_BIT",
2314 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
2315 break;
2316 case spv::CapabilityGroupNonUniformBallot:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07002317 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_BALLOT_BIT, "VK_SUBGROUP_FEATURE_BALLOT_BIT",
Jeff Bolzee743412019-06-20 22:24:32 -05002318 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
2319 break;
2320 case spv::CapabilityGroupNonUniformShuffle:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07002321 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_SHUFFLE_BIT,
Jeff Bolzee743412019-06-20 22:24:32 -05002322 "VK_SUBGROUP_FEATURE_SHUFFLE_BIT",
2323 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
2324 break;
2325 case spv::CapabilityGroupNonUniformShuffleRelative:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07002326 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_SHUFFLE_RELATIVE_BIT,
Jeff Bolzee743412019-06-20 22:24:32 -05002327 "VK_SUBGROUP_FEATURE_SHUFFLE_RELATIVE_BIT",
2328 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
2329 break;
2330 case spv::CapabilityGroupNonUniformClustered:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07002331 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_CLUSTERED_BIT,
Jeff Bolzee743412019-06-20 22:24:32 -05002332 "VK_SUBGROUP_FEATURE_CLUSTERED_BIT",
2333 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
2334 break;
2335 case spv::CapabilityGroupNonUniformQuad:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07002336 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_QUAD_BIT, "VK_SUBGROUP_FEATURE_QUAD_BIT",
Jeff Bolzee743412019-06-20 22:24:32 -05002337 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
2338 break;
2339 case spv::CapabilityGroupNonUniformPartitionedNV:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07002340 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_PARTITIONED_BIT_NV,
Jeff Bolzee743412019-06-20 22:24:32 -05002341 "VK_SUBGROUP_FEATURE_PARTITIONED_BIT_NV",
2342 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
2343 break;
2344 }
Chris Forbes47567b72017-06-09 12:09:45 -07002345 }
baldurk4095f932020-02-16 13:24:42 +00002346 } else if (insn.opcode() == spv::OpExtension) {
2347 std::string extension_name = (char const *)&insn.word(1);
2348
2349 if (extension_name == "SPV_KHR_non_semantic_info") {
2350 skip |= RequireExtension(IsExtEnabled(device_extensions.vk_khr_shader_non_semantic_info),
2351 VK_KHR_SHADER_NON_SEMANTIC_INFO_EXTENSION_NAME);
2352 }
Chris Forbes47567b72017-06-09 12:09:45 -07002353 }
2354 }
2355
Jeff Bolzee743412019-06-20 22:24:32 -05002356 return skip;
2357}
2358
locke-lunarg63e4daf2020-08-17 17:53:25 -06002359bool CoreChecks::ValidateShaderStageWritableOrAtomicDescriptor(VkShaderStageFlagBits stage, bool has_writable_descriptor,
2360 bool has_atomic_descriptor) const {
Jeff Bolzee743412019-06-20 22:24:32 -05002361 bool skip = false;
2362
locke-lunarg63e4daf2020-08-17 17:53:25 -06002363 if (has_writable_descriptor || has_atomic_descriptor) {
Chris Forbes349b3132018-03-07 11:38:08 -08002364 switch (stage) {
2365 case VK_SHADER_STAGE_COMPUTE_BIT:
Jeff Bolz148d94e2018-12-13 21:25:56 -06002366 case VK_SHADER_STAGE_RAYGEN_BIT_NV:
2367 case VK_SHADER_STAGE_ANY_HIT_BIT_NV:
2368 case VK_SHADER_STAGE_CLOSEST_HIT_BIT_NV:
2369 case VK_SHADER_STAGE_MISS_BIT_NV:
2370 case VK_SHADER_STAGE_INTERSECTION_BIT_NV:
2371 case VK_SHADER_STAGE_CALLABLE_BIT_NV:
2372 case VK_SHADER_STAGE_TASK_BIT_NV:
2373 case VK_SHADER_STAGE_MESH_BIT_NV:
Chris Forbes349b3132018-03-07 11:38:08 -08002374 /* No feature requirements for writes and atomics from compute
Jeff Bolz148d94e2018-12-13 21:25:56 -06002375 * raytracing, or mesh stages */
Chris Forbes349b3132018-03-07 11:38:08 -08002376 break;
2377 case VK_SHADER_STAGE_FRAGMENT_BIT:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07002378 skip |= RequireFeature(enabled_features.core.fragmentStoresAndAtomics, "fragmentStoresAndAtomics");
Chris Forbes349b3132018-03-07 11:38:08 -08002379 break;
2380 default:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07002381 skip |= RequireFeature(enabled_features.core.vertexPipelineStoresAndAtomics, "vertexPipelineStoresAndAtomics");
Chris Forbes349b3132018-03-07 11:38:08 -08002382 break;
2383 }
2384 }
2385
Chris Forbes47567b72017-06-09 12:09:45 -07002386 return skip;
2387}
2388
Jeff Bolz526f2d52019-09-18 13:18:08 -05002389bool CoreChecks::ValidateShaderStageGroupNonUniform(SHADER_MODULE_STATE const *module, VkShaderStageFlagBits stage) const {
Jeff Bolzee743412019-06-20 22:24:32 -05002390 bool skip = false;
2391
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002392 auto const subgroup_props = phys_dev_props_core11;
Jeff Bolzee743412019-06-20 22:24:32 -05002393
Jeff Bolz526f2d52019-09-18 13:18:08 -05002394 for (auto inst : *module) {
Jeff Bolzee743412019-06-20 22:24:32 -05002395 // Check the quad operations.
2396 switch (inst.opcode()) {
2397 default:
2398 break;
2399 case spv::OpGroupNonUniformQuadBroadcast:
2400 case spv::OpGroupNonUniformQuadSwap:
2401 if ((stage != VK_SHADER_STAGE_FRAGMENT_BIT) && (stage != VK_SHADER_STAGE_COMPUTE_BIT)) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07002402 skip |= RequireFeature(subgroup_props.subgroupQuadOperationsInAllStages,
Jeff Bolzee743412019-06-20 22:24:32 -05002403 "VkPhysicalDeviceSubgroupProperties::quadOperationsInAllStages");
2404 }
2405 break;
2406 }
Jeff Bolz526f2d52019-09-18 13:18:08 -05002407
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002408 if (!enabled_features.core12.shaderSubgroupExtendedTypes) {
Jeff Bolz526f2d52019-09-18 13:18:08 -05002409 switch (inst.opcode()) {
2410 default:
2411 break;
2412 case spv::OpGroupNonUniformAllEqual:
2413 case spv::OpGroupNonUniformBroadcast:
2414 case spv::OpGroupNonUniformBroadcastFirst:
2415 case spv::OpGroupNonUniformShuffle:
2416 case spv::OpGroupNonUniformShuffleXor:
2417 case spv::OpGroupNonUniformShuffleUp:
2418 case spv::OpGroupNonUniformShuffleDown:
2419 case spv::OpGroupNonUniformIAdd:
2420 case spv::OpGroupNonUniformFAdd:
2421 case spv::OpGroupNonUniformIMul:
2422 case spv::OpGroupNonUniformFMul:
2423 case spv::OpGroupNonUniformSMin:
2424 case spv::OpGroupNonUniformUMin:
2425 case spv::OpGroupNonUniformFMin:
2426 case spv::OpGroupNonUniformSMax:
2427 case spv::OpGroupNonUniformUMax:
2428 case spv::OpGroupNonUniformFMax:
2429 case spv::OpGroupNonUniformBitwiseAnd:
2430 case spv::OpGroupNonUniformBitwiseOr:
2431 case spv::OpGroupNonUniformBitwiseXor:
2432 case spv::OpGroupNonUniformLogicalAnd:
2433 case spv::OpGroupNonUniformLogicalOr:
2434 case spv::OpGroupNonUniformLogicalXor:
2435 case spv::OpGroupNonUniformQuadBroadcast:
2436 case spv::OpGroupNonUniformQuadSwap: {
2437 auto type = module->get_def(inst.word(1));
2438
2439 if (type.opcode() == spv::OpTypeVector) {
2440 // Get the element type
2441 type = module->get_def(type.word(2));
2442 }
2443
2444 if (type.opcode() == spv::OpTypeBool) {
2445 break;
2446 }
2447
2448 // Both OpTypeInt and OpTypeFloat the width is in the 2nd word.
2449 const uint32_t width = type.word(2);
2450
2451 if ((type.opcode() == spv::OpTypeFloat && width == 16) ||
2452 (type.opcode() == spv::OpTypeInt && (width == 8 || width == 16 || width == 64))) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07002453 skip |= RequireFeature(enabled_features.core12.shaderSubgroupExtendedTypes,
Tony-LunarGa74d3fe2019-11-22 15:43:20 -07002454 "VkPhysicalDeviceShaderSubgroupExtendedTypesFeatures::shaderSubgroupExtendedTypes");
Jeff Bolz526f2d52019-09-18 13:18:08 -05002455 }
2456 break;
2457 }
2458 }
2459 }
Jeff Bolzee743412019-06-20 22:24:32 -05002460 }
2461
2462 return skip;
2463}
2464
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06002465bool CoreChecks::ValidateShaderStageInputOutputLimits(SHADER_MODULE_STATE const *src, VkPipelineShaderStageCreateInfo const *pStage,
John Zulaufac4c6e12019-07-01 16:05:58 -06002466 const PIPELINE_STATE *pipeline, spirv_inst_iter entrypoint) const {
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002467 if (pStage->stage == VK_SHADER_STAGE_COMPUTE_BIT || pStage->stage == VK_SHADER_STAGE_ALL_GRAPHICS ||
2468 pStage->stage == VK_SHADER_STAGE_ALL) {
2469 return false;
2470 }
2471
2472 bool skip = false;
Mark Lobodzinski518eadc2019-03-09 12:07:30 -07002473 auto const &limits = phys_dev_props.limits;
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002474
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002475 std::set<uint32_t> patchIDs;
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002476 struct Variable {
2477 uint32_t baseTypePtrID;
2478 uint32_t ID;
2479 uint32_t storageClass;
2480 };
2481 std::vector<Variable> variables;
2482
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002483 uint32_t numVertices = 0;
2484
Jeff Bolzf234bf82019-11-04 14:07:15 -06002485 auto entrypointVariables = FindEntrypointInterfaces(entrypoint);
2486
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002487 for (auto insn : *src) {
2488 switch (insn.opcode()) {
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002489 // Find all Patch decorations
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002490 case spv::OpDecorate:
2491 switch (insn.word(2)) {
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002492 case spv::DecorationPatch: {
2493 patchIDs.insert(insn.word(1));
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002494 break;
2495 }
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002496 default:
2497 break;
2498 }
2499 break;
2500 // Find all input and output variables
2501 case spv::OpVariable: {
2502 Variable var = {};
2503 var.storageClass = insn.word(3);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002504 if ((var.storageClass == spv::StorageClassInput || var.storageClass == spv::StorageClassOutput) &&
2505 // Only include variables in the entrypoint's interface
2506 find(entrypointVariables.begin(), entrypointVariables.end(), insn.word(2)) != entrypointVariables.end()) {
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002507 var.baseTypePtrID = insn.word(1);
2508 var.ID = insn.word(2);
2509 variables.push_back(var);
2510 }
2511 break;
2512 }
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002513 case spv::OpExecutionMode:
2514 if (insn.word(1) == entrypoint.word(2)) {
2515 switch (insn.word(2)) {
2516 default:
2517 break;
2518 case spv::ExecutionModeOutputVertices:
2519 numVertices = insn.word(3);
2520 break;
2521 }
2522 }
2523 break;
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002524 default:
2525 break;
2526 }
2527 }
2528
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002529 bool strip_output_array_level =
2530 (pStage->stage == VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT || pStage->stage == VK_SHADER_STAGE_MESH_BIT_NV);
2531 bool strip_input_array_level =
2532 (pStage->stage == VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT ||
2533 pStage->stage == VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT || pStage->stage == VK_SHADER_STAGE_GEOMETRY_BIT);
2534
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002535 uint32_t numCompIn = 0, numCompOut = 0;
Jeff Bolzf234bf82019-11-04 14:07:15 -06002536 int maxCompIn = 0, maxCompOut = 0;
2537
2538 auto inputs = CollectInterfaceByLocation(src, entrypoint, spv::StorageClassInput, strip_input_array_level);
2539 auto outputs = CollectInterfaceByLocation(src, entrypoint, spv::StorageClassOutput, strip_output_array_level);
2540
2541 // Find max component location used for input variables.
2542 for (auto &var : inputs) {
2543 int location = var.first.first;
2544 int component = var.first.second;
2545 interface_var &iv = var.second;
2546
2547 // Only need to look at the first location, since we use the type's whole size
2548 if (iv.offset != 0) {
2549 continue;
2550 }
2551
2552 if (iv.is_patch) {
2553 continue;
2554 }
2555
2556 int numComponents = GetComponentsConsumedByType(src, iv.type_id, strip_input_array_level);
2557 maxCompIn = std::max(maxCompIn, location * 4 + component + numComponents);
2558 }
2559
2560 // Find max component location used for output variables.
2561 for (auto &var : outputs) {
2562 int location = var.first.first;
2563 int component = var.first.second;
2564 interface_var &iv = var.second;
2565
2566 // Only need to look at the first location, since we use the type's whole size
2567 if (iv.offset != 0) {
2568 continue;
2569 }
2570
2571 if (iv.is_patch) {
2572 continue;
2573 }
2574
2575 int numComponents = GetComponentsConsumedByType(src, iv.type_id, strip_output_array_level);
2576 maxCompOut = std::max(maxCompOut, location * 4 + component + numComponents);
2577 }
2578
2579 // XXX TODO: Would be nice to rewrite this to use CollectInterfaceByLocation (or something similar),
2580 // but that doesn't include builtins.
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002581 for (auto &var : variables) {
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002582 // Check if the variable is a patch. Patches can also be members of blocks,
2583 // but if they are then the top-level arrayness has already been stripped
2584 // by the time GetComponentsConsumedByType gets to it.
2585 bool isPatch = patchIDs.find(var.ID) != patchIDs.end();
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002586
2587 if (var.storageClass == spv::StorageClassInput) {
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002588 numCompIn += GetComponentsConsumedByType(src, var.baseTypePtrID, strip_input_array_level && !isPatch);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002589 } else { // var.storageClass == spv::StorageClassOutput
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002590 numCompOut += GetComponentsConsumedByType(src, var.baseTypePtrID, strip_output_array_level && !isPatch);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002591 }
2592 }
2593
2594 switch (pStage->stage) {
2595 case VK_SHADER_STAGE_VERTEX_BIT:
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002596 if (numCompOut > limits.maxVertexOutputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002597 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2598 "Invalid Pipeline CreateInfo State: Vertex shader exceeds "
2599 "VkPhysicalDeviceLimits::maxVertexOutputComponents of %u "
2600 "components by %u components",
2601 limits.maxVertexOutputComponents, numCompOut - limits.maxVertexOutputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002602 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002603 if (maxCompOut > (int)limits.maxVertexOutputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002604 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2605 "Invalid Pipeline CreateInfo State: Vertex shader output variable uses location that "
2606 "exceeds component limit VkPhysicalDeviceLimits::maxVertexOutputComponents (%u)",
2607 limits.maxVertexOutputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002608 }
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002609 break;
2610
2611 case VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT:
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002612 if (numCompIn > limits.maxTessellationControlPerVertexInputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002613 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2614 "Invalid Pipeline CreateInfo State: Tessellation control shader exceeds "
2615 "VkPhysicalDeviceLimits::maxTessellationControlPerVertexInputComponents of %u "
2616 "components by %u components",
2617 limits.maxTessellationControlPerVertexInputComponents,
2618 numCompIn - limits.maxTessellationControlPerVertexInputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002619 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002620 if (maxCompIn > (int)limits.maxTessellationControlPerVertexInputComponents) {
2621 skip |=
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002622 LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2623 "Invalid Pipeline CreateInfo State: Tessellation control shader input variable uses location that "
2624 "exceeds component limit VkPhysicalDeviceLimits::maxTessellationControlPerVertexInputComponents (%u)",
2625 limits.maxTessellationControlPerVertexInputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002626 }
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002627 if (numCompOut > limits.maxTessellationControlPerVertexOutputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002628 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2629 "Invalid Pipeline CreateInfo State: Tessellation control shader exceeds "
2630 "VkPhysicalDeviceLimits::maxTessellationControlPerVertexOutputComponents of %u "
2631 "components by %u components",
2632 limits.maxTessellationControlPerVertexOutputComponents,
2633 numCompOut - limits.maxTessellationControlPerVertexOutputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002634 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002635 if (maxCompOut > (int)limits.maxTessellationControlPerVertexOutputComponents) {
2636 skip |=
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002637 LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2638 "Invalid Pipeline CreateInfo State: Tessellation control shader output variable uses location that "
2639 "exceeds component limit VkPhysicalDeviceLimits::maxTessellationControlPerVertexOutputComponents (%u)",
2640 limits.maxTessellationControlPerVertexOutputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002641 }
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002642 break;
2643
2644 case VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT:
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002645 if (numCompIn > limits.maxTessellationEvaluationInputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002646 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2647 "Invalid Pipeline CreateInfo State: Tessellation evaluation shader exceeds "
2648 "VkPhysicalDeviceLimits::maxTessellationEvaluationInputComponents of %u "
2649 "components by %u components",
2650 limits.maxTessellationEvaluationInputComponents,
2651 numCompIn - limits.maxTessellationEvaluationInputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002652 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002653 if (maxCompIn > (int)limits.maxTessellationEvaluationInputComponents) {
2654 skip |=
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002655 LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2656 "Invalid Pipeline CreateInfo State: Tessellation evaluation shader input variable uses location that "
2657 "exceeds component limit VkPhysicalDeviceLimits::maxTessellationEvaluationInputComponents (%u)",
2658 limits.maxTessellationEvaluationInputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002659 }
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002660 if (numCompOut > limits.maxTessellationEvaluationOutputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002661 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2662 "Invalid Pipeline CreateInfo State: Tessellation evaluation shader exceeds "
2663 "VkPhysicalDeviceLimits::maxTessellationEvaluationOutputComponents of %u "
2664 "components by %u components",
2665 limits.maxTessellationEvaluationOutputComponents,
2666 numCompOut - limits.maxTessellationEvaluationOutputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002667 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002668 if (maxCompOut > (int)limits.maxTessellationEvaluationOutputComponents) {
2669 skip |=
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002670 LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2671 "Invalid Pipeline CreateInfo State: Tessellation evaluation shader output variable uses location that "
2672 "exceeds component limit VkPhysicalDeviceLimits::maxTessellationEvaluationOutputComponents (%u)",
2673 limits.maxTessellationEvaluationOutputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002674 }
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002675 break;
2676
2677 case VK_SHADER_STAGE_GEOMETRY_BIT:
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002678 if (numCompIn > limits.maxGeometryInputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002679 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2680 "Invalid Pipeline CreateInfo State: Geometry shader exceeds "
2681 "VkPhysicalDeviceLimits::maxGeometryInputComponents of %u "
2682 "components by %u components",
2683 limits.maxGeometryInputComponents, numCompIn - limits.maxGeometryInputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002684 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002685 if (maxCompIn > (int)limits.maxGeometryInputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002686 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2687 "Invalid Pipeline CreateInfo State: Geometry shader input variable uses location that "
2688 "exceeds component limit VkPhysicalDeviceLimits::maxGeometryInputComponents (%u)",
2689 limits.maxGeometryInputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002690 }
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002691 if (numCompOut > limits.maxGeometryOutputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002692 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2693 "Invalid Pipeline CreateInfo State: Geometry shader exceeds "
2694 "VkPhysicalDeviceLimits::maxGeometryOutputComponents of %u "
2695 "components by %u components",
2696 limits.maxGeometryOutputComponents, numCompOut - limits.maxGeometryOutputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002697 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002698 if (maxCompOut > (int)limits.maxGeometryOutputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002699 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2700 "Invalid Pipeline CreateInfo State: Geometry shader output variable uses location that "
2701 "exceeds component limit VkPhysicalDeviceLimits::maxGeometryOutputComponents (%u)",
2702 limits.maxGeometryOutputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002703 }
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002704 if (numCompOut * numVertices > limits.maxGeometryTotalOutputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002705 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2706 "Invalid Pipeline CreateInfo State: Geometry shader exceeds "
2707 "VkPhysicalDeviceLimits::maxGeometryTotalOutputComponents of %u "
2708 "components by %u components",
2709 limits.maxGeometryTotalOutputComponents,
2710 numCompOut * numVertices - limits.maxGeometryTotalOutputComponents);
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002711 }
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002712 break;
2713
2714 case VK_SHADER_STAGE_FRAGMENT_BIT:
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002715 if (numCompIn > limits.maxFragmentInputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002716 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2717 "Invalid Pipeline CreateInfo State: Fragment shader exceeds "
2718 "VkPhysicalDeviceLimits::maxFragmentInputComponents of %u "
2719 "components by %u components",
2720 limits.maxFragmentInputComponents, numCompIn - limits.maxFragmentInputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002721 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002722 if (maxCompIn > (int)limits.maxFragmentInputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002723 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2724 "Invalid Pipeline CreateInfo State: Fragment shader input variable uses location that "
2725 "exceeds component limit VkPhysicalDeviceLimits::maxFragmentInputComponents (%u)",
2726 limits.maxFragmentInputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002727 }
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002728 break;
2729
Jeff Bolz148d94e2018-12-13 21:25:56 -06002730 case VK_SHADER_STAGE_RAYGEN_BIT_NV:
2731 case VK_SHADER_STAGE_ANY_HIT_BIT_NV:
2732 case VK_SHADER_STAGE_CLOSEST_HIT_BIT_NV:
2733 case VK_SHADER_STAGE_MISS_BIT_NV:
2734 case VK_SHADER_STAGE_INTERSECTION_BIT_NV:
2735 case VK_SHADER_STAGE_CALLABLE_BIT_NV:
2736 case VK_SHADER_STAGE_TASK_BIT_NV:
2737 case VK_SHADER_STAGE_MESH_BIT_NV:
2738 break;
2739
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002740 default:
2741 assert(false); // This should never happen
2742 }
2743 return skip;
2744}
2745
sfricke-samsungdc96f302020-03-18 20:42:10 -07002746bool CoreChecks::ValidateShaderStageMaxResources(VkShaderStageFlagBits stage, const PIPELINE_STATE *pipeline) const {
2747 bool skip = false;
2748 uint32_t total_resources = 0;
2749
2750 // Only currently testing for graphics and compute pipelines
2751 // TODO: Add check and support for Ray Tracing pipeline VUID 03428
2752 if ((stage & (VK_SHADER_STAGE_ALL_GRAPHICS | VK_SHADER_STAGE_COMPUTE_BIT)) == 0) {
2753 return false;
2754 }
2755
2756 if (stage == VK_SHADER_STAGE_FRAGMENT_BIT) {
2757 // "For the fragment shader stage the framebuffer color attachments also count against this limit"
2758 total_resources += pipeline->rp_state->createInfo.pSubpasses[pipeline->graphicsPipelineCI.subpass].colorAttachmentCount;
2759 }
2760
2761 // TODO: This reuses a lot of GetDescriptorCountMaxPerStage but currently would need to make it agnostic in a way to handle
2762 // input from CreatePipeline and CreatePipelineLayout level
2763 for (auto set_layout : pipeline->pipeline_layout->set_layouts) {
2764 if ((set_layout->GetCreateFlags() & VK_DESCRIPTOR_SET_LAYOUT_CREATE_UPDATE_AFTER_BIND_POOL_BIT) != 0) {
2765 continue;
2766 }
2767
2768 for (uint32_t binding_idx = 0; binding_idx < set_layout->GetBindingCount(); binding_idx++) {
2769 const VkDescriptorSetLayoutBinding *binding = set_layout->GetDescriptorSetLayoutBindingPtrFromIndex(binding_idx);
2770 // Bindings with a descriptorCount of 0 are "reserved" and should be skipped
2771 if (((stage & binding->stageFlags) != 0) && (binding->descriptorCount > 0)) {
2772 // Check only descriptor types listed in maxPerStageResources description in spec
2773 switch (binding->descriptorType) {
2774 case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
2775 case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
2776 case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
2777 case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
2778 case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER:
2779 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
2780 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER:
2781 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
2782 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC:
2783 case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
2784 total_resources += binding->descriptorCount;
2785 break;
2786 default:
2787 break;
2788 }
2789 }
2790 }
2791 }
2792
2793 if (total_resources > phys_dev_props.limits.maxPerStageResources) {
2794 const char *vuid = (stage == VK_SHADER_STAGE_COMPUTE_BIT) ? "VUID-VkComputePipelineCreateInfo-layout-01687"
2795 : "VUID-VkGraphicsPipelineCreateInfo-layout-01688";
2796 skip |= LogError(pipeline->pipeline, vuid,
2797 "Invalid Pipeline CreateInfo State: Shader Stage %s exceeds component limit "
2798 "VkPhysicalDeviceLimits::maxPerStageResources (%u)",
2799 string_VkShaderStageFlagBits(stage), phys_dev_props.limits.maxPerStageResources);
2800 }
2801
2802 return skip;
2803}
2804
Jeff Bolze4356752019-03-07 11:23:46 -06002805// copy the specialization constant value into buf, if it is present
2806void GetSpecConstantValue(VkPipelineShaderStageCreateInfo const *pStage, uint32_t spec_id, void *buf) {
2807 VkSpecializationInfo const *spec = pStage->pSpecializationInfo;
2808
2809 if (spec && spec_id < spec->mapEntryCount) {
2810 memcpy(buf, (uint8_t *)spec->pData + spec->pMapEntries[spec_id].offset, spec->pMapEntries[spec_id].size);
2811 }
2812}
2813
2814// Fill in value with the constant or specialization constant value, if available.
2815// Returns true if the value has been accurately filled out.
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06002816static bool GetIntConstantValue(spirv_inst_iter insn, SHADER_MODULE_STATE const *src, VkPipelineShaderStageCreateInfo const *pStage,
Jeff Bolze4356752019-03-07 11:23:46 -06002817 const std::unordered_map<uint32_t, uint32_t> &id_to_spec_id, uint32_t *value) {
2818 auto type_id = src->get_def(insn.word(1));
2819 if (type_id.opcode() != spv::OpTypeInt || type_id.word(2) != 32) {
2820 return false;
2821 }
2822 switch (insn.opcode()) {
2823 case spv::OpSpecConstant:
2824 *value = insn.word(3);
2825 GetSpecConstantValue(pStage, id_to_spec_id.at(insn.word(2)), value);
2826 return true;
2827 case spv::OpConstant:
2828 *value = insn.word(3);
2829 return true;
2830 default:
2831 return false;
2832 }
2833}
2834
2835// Map SPIR-V type to VK_COMPONENT_TYPE enum
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06002836VkComponentTypeNV GetComponentType(spirv_inst_iter insn, SHADER_MODULE_STATE const *src) {
Jeff Bolze4356752019-03-07 11:23:46 -06002837 switch (insn.opcode()) {
2838 case spv::OpTypeInt:
2839 switch (insn.word(2)) {
2840 case 8:
2841 return insn.word(3) != 0 ? VK_COMPONENT_TYPE_SINT8_NV : VK_COMPONENT_TYPE_UINT8_NV;
2842 case 16:
2843 return insn.word(3) != 0 ? VK_COMPONENT_TYPE_SINT16_NV : VK_COMPONENT_TYPE_UINT16_NV;
2844 case 32:
2845 return insn.word(3) != 0 ? VK_COMPONENT_TYPE_SINT32_NV : VK_COMPONENT_TYPE_UINT32_NV;
2846 case 64:
2847 return insn.word(3) != 0 ? VK_COMPONENT_TYPE_SINT64_NV : VK_COMPONENT_TYPE_UINT64_NV;
2848 default:
2849 return VK_COMPONENT_TYPE_MAX_ENUM_NV;
2850 }
2851 case spv::OpTypeFloat:
2852 switch (insn.word(2)) {
2853 case 16:
2854 return VK_COMPONENT_TYPE_FLOAT16_NV;
2855 case 32:
2856 return VK_COMPONENT_TYPE_FLOAT32_NV;
2857 case 64:
2858 return VK_COMPONENT_TYPE_FLOAT64_NV;
2859 default:
2860 return VK_COMPONENT_TYPE_MAX_ENUM_NV;
2861 }
2862 default:
2863 return VK_COMPONENT_TYPE_MAX_ENUM_NV;
2864 }
2865}
2866
2867// Validate SPV_NV_cooperative_matrix behavior that can't be statically validated
2868// in SPIRV-Tools (e.g. due to specialization constant usage).
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06002869bool CoreChecks::ValidateCooperativeMatrix(SHADER_MODULE_STATE const *src, VkPipelineShaderStageCreateInfo const *pStage,
John Zulaufac4c6e12019-07-01 16:05:58 -06002870 const PIPELINE_STATE *pipeline) const {
Jeff Bolze4356752019-03-07 11:23:46 -06002871 bool skip = false;
2872
2873 // Map SPIR-V result ID to specialization constant id (SpecId decoration value)
2874 std::unordered_map<uint32_t, uint32_t> id_to_spec_id;
2875 // Map SPIR-V result ID to the ID of its type.
2876 std::unordered_map<uint32_t, uint32_t> id_to_type_id;
2877
2878 struct CoopMatType {
2879 uint32_t scope, rows, cols;
2880 VkComponentTypeNV component_type;
2881 bool all_constant;
2882
2883 CoopMatType() : scope(0), rows(0), cols(0), component_type(VK_COMPONENT_TYPE_MAX_ENUM_NV), all_constant(false) {}
2884
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06002885 void Init(uint32_t id, SHADER_MODULE_STATE const *src, VkPipelineShaderStageCreateInfo const *pStage,
Jeff Bolze4356752019-03-07 11:23:46 -06002886 const std::unordered_map<uint32_t, uint32_t> &id_to_spec_id) {
2887 spirv_inst_iter insn = src->get_def(id);
2888 uint32_t component_type_id = insn.word(2);
2889 uint32_t scope_id = insn.word(3);
2890 uint32_t rows_id = insn.word(4);
2891 uint32_t cols_id = insn.word(5);
2892 auto component_type_iter = src->get_def(component_type_id);
2893 auto scope_iter = src->get_def(scope_id);
2894 auto rows_iter = src->get_def(rows_id);
2895 auto cols_iter = src->get_def(cols_id);
2896
2897 all_constant = true;
2898 if (!GetIntConstantValue(scope_iter, src, pStage, id_to_spec_id, &scope)) {
2899 all_constant = false;
2900 }
2901 if (!GetIntConstantValue(rows_iter, src, pStage, id_to_spec_id, &rows)) {
2902 all_constant = false;
2903 }
2904 if (!GetIntConstantValue(cols_iter, src, pStage, id_to_spec_id, &cols)) {
2905 all_constant = false;
2906 }
2907 component_type = GetComponentType(component_type_iter, src);
2908 }
2909 };
2910
2911 bool seen_coopmat_capability = false;
2912
2913 for (auto insn : *src) {
2914 // Whitelist instructions whose result can be a cooperative matrix type, and
2915 // keep track of their types. It would be nice if SPIRV-Headers generated code
2916 // to identify which instructions have a result type and result id. Lacking that,
2917 // this whitelist is based on the set of instructions that
2918 // SPV_NV_cooperative_matrix says can be used with cooperative matrix types.
2919 switch (insn.opcode()) {
2920 case spv::OpLoad:
2921 case spv::OpCooperativeMatrixLoadNV:
2922 case spv::OpCooperativeMatrixMulAddNV:
2923 case spv::OpSNegate:
2924 case spv::OpFNegate:
2925 case spv::OpIAdd:
2926 case spv::OpFAdd:
2927 case spv::OpISub:
2928 case spv::OpFSub:
2929 case spv::OpFDiv:
2930 case spv::OpSDiv:
2931 case spv::OpUDiv:
2932 case spv::OpMatrixTimesScalar:
2933 case spv::OpConstantComposite:
2934 case spv::OpCompositeConstruct:
2935 case spv::OpConvertFToU:
2936 case spv::OpConvertFToS:
2937 case spv::OpConvertSToF:
2938 case spv::OpConvertUToF:
2939 case spv::OpUConvert:
2940 case spv::OpSConvert:
2941 case spv::OpFConvert:
2942 id_to_type_id[insn.word(2)] = insn.word(1);
2943 break;
2944 default:
2945 break;
2946 }
2947
2948 switch (insn.opcode()) {
2949 case spv::OpDecorate:
2950 if (insn.word(2) == spv::DecorationSpecId) {
2951 id_to_spec_id[insn.word(1)] = insn.word(3);
2952 }
2953 break;
2954 case spv::OpCapability:
2955 if (insn.word(1) == spv::CapabilityCooperativeMatrixNV) {
2956 seen_coopmat_capability = true;
2957
2958 if (!(pStage->stage & phys_dev_ext_props.cooperative_matrix_props.cooperativeMatrixSupportedStages)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002959 skip |= LogError(
2960 pipeline->pipeline, kVUID_Core_Shader_CooperativeMatrixSupportedStages,
2961 "OpTypeCooperativeMatrixNV used in shader stage not in cooperativeMatrixSupportedStages (= %u)",
2962 phys_dev_ext_props.cooperative_matrix_props.cooperativeMatrixSupportedStages);
Jeff Bolze4356752019-03-07 11:23:46 -06002963 }
2964 }
2965 break;
2966 case spv::OpMemoryModel:
2967 // If the capability isn't enabled, don't bother with the rest of this function.
2968 // OpMemoryModel is the first required instruction after all OpCapability instructions.
2969 if (!seen_coopmat_capability) {
2970 return skip;
2971 }
2972 break;
2973 case spv::OpTypeCooperativeMatrixNV: {
2974 CoopMatType M;
2975 M.Init(insn.word(1), src, pStage, id_to_spec_id);
2976
2977 if (M.all_constant) {
2978 // Validate that the type parameters are all supported for one of the
2979 // operands of a cooperative matrix property.
2980 bool valid = false;
2981 for (unsigned i = 0; i < cooperative_matrix_properties.size(); ++i) {
2982 if (cooperative_matrix_properties[i].AType == M.component_type &&
2983 cooperative_matrix_properties[i].MSize == M.rows && cooperative_matrix_properties[i].KSize == M.cols &&
2984 cooperative_matrix_properties[i].scope == M.scope) {
2985 valid = true;
2986 break;
2987 }
2988 if (cooperative_matrix_properties[i].BType == M.component_type &&
2989 cooperative_matrix_properties[i].KSize == M.rows && cooperative_matrix_properties[i].NSize == M.cols &&
2990 cooperative_matrix_properties[i].scope == M.scope) {
2991 valid = true;
2992 break;
2993 }
2994 if (cooperative_matrix_properties[i].CType == M.component_type &&
2995 cooperative_matrix_properties[i].MSize == M.rows && cooperative_matrix_properties[i].NSize == M.cols &&
2996 cooperative_matrix_properties[i].scope == M.scope) {
2997 valid = true;
2998 break;
2999 }
3000 if (cooperative_matrix_properties[i].DType == M.component_type &&
3001 cooperative_matrix_properties[i].MSize == M.rows && cooperative_matrix_properties[i].NSize == M.cols &&
3002 cooperative_matrix_properties[i].scope == M.scope) {
3003 valid = true;
3004 break;
3005 }
3006 }
3007 if (!valid) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003008 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_CooperativeMatrixType,
3009 "OpTypeCooperativeMatrixNV (result id = %u) operands don't match a supported matrix type",
3010 insn.word(1));
Jeff Bolze4356752019-03-07 11:23:46 -06003011 }
3012 }
3013 break;
3014 }
3015 case spv::OpCooperativeMatrixMulAddNV: {
3016 CoopMatType A, B, C, D;
3017 if (id_to_type_id.find(insn.word(2)) == id_to_type_id.end() ||
3018 id_to_type_id.find(insn.word(3)) == id_to_type_id.end() ||
3019 id_to_type_id.find(insn.word(4)) == id_to_type_id.end() ||
3020 id_to_type_id.find(insn.word(5)) == id_to_type_id.end()) {
Mike Schuchardte48dc142019-04-18 09:12:03 -07003021 // Couldn't find type of matrix
3022 assert(false);
Jeff Bolze4356752019-03-07 11:23:46 -06003023 break;
3024 }
3025 D.Init(id_to_type_id[insn.word(2)], src, pStage, id_to_spec_id);
3026 A.Init(id_to_type_id[insn.word(3)], src, pStage, id_to_spec_id);
3027 B.Init(id_to_type_id[insn.word(4)], src, pStage, id_to_spec_id);
3028 C.Init(id_to_type_id[insn.word(5)], src, pStage, id_to_spec_id);
3029
3030 if (A.all_constant && B.all_constant && C.all_constant && D.all_constant) {
3031 // Validate that the type parameters are all supported for the same
3032 // cooperative matrix property.
3033 bool valid = false;
3034 for (unsigned i = 0; i < cooperative_matrix_properties.size(); ++i) {
3035 if (cooperative_matrix_properties[i].AType == A.component_type &&
3036 cooperative_matrix_properties[i].MSize == A.rows && cooperative_matrix_properties[i].KSize == A.cols &&
3037 cooperative_matrix_properties[i].scope == A.scope &&
3038
3039 cooperative_matrix_properties[i].BType == B.component_type &&
3040 cooperative_matrix_properties[i].KSize == B.rows && cooperative_matrix_properties[i].NSize == B.cols &&
3041 cooperative_matrix_properties[i].scope == B.scope &&
3042
3043 cooperative_matrix_properties[i].CType == C.component_type &&
3044 cooperative_matrix_properties[i].MSize == C.rows && cooperative_matrix_properties[i].NSize == C.cols &&
3045 cooperative_matrix_properties[i].scope == C.scope &&
3046
3047 cooperative_matrix_properties[i].DType == D.component_type &&
3048 cooperative_matrix_properties[i].MSize == D.rows && cooperative_matrix_properties[i].NSize == D.cols &&
3049 cooperative_matrix_properties[i].scope == D.scope) {
3050 valid = true;
3051 break;
3052 }
3053 }
3054 if (!valid) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003055 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_CooperativeMatrixMulAdd,
3056 "OpCooperativeMatrixMulAddNV (result id = %u) operands don't match a supported matrix "
3057 "VkCooperativeMatrixPropertiesNV",
3058 insn.word(2));
Jeff Bolze4356752019-03-07 11:23:46 -06003059 }
3060 }
3061 break;
3062 }
3063 default:
3064 break;
3065 }
3066 }
3067
3068 return skip;
3069}
3070
John Zulaufac4c6e12019-07-01 16:05:58 -06003071bool CoreChecks::ValidateExecutionModes(SHADER_MODULE_STATE const *src, spirv_inst_iter entrypoint) const {
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00003072 auto entrypoint_id = entrypoint.word(2);
3073
Attilio Provenzanof6c0e852019-04-09 11:01:18 +01003074 // The first denorm execution mode encountered, along with its bit width.
3075 // Used to check if SeparateDenormSettings is respected.
3076 std::pair<spv::ExecutionMode, uint32_t> first_denorm_execution_mode = std::make_pair(spv::ExecutionModeMax, 0);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00003077
Attilio Provenzanof6c0e852019-04-09 11:01:18 +01003078 // The first rounding mode encountered, along with its bit width.
3079 // Used to check if SeparateRoundingModeSettings is respected.
3080 std::pair<spv::ExecutionMode, uint32_t> first_rounding_mode = std::make_pair(spv::ExecutionModeMax, 0);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00003081
3082 bool skip = false;
3083
Jeff Bolze9ee3d82019-05-29 13:45:13 -05003084 uint32_t verticesOut = 0;
3085 uint32_t invocations = 0;
3086
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00003087 for (auto insn : *src) {
3088 if (insn.opcode() == spv::OpExecutionMode && insn.word(1) == entrypoint_id) {
3089 auto mode = insn.word(2);
3090 switch (mode) {
3091 case spv::ExecutionModeSignedZeroInfNanPreserve: {
3092 auto bit_width = insn.word(3);
Piers Daniell41b8c5d2020-01-10 15:42:00 -07003093 if ((bit_width == 16 && !phys_dev_props_core12.shaderSignedZeroInfNanPreserveFloat16) ||
3094 (bit_width == 32 && !phys_dev_props_core12.shaderSignedZeroInfNanPreserveFloat32) ||
3095 (bit_width == 64 && !phys_dev_props_core12.shaderSignedZeroInfNanPreserveFloat64)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003096 skip |= LogError(
3097 device, kVUID_Core_Shader_FeatureNotEnabled,
3098 "Shader requires SignedZeroInfNanPreserve for bit width %d but it is not enabled on the device",
3099 bit_width);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00003100 }
3101 break;
3102 }
3103
3104 case spv::ExecutionModeDenormPreserve: {
3105 auto bit_width = insn.word(3);
Piers Daniell41b8c5d2020-01-10 15:42:00 -07003106 if ((bit_width == 16 && !phys_dev_props_core12.shaderDenormPreserveFloat16) ||
3107 (bit_width == 32 && !phys_dev_props_core12.shaderDenormPreserveFloat32) ||
3108 (bit_width == 64 && !phys_dev_props_core12.shaderDenormPreserveFloat64)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003109 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
3110 "Shader requires DenormPreserve for bit width %d but it is not enabled on the device",
3111 bit_width);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00003112 }
3113
Attilio Provenzanof6c0e852019-04-09 11:01:18 +01003114 if (first_denorm_execution_mode.first == spv::ExecutionModeMax) {
3115 // Register the first denorm execution mode found
3116 first_denorm_execution_mode = std::make_pair(static_cast<spv::ExecutionMode>(mode), bit_width);
Jason Ekstrande1e06de2019-08-05 11:43:43 -05003117 } else if (first_denorm_execution_mode.first != mode && first_denorm_execution_mode.second != bit_width) {
Piers Daniell41b8c5d2020-01-10 15:42:00 -07003118 switch (phys_dev_props_core12.denormBehaviorIndependence) {
Jason Ekstrande1e06de2019-08-05 11:43:43 -05003119 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR:
3120 if (first_rounding_mode.second != 32 && bit_width != 32) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003121 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
3122 "Shader uses different denorm execution modes for 16 and 64-bit but "
3123 "denormBehaviorIndependence is "
3124 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05003125 }
3126 break;
3127
3128 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_ALL_KHR:
3129 break;
3130
3131 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR:
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003132 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
3133 "Shader uses different denorm execution modes for different bit widths but "
3134 "denormBehaviorIndependence is "
3135 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05003136 break;
3137
3138 default:
3139 break;
3140 }
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00003141 }
3142 break;
3143 }
3144
3145 case spv::ExecutionModeDenormFlushToZero: {
3146 auto bit_width = insn.word(3);
Piers Daniell41b8c5d2020-01-10 15:42:00 -07003147 if ((bit_width == 16 && !phys_dev_props_core12.shaderDenormFlushToZeroFloat16) ||
3148 (bit_width == 32 && !phys_dev_props_core12.shaderDenormFlushToZeroFloat32) ||
3149 (bit_width == 64 && !phys_dev_props_core12.shaderDenormFlushToZeroFloat64)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003150 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
3151 "Shader requires DenormFlushToZero for bit width %d but it is not enabled on the device",
3152 bit_width);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00003153 }
3154
Attilio Provenzanof6c0e852019-04-09 11:01:18 +01003155 if (first_denorm_execution_mode.first == spv::ExecutionModeMax) {
3156 // Register the first denorm execution mode found
3157 first_denorm_execution_mode = std::make_pair(static_cast<spv::ExecutionMode>(mode), bit_width);
Jason Ekstrande1e06de2019-08-05 11:43:43 -05003158 } else if (first_denorm_execution_mode.first != mode && first_denorm_execution_mode.second != bit_width) {
Piers Daniell41b8c5d2020-01-10 15:42:00 -07003159 switch (phys_dev_props_core12.denormBehaviorIndependence) {
Jason Ekstrande1e06de2019-08-05 11:43:43 -05003160 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR:
3161 if (first_rounding_mode.second != 32 && bit_width != 32) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003162 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
3163 "Shader uses different denorm execution modes for 16 and 64-bit but "
3164 "denormBehaviorIndependence is "
3165 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05003166 }
3167 break;
3168
3169 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_ALL_KHR:
3170 break;
3171
3172 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR:
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003173 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
3174 "Shader uses different denorm execution modes for different bit widths but "
3175 "denormBehaviorIndependence is "
3176 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05003177 break;
3178
3179 default:
3180 break;
3181 }
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00003182 }
3183 break;
3184 }
3185
3186 case spv::ExecutionModeRoundingModeRTE: {
3187 auto bit_width = insn.word(3);
Piers Daniell41b8c5d2020-01-10 15:42:00 -07003188 if ((bit_width == 16 && !phys_dev_props_core12.shaderRoundingModeRTEFloat16) ||
3189 (bit_width == 32 && !phys_dev_props_core12.shaderRoundingModeRTEFloat32) ||
3190 (bit_width == 64 && !phys_dev_props_core12.shaderRoundingModeRTEFloat64)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003191 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
3192 "Shader requires RoundingModeRTE for bit width %d but it is not enabled on the device",
3193 bit_width);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00003194 }
3195
Attilio Provenzanof6c0e852019-04-09 11:01:18 +01003196 if (first_rounding_mode.first == spv::ExecutionModeMax) {
3197 // Register the first rounding mode found
3198 first_rounding_mode = std::make_pair(static_cast<spv::ExecutionMode>(mode), bit_width);
Jason Ekstrande1e06de2019-08-05 11:43:43 -05003199 } else if (first_rounding_mode.first != mode && first_rounding_mode.second != bit_width) {
Piers Daniell41b8c5d2020-01-10 15:42:00 -07003200 switch (phys_dev_props_core12.roundingModeIndependence) {
Jason Ekstrande1e06de2019-08-05 11:43:43 -05003201 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR:
3202 if (first_rounding_mode.second != 32 && bit_width != 32) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003203 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
3204 "Shader uses different rounding modes for 16 and 64-bit but "
3205 "roundingModeIndependence is "
3206 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05003207 }
3208 break;
3209
3210 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_ALL_KHR:
3211 break;
3212
3213 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR:
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003214 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
3215 "Shader uses different rounding modes for different bit widths but "
3216 "roundingModeIndependence is "
3217 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05003218 break;
3219
3220 default:
3221 break;
3222 }
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00003223 }
3224 break;
3225 }
3226
3227 case spv::ExecutionModeRoundingModeRTZ: {
3228 auto bit_width = insn.word(3);
Piers Daniell41b8c5d2020-01-10 15:42:00 -07003229 if ((bit_width == 16 && !phys_dev_props_core12.shaderRoundingModeRTZFloat16) ||
3230 (bit_width == 32 && !phys_dev_props_core12.shaderRoundingModeRTZFloat32) ||
3231 (bit_width == 64 && !phys_dev_props_core12.shaderRoundingModeRTZFloat64)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003232 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
3233 "Shader requires RoundingModeRTZ for bit width %d but it is not enabled on the device",
3234 bit_width);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00003235 }
3236
Attilio Provenzanof6c0e852019-04-09 11:01:18 +01003237 if (first_rounding_mode.first == spv::ExecutionModeMax) {
3238 // Register the first rounding mode found
3239 first_rounding_mode = std::make_pair(static_cast<spv::ExecutionMode>(mode), bit_width);
Jason Ekstrande1e06de2019-08-05 11:43:43 -05003240 } else if (first_rounding_mode.first != mode && first_rounding_mode.second != bit_width) {
Piers Daniell41b8c5d2020-01-10 15:42:00 -07003241 switch (phys_dev_props_core12.roundingModeIndependence) {
Jason Ekstrande1e06de2019-08-05 11:43:43 -05003242 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR:
3243 if (first_rounding_mode.second != 32 && bit_width != 32) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003244 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
3245 "Shader uses different rounding modes for 16 and 64-bit but "
3246 "roundingModeIndependence is "
3247 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05003248 }
3249 break;
3250
3251 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_ALL_KHR:
3252 break;
3253
3254 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR:
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003255 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
3256 "Shader uses different rounding modes for different bit widths but "
3257 "roundingModeIndependence is "
3258 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05003259 break;
3260
3261 default:
3262 break;
3263 }
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00003264 }
3265 break;
3266 }
Jeff Bolze9ee3d82019-05-29 13:45:13 -05003267
3268 case spv::ExecutionModeOutputVertices: {
3269 verticesOut = insn.word(3);
3270 break;
3271 }
3272
3273 case spv::ExecutionModeInvocations: {
3274 invocations = insn.word(3);
3275 break;
3276 }
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00003277 }
3278 }
3279 }
3280
Jeff Bolze9ee3d82019-05-29 13:45:13 -05003281 if (entrypoint.word(1) == spv::ExecutionModelGeometry) {
3282 if (verticesOut == 0 || verticesOut > phys_dev_props.limits.maxGeometryOutputVertices) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003283 skip |= LogError(device, "VUID-VkPipelineShaderStageCreateInfo-stage-00714",
3284 "Geometry shader entry point must have an OpExecutionMode instruction that "
3285 "specifies a maximum output vertex count that is greater than 0 and less "
3286 "than or equal to maxGeometryOutputVertices. "
3287 "OutputVertices=%d, maxGeometryOutputVertices=%d",
3288 verticesOut, phys_dev_props.limits.maxGeometryOutputVertices);
Jeff Bolze9ee3d82019-05-29 13:45:13 -05003289 }
3290
3291 if (invocations == 0 || invocations > phys_dev_props.limits.maxGeometryShaderInvocations) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003292 skip |= LogError(device, "VUID-VkPipelineShaderStageCreateInfo-stage-00715",
3293 "Geometry shader entry point must have an OpExecutionMode instruction that "
3294 "specifies an invocation count that is greater than 0 and less "
3295 "than or equal to maxGeometryShaderInvocations. "
3296 "Invocations=%d, maxGeometryShaderInvocations=%d",
3297 invocations, phys_dev_props.limits.maxGeometryShaderInvocations);
Jeff Bolze9ee3d82019-05-29 13:45:13 -05003298 }
3299 }
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00003300 return skip;
3301}
3302
locke-lunargd9a069d2019-09-17 01:50:19 -06003303uint32_t DescriptorTypeToReqs(SHADER_MODULE_STATE const *module, uint32_t type_id) {
Chris Forbes47567b72017-06-09 12:09:45 -07003304 auto type = module->get_def(type_id);
3305
3306 while (true) {
3307 switch (type.opcode()) {
3308 case spv::OpTypeArray:
Chris Forbes062f1222018-08-21 15:34:15 -07003309 case spv::OpTypeRuntimeArray:
Chris Forbes47567b72017-06-09 12:09:45 -07003310 case spv::OpTypeSampledImage:
3311 type = module->get_def(type.word(2));
3312 break;
3313 case spv::OpTypePointer:
3314 type = module->get_def(type.word(3));
3315 break;
3316 case spv::OpTypeImage: {
3317 auto dim = type.word(3);
3318 auto arrayed = type.word(5);
3319 auto msaa = type.word(6);
3320
Chris Forbes74ba2232018-08-27 15:19:27 -07003321 uint32_t bits = 0;
3322 switch (GetFundamentalType(module, type.word(2))) {
3323 case FORMAT_TYPE_FLOAT:
3324 bits = DESCRIPTOR_REQ_COMPONENT_TYPE_FLOAT;
3325 break;
3326 case FORMAT_TYPE_UINT:
3327 bits = DESCRIPTOR_REQ_COMPONENT_TYPE_UINT;
3328 break;
3329 case FORMAT_TYPE_SINT:
3330 bits = DESCRIPTOR_REQ_COMPONENT_TYPE_SINT;
3331 break;
3332 default:
3333 break;
3334 }
3335
Chris Forbes47567b72017-06-09 12:09:45 -07003336 switch (dim) {
3337 case spv::Dim1D:
Chris Forbes74ba2232018-08-27 15:19:27 -07003338 bits |= arrayed ? DESCRIPTOR_REQ_VIEW_TYPE_1D_ARRAY : DESCRIPTOR_REQ_VIEW_TYPE_1D;
3339 return bits;
Chris Forbes47567b72017-06-09 12:09:45 -07003340 case spv::Dim2D:
Chris Forbes74ba2232018-08-27 15:19:27 -07003341 bits |= msaa ? DESCRIPTOR_REQ_MULTI_SAMPLE : DESCRIPTOR_REQ_SINGLE_SAMPLE;
3342 bits |= arrayed ? DESCRIPTOR_REQ_VIEW_TYPE_2D_ARRAY : DESCRIPTOR_REQ_VIEW_TYPE_2D;
3343 return bits;
Chris Forbes47567b72017-06-09 12:09:45 -07003344 case spv::Dim3D:
Chris Forbes74ba2232018-08-27 15:19:27 -07003345 bits |= DESCRIPTOR_REQ_VIEW_TYPE_3D;
3346 return bits;
Chris Forbes47567b72017-06-09 12:09:45 -07003347 case spv::DimCube:
Chris Forbes74ba2232018-08-27 15:19:27 -07003348 bits |= arrayed ? DESCRIPTOR_REQ_VIEW_TYPE_CUBE_ARRAY : DESCRIPTOR_REQ_VIEW_TYPE_CUBE;
3349 return bits;
Chris Forbes47567b72017-06-09 12:09:45 -07003350 case spv::DimSubpassData:
Chris Forbes74ba2232018-08-27 15:19:27 -07003351 bits |= msaa ? DESCRIPTOR_REQ_MULTI_SAMPLE : DESCRIPTOR_REQ_SINGLE_SAMPLE;
3352 return bits;
Chris Forbes47567b72017-06-09 12:09:45 -07003353 default: // buffer, etc.
Chris Forbes74ba2232018-08-27 15:19:27 -07003354 return bits;
Chris Forbes47567b72017-06-09 12:09:45 -07003355 }
3356 }
3357 default:
3358 return 0;
3359 }
3360 }
3361}
3362
3363// For given pipelineLayout verify that the set_layout_node at slot.first
3364// has the requested binding at slot.second and return ptr to that binding
Mark Lobodzinskica6ebe32019-04-25 11:43:37 -06003365static VkDescriptorSetLayoutBinding const *GetDescriptorBinding(PIPELINE_LAYOUT_STATE const *pipelineLayout,
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003366 descriptor_slot_t slot) {
Chris Forbes47567b72017-06-09 12:09:45 -07003367 if (!pipelineLayout) return nullptr;
3368
3369 if (slot.first >= pipelineLayout->set_layouts.size()) return nullptr;
3370
3371 return pipelineLayout->set_layouts[slot.first]->GetDescriptorSetLayoutBindingPtrFromBinding(slot.second);
3372}
3373
Sam Wallsd7ab6db2020-06-19 20:41:54 +01003374int32_t GetShaderResourceDimensionality(const SHADER_MODULE_STATE *module, const interface_var &resource) {
3375 if (module == nullptr) return -1;
3376
3377 auto type = module->get_def(resource.type_id);
3378 while (true) {
3379 switch (type.opcode()) {
3380 case spv::OpTypeSampledImage:
3381 type = module->get_def(type.word(2));
3382 break;
3383 case spv::OpTypePointer:
3384 type = module->get_def(type.word(3));
3385 break;
3386 case spv::OpTypeImage:
3387 return type.word(3);
3388 default:
3389 return -1;
3390 }
3391 }
3392}
3393
3394bool FindLocalSize(SHADER_MODULE_STATE const *src, uint32_t &local_size_x, uint32_t &local_size_y, uint32_t &local_size_z) {
Locke1ec6d952019-04-02 11:57:21 -06003395 for (auto insn : *src) {
3396 if (insn.opcode() == spv::OpEntryPoint) {
3397 auto executionModel = insn.word(1);
3398 auto entrypointStageBits = ExecutionModelToShaderStageFlagBits(executionModel);
3399 if (entrypointStageBits == VK_SHADER_STAGE_COMPUTE_BIT) {
3400 auto entrypoint_id = insn.word(2);
3401 for (auto insn1 : *src) {
3402 if (insn1.opcode() == spv::OpExecutionMode && insn1.word(1) == entrypoint_id &&
3403 insn1.word(2) == spv::ExecutionModeLocalSize) {
3404 local_size_x = insn1.word(3);
3405 local_size_y = insn1.word(4);
3406 local_size_z = insn1.word(5);
3407 return true;
3408 }
3409 }
3410 }
3411 }
3412 }
3413 return false;
3414}
3415
locke-lunargd9a069d2019-09-17 01:50:19 -06003416void ProcessExecutionModes(SHADER_MODULE_STATE const *src, const spirv_inst_iter &entrypoint, PIPELINE_STATE *pipeline) {
Jeff Bolz105d6492018-09-29 15:46:44 -05003417 auto entrypoint_id = entrypoint.word(2);
Chris Forbes0771b672018-03-22 21:13:46 -07003418 bool is_point_mode = false;
3419
3420 for (auto insn : *src) {
3421 if (insn.opcode() == spv::OpExecutionMode && insn.word(1) == entrypoint_id) {
3422 switch (insn.word(2)) {
3423 case spv::ExecutionModePointMode:
3424 // In tessellation shaders, PointMode is separate and trumps the tessellation topology.
3425 is_point_mode = true;
3426 break;
3427
3428 case spv::ExecutionModeOutputPoints:
3429 pipeline->topology_at_rasterizer = VK_PRIMITIVE_TOPOLOGY_POINT_LIST;
3430 break;
3431
3432 case spv::ExecutionModeIsolines:
3433 case spv::ExecutionModeOutputLineStrip:
3434 pipeline->topology_at_rasterizer = VK_PRIMITIVE_TOPOLOGY_LINE_STRIP;
3435 break;
3436
3437 case spv::ExecutionModeTriangles:
3438 case spv::ExecutionModeQuads:
3439 case spv::ExecutionModeOutputTriangleStrip:
3440 pipeline->topology_at_rasterizer = VK_PRIMITIVE_TOPOLOGY_TRIANGLE_STRIP;
3441 break;
3442 }
3443 }
3444 }
3445
3446 if (is_point_mode) pipeline->topology_at_rasterizer = VK_PRIMITIVE_TOPOLOGY_POINT_LIST;
3447}
3448
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003449// If PointList topology is specified in the pipeline, verify that a shader geometry stage writes PointSize
3450// o If there is only a vertex shader : gl_PointSize must be written when using points
3451// o If there is a geometry or tessellation shader:
3452// - If shaderTessellationAndGeometryPointSize feature is enabled:
3453// * gl_PointSize must be written in the final geometry stage
3454// - If shaderTessellationAndGeometryPointSize feature is disabled:
3455// * gl_PointSize must NOT be written and a default of 1.0 is assumed
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06003456bool CoreChecks::ValidatePointListShaderState(const PIPELINE_STATE *pipeline, SHADER_MODULE_STATE const *src,
John Zulaufac4c6e12019-07-01 16:05:58 -06003457 spirv_inst_iter entrypoint, VkShaderStageFlagBits stage) const {
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003458 if (pipeline->topology_at_rasterizer != VK_PRIMITIVE_TOPOLOGY_POINT_LIST) {
3459 return false;
3460 }
3461
3462 bool pointsize_written = false;
3463 bool skip = false;
3464
3465 // Search for PointSize built-in decorations
3466 std::vector<uint32_t> pointsize_builtin_offsets;
3467 spirv_inst_iter insn = entrypoint;
3468 while (!pointsize_written && (insn.opcode() != spv::OpFunction)) {
3469 if (insn.opcode() == spv::OpMemberDecorate) {
3470 if (insn.word(3) == spv::DecorationBuiltIn) {
3471 if (insn.word(4) == spv::BuiltInPointSize) {
3472 pointsize_written = IsPointSizeWritten(src, insn, entrypoint);
3473 }
3474 }
3475 } else if (insn.opcode() == spv::OpDecorate) {
3476 if (insn.word(2) == spv::DecorationBuiltIn) {
3477 if (insn.word(3) == spv::BuiltInPointSize) {
3478 pointsize_written = IsPointSizeWritten(src, insn, entrypoint);
3479 }
3480 }
3481 }
3482
3483 insn++;
3484 }
3485
3486 if ((stage == VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT || stage == VK_SHADER_STAGE_GEOMETRY_BIT) &&
Mark Lobodzinskid7b03cc2019-04-19 14:23:10 -06003487 !enabled_features.core.shaderTessellationAndGeometryPointSize) {
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003488 if (pointsize_written) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003489 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_PointSizeBuiltInOverSpecified,
3490 "Pipeline topology is set to POINT_LIST and geometry or tessellation shaders write PointSize which "
3491 "is prohibited when the shaderTessellationAndGeometryPointSize feature is not enabled.");
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003492 }
3493 } else if (!pointsize_written) {
3494 skip |=
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003495 LogError(pipeline->pipeline, kVUID_Core_Shader_MissingPointSizeBuiltIn,
3496 "Pipeline topology is set to POINT_LIST, but PointSize is not written to in the shader corresponding to %s.",
3497 string_VkShaderStageFlagBits(stage));
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003498 }
3499 return skip;
3500}
John Zulauf14c355b2019-06-27 16:09:37 -06003501
3502bool CoreChecks::ValidatePipelineShaderStage(VkPipelineShaderStageCreateInfo const *pStage, const PIPELINE_STATE *pipeline,
3503 const PIPELINE_STATE::StageState &stage_state, const SHADER_MODULE_STATE *module,
John Zulaufac4c6e12019-07-01 16:05:58 -06003504 const spirv_inst_iter &entrypoint, bool check_point_size) const {
John Zulauf14c355b2019-06-27 16:09:37 -06003505 bool skip = false;
3506
3507 // Check the module
3508 if (!module->has_valid_spirv) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003509 skip |= LogError(device, "VUID-VkPipelineShaderStageCreateInfo-module-parameter",
3510 "%s does not contain valid spirv for stage %s.",
3511 report_data->FormatHandle(module->vk_shader_module).c_str(), string_VkShaderStageFlagBits(pStage->stage));
John Zulauf14c355b2019-06-27 16:09:37 -06003512 }
3513
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003514 // If specialization-constant values are given and specialization-constant instructions are present in the shader, the
3515 // specializations should be applied and validated.
3516 if (pStage->pSpecializationInfo != nullptr && pStage->pSpecializationInfo->mapEntryCount > 0 &&
3517 pStage->pSpecializationInfo->pMapEntries != nullptr && module->has_specialization_constants) {
3518 // Gather the specialization-constant values.
3519 auto const &specialization_info = pStage->pSpecializationInfo;
Jeremy Hayes521221d2020-01-15 16:48:49 -07003520 auto const &specialization_data = reinterpret_cast<uint8_t const *>(specialization_info->pData);
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003521 std::unordered_map<uint32_t, std::vector<uint32_t>> id_value_map;
3522 id_value_map.reserve(specialization_info->mapEntryCount);
3523 for (auto i = 0u; i < specialization_info->mapEntryCount; ++i) {
3524 auto const &map_entry = specialization_info->pMapEntries[i];
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003525
Jeremy Hayes521221d2020-01-15 16:48:49 -07003526 // Expect only scalar types.
3527 assert(map_entry.size == 1 || map_entry.size == 2 || map_entry.size == 4 || map_entry.size == 8);
3528 auto entry = id_value_map.emplace(map_entry.constantID, std::vector<uint32_t>(map_entry.size > 4 ? 2 : 1));
3529 memcpy(entry.first->second.data(), specialization_data + map_entry.offset, map_entry.size);
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003530 }
3531
3532 // Apply the specialization-constant values and revalidate the shader module.
Tony-LunarG8a51b7d2020-07-01 15:57:23 -06003533 spv_target_env spirv_environment = PickSpirvEnv(api_version, (device_extensions.vk_khr_spirv_1_4 != kNotEnabled));
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003534 spvtools::Optimizer optimizer(spirv_environment);
3535 spvtools::MessageConsumer consumer = [&skip, &module, &pStage, this](spv_message_level_t level, const char *source,
3536 const spv_position_t &position, const char *message) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003537 skip |= LogError(
3538 device, "VUID-VkPipelineShaderStageCreateInfo-module-parameter", "%s does not contain valid spirv for stage %s. %s",
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003539 report_data->FormatHandle(module->vk_shader_module).c_str(), string_VkShaderStageFlagBits(pStage->stage), message);
3540 };
3541 optimizer.SetMessageConsumer(consumer);
3542 optimizer.RegisterPass(spvtools::CreateSetSpecConstantDefaultValuePass(id_value_map));
3543 optimizer.RegisterPass(spvtools::CreateFreezeSpecConstantValuePass());
3544 std::vector<uint32_t> specialized_spirv;
3545 auto const optimized =
3546 optimizer.Run(module->words.data(), module->words.size(), &specialized_spirv, spvtools::ValidatorOptions(), true);
3547 assert(optimized == true);
3548
3549 if (optimized) {
3550 spv_context ctx = spvContextCreate(spirv_environment);
3551 spv_const_binary_t binary{specialized_spirv.data(), specialized_spirv.size()};
3552 spv_diagnostic diag = nullptr;
Tony-LunarG9fe69a42020-07-23 15:09:37 -06003553 spvtools::ValidatorOptions options;
3554 AdjustValidatorOptions(device_extensions, enabled_features, options);
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003555 auto const spv_valid = spvValidateWithOptions(ctx, options, &binary, &diag);
3556 if (spv_valid != SPV_SUCCESS) {
sfricke-samsungd3793802020-08-18 22:55:03 -07003557 skip |= LogError(device, "VUID-VkPipelineShaderStageCreateInfo-module-04145",
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003558 "After specialization was applied, %s does not contain valid spirv for stage %s.",
3559 report_data->FormatHandle(module->vk_shader_module).c_str(),
3560 string_VkShaderStageFlagBits(pStage->stage));
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003561 }
3562
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003563 spvDiagnosticDestroy(diag);
3564 spvContextDestroy(ctx);
3565 }
3566 }
3567
John Zulauf14c355b2019-06-27 16:09:37 -06003568 // Check the entrypoint
3569 if (entrypoint == module->end()) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003570 skip |=
3571 LogError(device, "VUID-VkPipelineShaderStageCreateInfo-pName-00707", "No entrypoint found named `%s` for stage %s..",
3572 pStage->pName, string_VkShaderStageFlagBits(pStage->stage));
John Zulauf14c355b2019-06-27 16:09:37 -06003573 }
3574 if (skip) return true; // no point continuing beyond here, any analysis is just going to be garbage.
3575
3576 // Mark accessible ids
3577 auto &accessible_ids = stage_state.accessible_ids;
3578
Chris Forbes47567b72017-06-09 12:09:45 -07003579 // Validate descriptor set layout against what the entrypoint actually uses
John Zulauf14c355b2019-06-27 16:09:37 -06003580 bool has_writable_descriptor = stage_state.has_writable_descriptor;
3581 auto &descriptor_uses = stage_state.descriptor_uses;
Chris Forbes47567b72017-06-09 12:09:45 -07003582
Chris Forbes349b3132018-03-07 11:38:08 -08003583 // Validate shader capabilities against enabled device features
Jeff Bolzee743412019-06-20 22:24:32 -05003584 skip |= ValidateShaderCapabilities(module, pStage->stage);
locke-lunarg63e4daf2020-08-17 17:53:25 -06003585 skip |=
3586 ValidateShaderStageWritableOrAtomicDescriptor(pStage->stage, has_writable_descriptor, stage_state.has_atomic_descriptor);
Jeff Bolze9ee3d82019-05-29 13:45:13 -05003587 skip |= ValidateShaderStageInputOutputLimits(module, pStage, pipeline, entrypoint);
sfricke-samsungdc96f302020-03-18 20:42:10 -07003588 skip |= ValidateShaderStageMaxResources(pStage->stage, pipeline);
Jeff Bolz526f2d52019-09-18 13:18:08 -05003589 skip |= ValidateShaderStageGroupNonUniform(module, pStage->stage);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00003590 skip |= ValidateExecutionModes(module, entrypoint);
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07003591 skip |= ValidateSpecializationOffsets(pStage);
locke-lunargde3f0fa2020-09-10 11:55:31 -06003592 skip |= ValidatePushConstantUsage(*pipeline, module, pStage);
Jeff Bolze54ae892018-09-08 12:16:29 -05003593 if (check_point_size && !pipeline->graphicsPipelineCI.pRasterizationState->rasterizerDiscardEnable) {
Mark Lobodzinski518eadc2019-03-09 12:07:30 -07003594 skip |= ValidatePointListShaderState(pipeline, module, entrypoint, pStage->stage);
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003595 }
sfricke-samsungef2a68c2020-10-26 04:22:46 -07003596 skip |= ValidateBuiltinLimits(module, accessible_ids, pStage->stage);
Jeff Bolze4356752019-03-07 11:23:46 -06003597 skip |= ValidateCooperativeMatrix(module, pStage, pipeline);
Chris Forbes47567b72017-06-09 12:09:45 -07003598
locke-lunarg9a16ebb2020-07-30 16:56:33 -06003599 std::string vuid_layout_mismatch;
3600 if (pipeline->graphicsPipelineCI.sType == VK_STRUCTURE_TYPE_GRAPHICS_PIPELINE_CREATE_INFO) {
3601 vuid_layout_mismatch = "VUID-VkGraphicsPipelineCreateInfo-layout-00756";
3602 } else if (pipeline->computePipelineCI.sType == VK_STRUCTURE_TYPE_COMPUTE_PIPELINE_CREATE_INFO) {
3603 vuid_layout_mismatch = "VUID-VkComputePipelineCreateInfo-layout-00703";
3604 } else if (pipeline->raytracingPipelineCI.sType == VK_STRUCTURE_TYPE_RAY_TRACING_PIPELINE_CREATE_INFO_KHR) {
3605 vuid_layout_mismatch = "VUID-VkRayTracingPipelineCreateInfoKHR-layout-03427";
3606 } else if (pipeline->raytracingPipelineCI.sType == VK_STRUCTURE_TYPE_RAY_TRACING_PIPELINE_CREATE_INFO_NV) {
3607 vuid_layout_mismatch = "VUID-VkRayTracingPipelineCreateInfoNV-layout-03427";
3608 }
3609
Chris Forbes47567b72017-06-09 12:09:45 -07003610 // Validate descriptor use
3611 for (auto use : descriptor_uses) {
Chris Forbes47567b72017-06-09 12:09:45 -07003612 // Verify given pipelineLayout has requested setLayout with requested binding
Jeff Bolze7fc67b2019-10-04 12:29:31 -05003613 const auto &binding = GetDescriptorBinding(pipeline->pipeline_layout.get(), use.first);
Chris Forbes47567b72017-06-09 12:09:45 -07003614 unsigned required_descriptor_count;
Jeff Bolze54ae892018-09-08 12:16:29 -05003615 std::set<uint32_t> descriptor_types = TypeToDescriptorTypeSet(module, use.second.type_id, required_descriptor_count);
Chris Forbes47567b72017-06-09 12:09:45 -07003616
3617 if (!binding) {
locke-lunarg9a16ebb2020-07-30 16:56:33 -06003618 skip |= LogError(device, vuid_layout_mismatch,
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003619 "Shader uses descriptor slot %u.%u (expected `%s`) but not declared in pipeline layout",
3620 use.first.first, use.first.second, string_descriptorTypes(descriptor_types).c_str());
Chris Forbes47567b72017-06-09 12:09:45 -07003621 } else if (~binding->stageFlags & pStage->stage) {
locke-lunarg9a16ebb2020-07-30 16:56:33 -06003622 skip |= LogError(device, vuid_layout_mismatch,
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003623 "Shader uses descriptor slot %u.%u but descriptor not accessible from stage %s", use.first.first,
3624 use.first.second, string_VkShaderStageFlagBits(pStage->stage));
Jeff Bolze54ae892018-09-08 12:16:29 -05003625 } else if (descriptor_types.find(binding->descriptorType) == descriptor_types.end()) {
locke-lunarg9a16ebb2020-07-30 16:56:33 -06003626 skip |= LogError(device, vuid_layout_mismatch,
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003627 "Type mismatch on descriptor slot %u.%u (expected `%s`) but descriptor of type %s", use.first.first,
3628 use.first.second, string_descriptorTypes(descriptor_types).c_str(),
3629 string_VkDescriptorType(binding->descriptorType));
Chris Forbes47567b72017-06-09 12:09:45 -07003630 } else if (binding->descriptorCount < required_descriptor_count) {
locke-lunarg9a16ebb2020-07-30 16:56:33 -06003631 skip |= LogError(device, vuid_layout_mismatch,
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003632 "Shader expects at least %u descriptors for binding %u.%u but only %u provided",
3633 required_descriptor_count, use.first.first, use.first.second, binding->descriptorCount);
Chris Forbes47567b72017-06-09 12:09:45 -07003634 }
3635 }
3636
3637 // Validate use of input attachments against subpass structure
3638 if (pStage->stage == VK_SHADER_STAGE_FRAGMENT_BIT) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003639 auto input_attachment_uses = CollectInterfaceByInputAttachmentIndex(module, accessible_ids);
Chris Forbes47567b72017-06-09 12:09:45 -07003640
Petr Krause91f7a12017-12-14 20:57:36 +01003641 auto rpci = pipeline->rp_state->createInfo.ptr();
Chris Forbes47567b72017-06-09 12:09:45 -07003642 auto subpass = pipeline->graphicsPipelineCI.subpass;
3643
3644 for (auto use : input_attachment_uses) {
3645 auto input_attachments = rpci->pSubpasses[subpass].pInputAttachments;
3646 auto index = (input_attachments && use.first < rpci->pSubpasses[subpass].inputAttachmentCount)
Dave Houltona9df0ce2018-02-07 10:51:23 -07003647 ? input_attachments[use.first].attachment
3648 : VK_ATTACHMENT_UNUSED;
Chris Forbes47567b72017-06-09 12:09:45 -07003649
3650 if (index == VK_ATTACHMENT_UNUSED) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003651 skip |= LogError(device, kVUID_Core_Shader_MissingInputAttachment,
3652 "Shader consumes input attachment index %d but not provided in subpass", use.first);
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003653 } else if (!(GetFormatType(rpci->pAttachments[index].format) & GetFundamentalType(module, use.second.type_id))) {
Chris Forbes47567b72017-06-09 12:09:45 -07003654 skip |=
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003655 LogError(device, kVUID_Core_Shader_InputAttachmentTypeMismatch,
3656 "Subpass input attachment %u format of %s does not match type used in shader `%s`", use.first,
3657 string_VkFormat(rpci->pAttachments[index].format), DescribeType(module, use.second.type_id).c_str());
Chris Forbes47567b72017-06-09 12:09:45 -07003658 }
3659 }
3660 }
Lockeaa8fdc02019-04-02 11:59:20 -06003661 if (pStage->stage == VK_SHADER_STAGE_COMPUTE_BIT) {
3662 skip |= ValidateComputeWorkGroupSizes(module);
3663 }
Chris Forbes47567b72017-06-09 12:09:45 -07003664 return skip;
3665}
3666
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07003667bool CoreChecks::ValidateInterfaceBetweenStages(SHADER_MODULE_STATE const *producer, spirv_inst_iter producer_entrypoint,
3668 shader_stage_attributes const *producer_stage, SHADER_MODULE_STATE const *consumer,
3669 spirv_inst_iter consumer_entrypoint,
3670 shader_stage_attributes const *consumer_stage) const {
Chris Forbes47567b72017-06-09 12:09:45 -07003671 bool skip = false;
3672
3673 auto outputs =
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003674 CollectInterfaceByLocation(producer, producer_entrypoint, spv::StorageClassOutput, producer_stage->arrayed_output);
3675 auto inputs = CollectInterfaceByLocation(consumer, consumer_entrypoint, spv::StorageClassInput, consumer_stage->arrayed_input);
Chris Forbes47567b72017-06-09 12:09:45 -07003676
3677 auto a_it = outputs.begin();
3678 auto b_it = inputs.begin();
3679
3680 // Maps sorted by key (location); walk them together to find mismatches
3681 while ((outputs.size() > 0 && a_it != outputs.end()) || (inputs.size() && b_it != inputs.end())) {
3682 bool a_at_end = outputs.size() == 0 || a_it == outputs.end();
3683 bool b_at_end = inputs.size() == 0 || b_it == inputs.end();
3684 auto a_first = a_at_end ? std::make_pair(0u, 0u) : a_it->first;
3685 auto b_first = b_at_end ? std::make_pair(0u, 0u) : b_it->first;
3686
3687 if (b_at_end || ((!a_at_end) && (a_first < b_first))) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003688 skip |= LogPerformanceWarning(producer->vk_shader_module, kVUID_Core_Shader_OutputNotConsumed,
3689 "%s writes to output location %u.%u which is not consumed by %s", producer_stage->name,
3690 a_first.first, a_first.second, consumer_stage->name);
Chris Forbes47567b72017-06-09 12:09:45 -07003691 a_it++;
3692 } else if (a_at_end || a_first > b_first) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003693 skip |= LogError(consumer->vk_shader_module, kVUID_Core_Shader_InputNotProduced,
3694 "%s consumes input location %u.%u which is not written by %s", consumer_stage->name, b_first.first,
3695 b_first.second, producer_stage->name);
Chris Forbes47567b72017-06-09 12:09:45 -07003696 b_it++;
3697 } else {
3698 // subtleties of arrayed interfaces:
3699 // - if is_patch, then the member is not arrayed, even though the interface may be.
3700 // - if is_block_member, then the extra array level of an arrayed interface is not
3701 // expressed in the member type -- it's expressed in the block type.
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003702 if (!TypesMatch(producer, consumer, a_it->second.type_id, b_it->second.type_id,
3703 producer_stage->arrayed_output && !a_it->second.is_patch && !a_it->second.is_block_member,
3704 consumer_stage->arrayed_input && !b_it->second.is_patch && !b_it->second.is_block_member, true)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003705 skip |= LogError(producer->vk_shader_module, kVUID_Core_Shader_InterfaceTypeMismatch,
3706 "Type mismatch on location %u.%u: '%s' vs '%s'", a_first.first, a_first.second,
3707 DescribeType(producer, a_it->second.type_id).c_str(),
3708 DescribeType(consumer, b_it->second.type_id).c_str());
Chris Forbes47567b72017-06-09 12:09:45 -07003709 }
3710 if (a_it->second.is_patch != b_it->second.is_patch) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003711 skip |= LogError(producer->vk_shader_module, kVUID_Core_Shader_InterfaceTypeMismatch,
3712 "Decoration mismatch on location %u.%u: is per-%s in %s stage but per-%s in %s stage",
3713 a_first.first, a_first.second, a_it->second.is_patch ? "patch" : "vertex", producer_stage->name,
3714 b_it->second.is_patch ? "patch" : "vertex", consumer_stage->name);
Chris Forbes47567b72017-06-09 12:09:45 -07003715 }
3716 if (a_it->second.is_relaxed_precision != b_it->second.is_relaxed_precision) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003717 skip |= LogError(producer->vk_shader_module, kVUID_Core_Shader_InterfaceTypeMismatch,
3718 "Decoration mismatch on location %u.%u: %s and %s stages differ in precision", a_first.first,
3719 a_first.second, producer_stage->name, consumer_stage->name);
Chris Forbes47567b72017-06-09 12:09:45 -07003720 }
3721 a_it++;
3722 b_it++;
3723 }
3724 }
3725
Ari Suonpaa696b3432019-03-11 14:02:57 +02003726 if (consumer_stage->stage != VK_SHADER_STAGE_FRAGMENT_BIT) {
3727 auto builtins_producer = CollectBuiltinBlockMembers(producer, producer_entrypoint, spv::StorageClassOutput);
3728 auto builtins_consumer = CollectBuiltinBlockMembers(consumer, consumer_entrypoint, spv::StorageClassInput);
3729
3730 if (!builtins_producer.empty() && !builtins_consumer.empty()) {
3731 if (builtins_producer.size() != builtins_consumer.size()) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003732 skip |= LogError(producer->vk_shader_module, kVUID_Core_Shader_InterfaceTypeMismatch,
3733 "Number of elements inside builtin block differ between stages (%s %d vs %s %d).",
3734 producer_stage->name, (int)builtins_producer.size(), consumer_stage->name,
3735 (int)builtins_consumer.size());
Ari Suonpaa696b3432019-03-11 14:02:57 +02003736 } else {
3737 auto it_producer = builtins_producer.begin();
3738 auto it_consumer = builtins_consumer.begin();
3739 while (it_producer != builtins_producer.end() && it_consumer != builtins_consumer.end()) {
3740 if (*it_producer != *it_consumer) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003741 skip |= LogError(producer->vk_shader_module, kVUID_Core_Shader_InterfaceTypeMismatch,
3742 "Builtin variable inside block doesn't match between %s and %s.", producer_stage->name,
3743 consumer_stage->name);
Ari Suonpaa696b3432019-03-11 14:02:57 +02003744 break;
3745 }
3746 it_producer++;
3747 it_consumer++;
3748 }
3749 }
3750 }
3751 }
3752
Chris Forbes47567b72017-06-09 12:09:45 -07003753 return skip;
3754}
3755
John Zulauf14c355b2019-06-27 16:09:37 -06003756static inline uint32_t DetermineFinalGeomStage(const PIPELINE_STATE *pipeline, const VkGraphicsPipelineCreateInfo *pCreateInfo) {
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003757 uint32_t stage_mask = 0;
3758 if (pipeline->topology_at_rasterizer == VK_PRIMITIVE_TOPOLOGY_POINT_LIST) {
3759 for (uint32_t i = 0; i < pCreateInfo->stageCount; i++) {
3760 stage_mask |= pCreateInfo->pStages[i].stage;
3761 }
3762 // Determine which shader in which PointSize should be written (the final geometry stage)
Jeff Bolz105d6492018-09-29 15:46:44 -05003763 if (stage_mask & VK_SHADER_STAGE_MESH_BIT_NV) {
3764 stage_mask = VK_SHADER_STAGE_MESH_BIT_NV;
3765 } else if (stage_mask & VK_SHADER_STAGE_GEOMETRY_BIT) {
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003766 stage_mask = VK_SHADER_STAGE_GEOMETRY_BIT;
3767 } else if (stage_mask & VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT) {
3768 stage_mask = VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT;
3769 } else if (stage_mask & VK_SHADER_STAGE_VERTEX_BIT) {
3770 stage_mask = VK_SHADER_STAGE_VERTEX_BIT;
Mark Lobodzinski2c984cc2018-07-31 09:57:46 -06003771 }
3772 }
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003773 return stage_mask;
Mark Lobodzinski2c984cc2018-07-31 09:57:46 -06003774}
3775
Chris Forbes47567b72017-06-09 12:09:45 -07003776// Validate that the shaders used by the given pipeline and store the active_slots
3777// that are actually used by the pipeline into pPipeline->active_slots
John Zulaufac4c6e12019-07-01 16:05:58 -06003778bool CoreChecks::ValidateGraphicsPipelineShaderState(const PIPELINE_STATE *pipeline) const {
Chris Forbesa400a8a2017-07-20 13:10:24 -07003779 auto pCreateInfo = pipeline->graphicsPipelineCI.ptr();
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003780 int vertex_stage = GetShaderStageId(VK_SHADER_STAGE_VERTEX_BIT);
3781 int fragment_stage = GetShaderStageId(VK_SHADER_STAGE_FRAGMENT_BIT);
Chris Forbes47567b72017-06-09 12:09:45 -07003782
John Zulauf14c355b2019-06-27 16:09:37 -06003783 const SHADER_MODULE_STATE *shaders[32];
Chris Forbes47567b72017-06-09 12:09:45 -07003784 memset(shaders, 0, sizeof(shaders));
Jeff Bolz7e35c392018-09-04 15:30:41 -05003785 spirv_inst_iter entrypoints[32];
Chris Forbes47567b72017-06-09 12:09:45 -07003786 memset(entrypoints, 0, sizeof(entrypoints));
3787 bool skip = false;
3788
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003789 uint32_t pointlist_stage_mask = DetermineFinalGeomStage(pipeline, pCreateInfo);
3790
Chris Forbes47567b72017-06-09 12:09:45 -07003791 for (uint32_t i = 0; i < pCreateInfo->stageCount; i++) {
3792 auto pStage = &pCreateInfo->pStages[i];
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003793 auto stage_id = GetShaderStageId(pStage->stage);
John Zulauf14c355b2019-06-27 16:09:37 -06003794 shaders[stage_id] = GetShaderModuleState(pStage->module);
3795 entrypoints[stage_id] = FindEntrypoint(shaders[stage_id], pStage->pName, pStage->stage);
3796 skip |= ValidatePipelineShaderStage(pStage, pipeline, pipeline->stage_state[i], shaders[stage_id], entrypoints[stage_id],
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003797 (pointlist_stage_mask == pStage->stage));
Chris Forbes47567b72017-06-09 12:09:45 -07003798 }
3799
3800 // if the shader stages are no good individually, cross-stage validation is pointless.
3801 if (skip) return true;
3802
3803 auto vi = pCreateInfo->pVertexInputState;
3804
3805 if (vi) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07003806 skip |= ValidateViConsistency(vi);
Chris Forbes47567b72017-06-09 12:09:45 -07003807 }
3808
3809 if (shaders[vertex_stage] && shaders[vertex_stage]->has_valid_spirv) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07003810 skip |= ValidateViAgainstVsInputs(vi, shaders[vertex_stage], entrypoints[vertex_stage]);
Chris Forbes47567b72017-06-09 12:09:45 -07003811 }
3812
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003813 int producer = GetShaderStageId(VK_SHADER_STAGE_VERTEX_BIT);
3814 int consumer = GetShaderStageId(VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT);
Chris Forbes47567b72017-06-09 12:09:45 -07003815
3816 while (!shaders[producer] && producer != fragment_stage) {
3817 producer++;
3818 consumer++;
3819 }
3820
3821 for (; producer != fragment_stage && consumer <= fragment_stage; consumer++) {
3822 assert(shaders[producer]);
Chris Forbesdbb43fc2018-02-16 16:59:23 -08003823 if (shaders[consumer]) {
3824 if (shaders[consumer]->has_valid_spirv && shaders[producer]->has_valid_spirv) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07003825 skip |= ValidateInterfaceBetweenStages(shaders[producer], entrypoints[producer], &shader_stage_attribs[producer],
3826 shaders[consumer], entrypoints[consumer], &shader_stage_attribs[consumer]);
Chris Forbesdbb43fc2018-02-16 16:59:23 -08003827 }
Chris Forbes47567b72017-06-09 12:09:45 -07003828
3829 producer = consumer;
3830 }
3831 }
3832
3833 if (shaders[fragment_stage] && shaders[fragment_stage]->has_valid_spirv) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07003834 skip |= ValidateFsOutputsAgainstRenderPass(shaders[fragment_stage], entrypoints[fragment_stage], pipeline,
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003835 pCreateInfo->subpass);
Chris Forbes47567b72017-06-09 12:09:45 -07003836 }
3837
3838 return skip;
3839}
3840
sfricke-samsunge72a85e2020-02-29 21:48:37 -08003841bool CoreChecks::ValidateComputePipelineShaderState(PIPELINE_STATE *pipeline) const {
John Zulauf14c355b2019-06-27 16:09:37 -06003842 const auto &stage = *pipeline->computePipelineCI.stage.ptr();
Chris Forbes47567b72017-06-09 12:09:45 -07003843
John Zulauf14c355b2019-06-27 16:09:37 -06003844 const SHADER_MODULE_STATE *module = GetShaderModuleState(stage.module);
3845 const spirv_inst_iter entrypoint = FindEntrypoint(module, stage.pName, stage.stage);
Chris Forbes47567b72017-06-09 12:09:45 -07003846
John Zulauf14c355b2019-06-27 16:09:37 -06003847 return ValidatePipelineShaderStage(&stage, pipeline, pipeline->stage_state[0], module, entrypoint, false);
Chris Forbes47567b72017-06-09 12:09:45 -07003848}
Chris Forbes4ae55b32017-06-09 14:42:56 -07003849
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003850bool CoreChecks::ValidateRayTracingPipeline(PIPELINE_STATE *pipeline, bool isKHR) const {
John Zulaufe4474e72019-07-01 17:28:27 -06003851 bool skip = false;
Jason Macnak15f95e82019-08-21 21:52:02 -04003852
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003853 if (isKHR) {
3854 if (pipeline->raytracingPipelineCI.maxRecursionDepth > phys_dev_ext_props.ray_tracing_propsKHR.maxRecursionDepth) {
3855 skip |= LogError(device, "VUID-VkRayTracingPipelineCreateInfoKHR-maxRecursionDepth-03464", ": %d > %d",
3856 pipeline->raytracingPipelineCI.maxRecursionDepth,
3857 phys_dev_ext_props.ray_tracing_propsKHR.maxRecursionDepth);
3858 }
sourav parmar83c31b12020-05-06 12:30:54 -07003859 for (uint32_t i = 0; i < pipeline->raytracingPipelineCI.libraries.libraryCount; ++i) {
3860 const PIPELINE_STATE *pLibrary_pipelinestate = GetPipelineState(pipeline->raytracingPipelineCI.libraries.pLibraries[i]);
3861 if (pLibrary_pipelinestate->raytracingPipelineCI.maxRecursionDepth !=
3862 pipeline->raytracingPipelineCI.maxRecursionDepth) {
3863 skip |= LogError(
3864 device, "VUID-VkRayTracingPipelineCreateInfoKHR-pLibraries-03467",
3865 "vkCreateRayTracingPipelinesKHR: Each element (%d) of the pLibraries member of libraries must have been"
3866 "created with the value of maxRecursionDepth (%d) equal to that in this pipeline (%d) .",
3867 i, pLibrary_pipelinestate->raytracingPipelineCI.maxRecursionDepth,
3868 pipeline->raytracingPipelineCI.maxRecursionDepth);
3869 }
3870 if (pLibrary_pipelinestate->raytracingPipelineCI.pLibraryInterface->maxAttributeSize !=
3871 pipeline->raytracingPipelineCI.pLibraryInterface->maxAttributeSize ||
3872 pLibrary_pipelinestate->raytracingPipelineCI.pLibraryInterface->maxPayloadSize !=
3873 pipeline->raytracingPipelineCI.pLibraryInterface->maxPayloadSize ||
3874 pLibrary_pipelinestate->raytracingPipelineCI.pLibraryInterface->maxCallableSize !=
3875 pipeline->raytracingPipelineCI.pLibraryInterface->maxCallableSize) {
3876 skip |=
3877 LogError(device, "VUID-VkRayTracingPipelineCreateInfoKHR-pLibraries-03469",
3878 "vkCreateRayTracingPipelinesKHR: Each element of the pLibraries member of libraries must have been "
3879 "created with values of the maxPayloadSize,"
3880 "maxAttributeSize, and maxCallableSize members of pLibraryInterface equal to those in this pipeline.");
3881 }
3882 }
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003883 } else {
3884 if (pipeline->raytracingPipelineCI.maxRecursionDepth > phys_dev_ext_props.ray_tracing_propsNV.maxRecursionDepth) {
3885 skip |= LogError(device, "VUID-VkRayTracingPipelineCreateInfoNV-maxRecursionDepth-03457", ": %d > %d",
3886 pipeline->raytracingPipelineCI.maxRecursionDepth,
3887 phys_dev_ext_props.ray_tracing_propsNV.maxRecursionDepth);
3888 }
Jason Macnak15f95e82019-08-21 21:52:02 -04003889 }
Jason Macnak15f95e82019-08-21 21:52:02 -04003890 const auto *stages = pipeline->raytracingPipelineCI.ptr()->pStages;
3891 const auto *groups = pipeline->raytracingPipelineCI.ptr()->pGroups;
3892
3893 uint32_t raygen_stages_found = 0;
John Zulaufe4474e72019-07-01 17:28:27 -06003894 for (uint32_t stage_index = 0; stage_index < pipeline->raytracingPipelineCI.stageCount; stage_index++) {
Jason Macnak15f95e82019-08-21 21:52:02 -04003895 const auto &stage = stages[stage_index];
Jeff Bolzfbe51582018-09-13 10:01:35 -05003896
John Zulaufe4474e72019-07-01 17:28:27 -06003897 const SHADER_MODULE_STATE *module = GetShaderModuleState(stage.module);
3898 const spirv_inst_iter entrypoint = FindEntrypoint(module, stage.pName, stage.stage);
Jeff Bolzfbe51582018-09-13 10:01:35 -05003899
John Zulaufe4474e72019-07-01 17:28:27 -06003900 skip |= ValidatePipelineShaderStage(&stage, pipeline, pipeline->stage_state[stage_index], module, entrypoint, false);
Jason Macnak15f95e82019-08-21 21:52:02 -04003901
3902 if (stage.stage == VK_SHADER_STAGE_RAYGEN_BIT_NV) {
3903 raygen_stages_found++;
3904 }
3905 }
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003906 if (raygen_stages_found == 0) {
3907 skip |= LogError(
3908 device,
3909 isKHR ? "VUID-VkRayTracingPipelineCreateInfoKHR-stage-03425" : "VUID-VkRayTracingPipelineCreateInfoNV-stage-03425",
3910 " : zero raygen stages specified");
Jason Macnak15f95e82019-08-21 21:52:02 -04003911 }
3912
3913 for (uint32_t group_index = 0; group_index < pipeline->raytracingPipelineCI.groupCount; group_index++) {
3914 const auto &group = groups[group_index];
3915
3916 if (group.type == VK_RAY_TRACING_SHADER_GROUP_TYPE_GENERAL_NV) {
3917 if (group.generalShader >= pipeline->raytracingPipelineCI.stageCount ||
3918 (stages[group.generalShader].stage != VK_SHADER_STAGE_RAYGEN_BIT_NV &&
3919 stages[group.generalShader].stage != VK_SHADER_STAGE_MISS_BIT_NV &&
3920 stages[group.generalShader].stage != VK_SHADER_STAGE_CALLABLE_BIT_NV)) {
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003921 skip |= LogError(device,
3922 isKHR ? "VUID-VkRayTracingShaderGroupCreateInfoKHR-type-03474"
3923 : "VUID-VkRayTracingShaderGroupCreateInfoNV-type-02413",
3924 ": pGroups[%d]", group_index);
Jason Macnak15f95e82019-08-21 21:52:02 -04003925 }
3926 if (group.anyHitShader != VK_SHADER_UNUSED_NV || group.closestHitShader != VK_SHADER_UNUSED_NV ||
3927 group.intersectionShader != VK_SHADER_UNUSED_NV) {
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003928 skip |= LogError(device,
3929 isKHR ? "VUID-VkRayTracingShaderGroupCreateInfoKHR-type-03475"
3930 : "VUID-VkRayTracingShaderGroupCreateInfoNV-type-02414",
3931 ": pGroups[%d]", group_index);
Jason Macnak15f95e82019-08-21 21:52:02 -04003932 }
3933 } else if (group.type == VK_RAY_TRACING_SHADER_GROUP_TYPE_PROCEDURAL_HIT_GROUP_NV) {
3934 if (group.intersectionShader >= pipeline->raytracingPipelineCI.stageCount ||
3935 stages[group.intersectionShader].stage != VK_SHADER_STAGE_INTERSECTION_BIT_NV) {
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003936 skip |= LogError(device,
3937 isKHR ? "VUID-VkRayTracingShaderGroupCreateInfoKHR-type-03476"
3938 : "VUID-VkRayTracingShaderGroupCreateInfoNV-type-02415",
3939 ": pGroups[%d]", group_index);
Jason Macnak15f95e82019-08-21 21:52:02 -04003940 }
3941 } else if (group.type == VK_RAY_TRACING_SHADER_GROUP_TYPE_TRIANGLES_HIT_GROUP_NV) {
3942 if (group.intersectionShader != VK_SHADER_UNUSED_NV) {
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003943 skip |= LogError(device,
3944 isKHR ? "VUID-VkRayTracingShaderGroupCreateInfoKHR-type-03477"
3945 : "VUID-VkRayTracingShaderGroupCreateInfoNV-type-02416",
3946 ": pGroups[%d]", group_index);
Jason Macnak15f95e82019-08-21 21:52:02 -04003947 }
3948 }
3949
3950 if (group.type == VK_RAY_TRACING_SHADER_GROUP_TYPE_PROCEDURAL_HIT_GROUP_NV ||
3951 group.type == VK_RAY_TRACING_SHADER_GROUP_TYPE_TRIANGLES_HIT_GROUP_NV) {
3952 if (group.anyHitShader != VK_SHADER_UNUSED_NV && (group.anyHitShader >= pipeline->raytracingPipelineCI.stageCount ||
3953 stages[group.anyHitShader].stage != VK_SHADER_STAGE_ANY_HIT_BIT_NV)) {
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003954 skip |= LogError(device,
3955 isKHR ? "VUID-VkRayTracingShaderGroupCreateInfoKHR-anyHitShader-03479"
3956 : "VUID-VkRayTracingShaderGroupCreateInfoNV-anyHitShader-02418",
3957 ": pGroups[%d]", group_index);
Jason Macnak15f95e82019-08-21 21:52:02 -04003958 }
3959 if (group.closestHitShader != VK_SHADER_UNUSED_NV &&
3960 (group.closestHitShader >= pipeline->raytracingPipelineCI.stageCount ||
3961 stages[group.closestHitShader].stage != VK_SHADER_STAGE_CLOSEST_HIT_BIT_NV)) {
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003962 skip |= LogError(device,
3963 isKHR ? "VUID-VkRayTracingShaderGroupCreateInfoKHR-closestHitShader-03478"
3964 : "VUID-VkRayTracingShaderGroupCreateInfoNV-closestHitShader-02417",
3965 ": pGroups[%d]", group_index);
Jason Macnak15f95e82019-08-21 21:52:02 -04003966 }
3967 }
John Zulaufe4474e72019-07-01 17:28:27 -06003968 }
3969 return skip;
Jeff Bolzfbe51582018-09-13 10:01:35 -05003970}
3971
Dave Houltona9df0ce2018-02-07 10:51:23 -07003972uint32_t ValidationCache::MakeShaderHash(VkShaderModuleCreateInfo const *smci) { return XXH32(smci->pCode, smci->codeSize, 0); }
Chris Forbes9a61e082017-07-24 15:35:29 -07003973
Dave Houltona9df0ce2018-02-07 10:51:23 -07003974static ValidationCache *GetValidationCacheInfo(VkShaderModuleCreateInfo const *pCreateInfo) {
John Zulauf25ea2432019-04-05 10:07:38 -06003975 const auto validation_cache_ci = lvl_find_in_chain<VkShaderModuleValidationCacheCreateInfoEXT>(pCreateInfo->pNext);
3976 if (validation_cache_ci) {
John Zulauf146ee802019-04-05 15:31:06 -06003977 return CastFromHandle<ValidationCache *>(validation_cache_ci->validationCache);
Chris Forbes9a61e082017-07-24 15:35:29 -07003978 }
Chris Forbes9a61e082017-07-24 15:35:29 -07003979 return nullptr;
3980}
3981
Mark Lobodzinskib56bbb92019-02-18 11:49:59 -07003982bool CoreChecks::PreCallValidateCreateShaderModule(VkDevice device, const VkShaderModuleCreateInfo *pCreateInfo,
Jeff Bolz5c801d12019-10-09 10:38:45 -05003983 const VkAllocationCallbacks *pAllocator, VkShaderModule *pShaderModule) const {
Chris Forbes4ae55b32017-06-09 14:42:56 -07003984 bool skip = false;
3985 spv_result_t spv_valid = SPV_SUCCESS;
Chris Forbes4ae55b32017-06-09 14:42:56 -07003986
Mark Lobodzinski90eea5b2020-05-15 12:54:00 -06003987 if (disabled[shader_validation]) {
Chris Forbes4ae55b32017-06-09 14:42:56 -07003988 return false;
3989 }
3990
Mark Lobodzinskif45e45f2019-04-19 14:15:39 -06003991 auto have_glsl_shader = device_extensions.vk_nv_glsl_shader;
Chris Forbes4ae55b32017-06-09 14:42:56 -07003992
3993 if (!have_glsl_shader && (pCreateInfo->codeSize % 4)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003994 skip |= LogError(device, "VUID-VkShaderModuleCreateInfo-pCode-01376",
3995 "SPIR-V module not valid: Codesize must be a multiple of 4 but is " PRINTF_SIZE_T_SPECIFIER ".",
3996 pCreateInfo->codeSize);
Chris Forbes4ae55b32017-06-09 14:42:56 -07003997 } else {
Chris Forbes9a61e082017-07-24 15:35:29 -07003998 auto cache = GetValidationCacheInfo(pCreateInfo);
3999 uint32_t hash = 0;
4000 if (cache) {
4001 hash = ValidationCache::MakeShaderHash(pCreateInfo);
Dave Houltona9df0ce2018-02-07 10:51:23 -07004002 if (cache->Contains(hash)) return false;
Chris Forbes9a61e082017-07-24 15:35:29 -07004003 }
4004
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06004005 // Use SPIRV-Tools validator to try and catch any issues with the module itself. If specialization constants are present,
4006 // the default values will be used during validation.
Tony-LunarG8a51b7d2020-07-01 15:57:23 -06004007 spv_target_env spirv_environment = PickSpirvEnv(api_version, (device_extensions.vk_khr_spirv_1_4 != kNotEnabled));
Dave Houlton0ea2d012018-06-21 14:00:26 -06004008 spv_context ctx = spvContextCreate(spirv_environment);
Dave Houltona9df0ce2018-02-07 10:51:23 -07004009 spv_const_binary_t binary{pCreateInfo->pCode, pCreateInfo->codeSize / sizeof(uint32_t)};
Chris Forbes4ae55b32017-06-09 14:42:56 -07004010 spv_diagnostic diag = nullptr;
Tony-LunarG9fe69a42020-07-23 15:09:37 -06004011 spvtools::ValidatorOptions options;
4012 AdjustValidatorOptions(device_extensions, enabled_features, options);
Karl Schultzfda1b382018-08-08 18:56:11 -06004013 spv_valid = spvValidateWithOptions(ctx, options, &binary, &diag);
Chris Forbes4ae55b32017-06-09 14:42:56 -07004014 if (spv_valid != SPV_SUCCESS) {
4015 if (!have_glsl_shader || (pCreateInfo->pCode[0] == spv::MagicNumber)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07004016 if (spv_valid == SPV_WARNING) {
4017 skip |= LogWarning(device, kVUID_Core_Shader_InconsistentSpirv, "SPIR-V module not valid: %s",
4018 diag && diag->error ? diag->error : "(no error text)");
4019 } else {
4020 skip |= LogError(device, kVUID_Core_Shader_InconsistentSpirv, "SPIR-V module not valid: %s",
4021 diag && diag->error ? diag->error : "(no error text)");
4022 }
Chris Forbes4ae55b32017-06-09 14:42:56 -07004023 }
Chris Forbes9a61e082017-07-24 15:35:29 -07004024 } else {
4025 if (cache) {
4026 cache->Insert(hash);
4027 }
Chris Forbes4ae55b32017-06-09 14:42:56 -07004028 }
4029
4030 spvDiagnosticDestroy(diag);
4031 spvContextDestroy(ctx);
4032 }
4033
Chris Forbes4ae55b32017-06-09 14:42:56 -07004034 return skip;
Mark Lobodzinski01734072019-02-13 17:39:15 -07004035}
4036
John Zulaufac4c6e12019-07-01 16:05:58 -06004037bool CoreChecks::ValidateComputeWorkGroupSizes(const SHADER_MODULE_STATE *shader) const {
Lockeaa8fdc02019-04-02 11:59:20 -06004038 bool skip = false;
4039 uint32_t local_size_x = 0;
4040 uint32_t local_size_y = 0;
4041 uint32_t local_size_z = 0;
4042 if (FindLocalSize(shader, local_size_x, local_size_y, local_size_z)) {
4043 if (local_size_x > phys_dev_props.limits.maxComputeWorkGroupSize[0]) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07004044 skip |= LogError(shader->vk_shader_module, "UNASSIGNED-features-limits-maxComputeWorkGroupSize",
4045 "%s local_size_x (%" PRIu32 ") exceeds device limit maxComputeWorkGroupSize[0] (%" PRIu32 ").",
4046 report_data->FormatHandle(shader->vk_shader_module).c_str(), local_size_x,
4047 phys_dev_props.limits.maxComputeWorkGroupSize[0]);
Lockeaa8fdc02019-04-02 11:59:20 -06004048 }
4049 if (local_size_y > phys_dev_props.limits.maxComputeWorkGroupSize[1]) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07004050 skip |= LogError(shader->vk_shader_module, "UNASSIGNED-features-limits-maxComputeWorkGroupSize",
4051 "%s local_size_y (%" PRIu32 ") exceeds device limit maxComputeWorkGroupSize[1] (%" PRIu32 ").",
4052 report_data->FormatHandle(shader->vk_shader_module).c_str(), local_size_x,
4053 phys_dev_props.limits.maxComputeWorkGroupSize[1]);
Lockeaa8fdc02019-04-02 11:59:20 -06004054 }
4055 if (local_size_z > phys_dev_props.limits.maxComputeWorkGroupSize[2]) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07004056 skip |= LogError(shader->vk_shader_module, "UNASSIGNED-features-limits-maxComputeWorkGroupSize",
4057 "%s local_size_z (%" PRIu32 ") exceeds device limit maxComputeWorkGroupSize[2] (%" PRIu32 ").",
4058 report_data->FormatHandle(shader->vk_shader_module).c_str(), local_size_x,
4059 phys_dev_props.limits.maxComputeWorkGroupSize[2]);
Lockeaa8fdc02019-04-02 11:59:20 -06004060 }
4061
4062 uint32_t limit = phys_dev_props.limits.maxComputeWorkGroupInvocations;
4063 uint64_t invocations = local_size_x * local_size_y;
4064 // Prevent overflow.
4065 bool fail = false;
4066 if (invocations > UINT32_MAX || invocations > limit) {
4067 fail = true;
4068 }
4069 if (!fail) {
4070 invocations *= local_size_z;
4071 if (invocations > UINT32_MAX || invocations > limit) {
4072 fail = true;
4073 }
4074 }
4075 if (fail) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07004076 skip |= LogError(shader->vk_shader_module, "UNASSIGNED-features-limits-maxComputeWorkGroupInvocations",
4077 "%s local_size (%" PRIu32 ", %" PRIu32 ", %" PRIu32
4078 ") exceeds device limit maxComputeWorkGroupInvocations (%" PRIu32 ").",
4079 report_data->FormatHandle(shader->vk_shader_module).c_str(), local_size_x, local_size_y, local_size_z,
4080 limit);
Lockeaa8fdc02019-04-02 11:59:20 -06004081 }
4082 }
4083 return skip;
4084}
Tony-LunarG8a51b7d2020-07-01 15:57:23 -06004085
4086spv_target_env PickSpirvEnv(uint32_t api_version, bool spirv_1_4) {
4087 if (api_version >= VK_API_VERSION_1_2) {
4088 return SPV_ENV_VULKAN_1_2;
4089 } else if (api_version >= VK_API_VERSION_1_1) {
4090 if (spirv_1_4) {
4091 return SPV_ENV_VULKAN_1_1_SPIRV_1_4;
4092 } else {
4093 return SPV_ENV_VULKAN_1_1;
4094 }
4095 }
4096 return SPV_ENV_VULKAN_1_0;
4097}
Tony-LunarG9fe69a42020-07-23 15:09:37 -06004098
4099void AdjustValidatorOptions(const DeviceExtensions device_extensions, const DeviceFeatures enabled_features,
4100 spvtools::ValidatorOptions &options) {
4101 if (device_extensions.vk_khr_relaxed_block_layout) {
4102 options.SetRelaxBlockLayout(true);
4103 }
4104 if (device_extensions.vk_khr_uniform_buffer_standard_layout && enabled_features.core12.uniformBufferStandardLayout == VK_TRUE) {
4105 options.SetUniformBufferStandardLayout(true);
4106 }
4107 if (device_extensions.vk_ext_scalar_block_layout && enabled_features.core12.scalarBlockLayout == VK_TRUE) {
4108 options.SetScalarBlockLayout(true);
4109 }
4110}