/* Copyright (c) 2015-2020 The Khronos Group Inc.
 * Copyright (c) 2015-2020 Valve Corporation
 * Copyright (c) 2015-2020 LunarG, Inc.
 * Copyright (C) 2015-2020 Google Inc.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 * Author: Chris Forbes <chrisf@ijw.co.nz>
 * Author: Dave Houlton <daveh@lunarg.com>
 */
21
Petr Kraus25810d02019-08-27 17:41:15 +020022#include "shader_validation.h"
23
Chris Forbes47567b72017-06-09 12:09:45 -070024#include <cassert>
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +020025#include <chrono>
Petr Kraus25810d02019-08-27 17:41:15 +020026#include <cinttypes>
Jeff Bolzf234bf82019-11-04 14:07:15 -060027#include <cmath>
Petr Kraus25810d02019-08-27 17:41:15 +020028#include <map>
Chris Forbes47567b72017-06-09 12:09:45 -070029#include <sstream>
Petr Kraus25810d02019-08-27 17:41:15 +020030#include <string>
31#include <unordered_map>
32#include <vector>
33
Mark Lobodzinski102687e2020-04-28 11:03:28 -060034#include <spirv/unified1/spirv.hpp>
Chris Forbes47567b72017-06-09 12:09:45 -070035#include "vk_loader_platform.h"
36#include "vk_enum_string_helper.h"
Chris Forbes47567b72017-06-09 12:09:45 -070037#include "vk_layer_data.h"
38#include "vk_layer_extension_utils.h"
39#include "vk_layer_utils.h"
Mark Lobodzinskib56bbb92019-02-18 11:49:59 -070040#include "chassis.h"
Chris Forbes47567b72017-06-09 12:09:45 -070041#include "core_validation.h"
Petr Kraus25810d02019-08-27 17:41:15 +020042
Chris Forbes4ae55b32017-06-09 14:42:56 -070043#include "spirv-tools/libspirv.h"
Chris Forbes9a61e082017-07-24 15:35:29 -070044#include "xxhash.h"
Chris Forbes47567b72017-06-09 12:09:45 -070045
Chris Forbes8a6d8cb2019-02-14 14:33:08 -080046void decoration_set::add(uint32_t decoration, uint32_t value) {
47 switch (decoration) {
48 case spv::DecorationLocation:
49 flags |= location_bit;
50 location = value;
51 break;
52 case spv::DecorationPatch:
53 flags |= patch_bit;
54 break;
55 case spv::DecorationRelaxedPrecision:
56 flags |= relaxed_precision_bit;
57 break;
58 case spv::DecorationBlock:
59 flags |= block_bit;
60 break;
61 case spv::DecorationBufferBlock:
62 flags |= buffer_block_bit;
63 break;
64 case spv::DecorationComponent:
65 flags |= component_bit;
66 component = value;
67 break;
68 case spv::DecorationInputAttachmentIndex:
69 flags |= input_attachment_index_bit;
70 input_attachment_index = value;
71 break;
72 case spv::DecorationDescriptorSet:
73 flags |= descriptor_set_bit;
74 descriptor_set = value;
75 break;
76 case spv::DecorationBinding:
77 flags |= binding_bit;
78 binding = value;
79 break;
80 case spv::DecorationNonWritable:
81 flags |= nonwritable_bit;
82 break;
83 case spv::DecorationBuiltIn:
84 flags |= builtin_bit;
85 builtin = value;
86 break;
87 }
88}
89
// Numeric interpretation of a format or shader type. The values are distinct bits so that they can be OR-ed together
// (GetFormatType() does so for combined depth/stencil formats).
enum FORMAT_TYPE {
    // UNORM, SNORM, FLOAT, USCALED, SSCALED, SRGB -- anything we consider float in the shader
    FORMAT_TYPE_FLOAT = 1 << 0,
    FORMAT_TYPE_SINT = 1 << 1,
    FORMAT_TYPE_UINT = 1 << 2,
};
95
// Key used by the interface maps in this file: (location, component).
using location_t = std::pair<unsigned, unsigned>;
97
Chris Forbes47567b72017-06-09 12:09:45 -070098static shader_stage_attributes shader_stage_attribs[] = {
Ari Suonpaa696b3432019-03-11 14:02:57 +020099 {"vertex shader", false, false, VK_SHADER_STAGE_VERTEX_BIT},
100 {"tessellation control shader", true, true, VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT},
101 {"tessellation evaluation shader", true, false, VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT},
102 {"geometry shader", true, false, VK_SHADER_STAGE_GEOMETRY_BIT},
103 {"fragment shader", false, false, VK_SHADER_STAGE_FRAGMENT_BIT},
Chris Forbes47567b72017-06-09 12:09:45 -0700104};
105
// Forward declaration: SHADER_MODULE_STATE::BuildDefIndex() calls this before the definition appears in this file.
unsigned ExecutionModelToShaderStageFlagBits(unsigned mode);
107
// SPIRV utility functions
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600109void SHADER_MODULE_STATE::BuildDefIndex() {
Chris Forbes47567b72017-06-09 12:09:45 -0700110 for (auto insn : *this) {
111 switch (insn.opcode()) {
112 // Types
113 case spv::OpTypeVoid:
114 case spv::OpTypeBool:
115 case spv::OpTypeInt:
116 case spv::OpTypeFloat:
117 case spv::OpTypeVector:
118 case spv::OpTypeMatrix:
119 case spv::OpTypeImage:
120 case spv::OpTypeSampler:
121 case spv::OpTypeSampledImage:
122 case spv::OpTypeArray:
123 case spv::OpTypeRuntimeArray:
124 case spv::OpTypeStruct:
125 case spv::OpTypeOpaque:
126 case spv::OpTypePointer:
127 case spv::OpTypeFunction:
128 case spv::OpTypeEvent:
129 case spv::OpTypeDeviceEvent:
130 case spv::OpTypeReserveId:
131 case spv::OpTypeQueue:
132 case spv::OpTypePipe:
Shannon McPherson0fa28232018-11-01 11:59:02 -0600133 case spv::OpTypeAccelerationStructureNV:
Jeff Bolze4356752019-03-07 11:23:46 -0600134 case spv::OpTypeCooperativeMatrixNV:
Chris Forbes47567b72017-06-09 12:09:45 -0700135 def_index[insn.word(1)] = insn.offset();
136 break;
137
138 // Fixed constants
139 case spv::OpConstantTrue:
140 case spv::OpConstantFalse:
141 case spv::OpConstant:
142 case spv::OpConstantComposite:
143 case spv::OpConstantSampler:
144 case spv::OpConstantNull:
145 def_index[insn.word(2)] = insn.offset();
146 break;
147
148 // Specialization constants
149 case spv::OpSpecConstantTrue:
150 case spv::OpSpecConstantFalse:
151 case spv::OpSpecConstant:
152 case spv::OpSpecConstantComposite:
153 case spv::OpSpecConstantOp:
154 def_index[insn.word(2)] = insn.offset();
155 break;
156
157 // Variables
158 case spv::OpVariable:
159 def_index[insn.word(2)] = insn.offset();
160 break;
161
162 // Functions
163 case spv::OpFunction:
164 def_index[insn.word(2)] = insn.offset();
165 break;
166
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800167 // Decorations
168 case spv::OpDecorate: {
169 auto targetId = insn.word(1);
170 decorations[targetId].add(insn.word(2), insn.len() > 3u ? insn.word(3) : 0u);
171 } break;
172 case spv::OpGroupDecorate: {
173 auto const &src = decorations[insn.word(1)];
174 for (auto i = 2u; i < insn.len(); i++) decorations[insn.word(i)].merge(src);
175 } break;
176
John Zulauf14c355b2019-06-27 16:09:37 -0600177 // Entry points ... add to the entrypoint table
178 case spv::OpEntryPoint: {
179 // Entry points do not have an id (the id is the function id) and thus need their own table
180 auto entrypoint_name = (char const *)&insn.word(3);
181 auto execution_model = insn.word(1);
182 auto entrypoint_stage = ExecutionModelToShaderStageFlagBits(execution_model);
183 entry_points.emplace(entrypoint_name, EntryPoint{insn.offset(), entrypoint_stage});
184 break;
185 }
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800186
Chris Forbes47567b72017-06-09 12:09:45 -0700187 default:
188 // We don't care about any other defs for now.
189 break;
190 }
191 }
192}
193
Jeff Bolz105d6492018-09-29 15:46:44 -0500194unsigned ExecutionModelToShaderStageFlagBits(unsigned mode) {
195 switch (mode) {
196 case spv::ExecutionModelVertex:
197 return VK_SHADER_STAGE_VERTEX_BIT;
198 case spv::ExecutionModelTessellationControl:
199 return VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT;
200 case spv::ExecutionModelTessellationEvaluation:
201 return VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT;
202 case spv::ExecutionModelGeometry:
203 return VK_SHADER_STAGE_GEOMETRY_BIT;
204 case spv::ExecutionModelFragment:
205 return VK_SHADER_STAGE_FRAGMENT_BIT;
206 case spv::ExecutionModelGLCompute:
207 return VK_SHADER_STAGE_COMPUTE_BIT;
Shannon McPherson0fa28232018-11-01 11:59:02 -0600208 case spv::ExecutionModelRayGenerationNV:
Eric Werness30127fd2018-10-31 21:01:03 -0700209 return VK_SHADER_STAGE_RAYGEN_BIT_NV;
Shannon McPherson0fa28232018-11-01 11:59:02 -0600210 case spv::ExecutionModelAnyHitNV:
Eric Werness30127fd2018-10-31 21:01:03 -0700211 return VK_SHADER_STAGE_ANY_HIT_BIT_NV;
Shannon McPherson0fa28232018-11-01 11:59:02 -0600212 case spv::ExecutionModelClosestHitNV:
Eric Werness30127fd2018-10-31 21:01:03 -0700213 return VK_SHADER_STAGE_CLOSEST_HIT_BIT_NV;
Shannon McPherson0fa28232018-11-01 11:59:02 -0600214 case spv::ExecutionModelMissNV:
Eric Werness30127fd2018-10-31 21:01:03 -0700215 return VK_SHADER_STAGE_MISS_BIT_NV;
Shannon McPherson0fa28232018-11-01 11:59:02 -0600216 case spv::ExecutionModelIntersectionNV:
Eric Werness30127fd2018-10-31 21:01:03 -0700217 return VK_SHADER_STAGE_INTERSECTION_BIT_NV;
Shannon McPherson0fa28232018-11-01 11:59:02 -0600218 case spv::ExecutionModelCallableNV:
Eric Werness30127fd2018-10-31 21:01:03 -0700219 return VK_SHADER_STAGE_CALLABLE_BIT_NV;
Jeff Bolz105d6492018-09-29 15:46:44 -0500220 case spv::ExecutionModelTaskNV:
221 return VK_SHADER_STAGE_TASK_BIT_NV;
222 case spv::ExecutionModelMeshNV:
223 return VK_SHADER_STAGE_MESH_BIT_NV;
224 default:
225 return 0;
226 }
227}
228
locke-lunargd9a069d2019-09-17 01:50:19 -0600229spirv_inst_iter FindEntrypoint(SHADER_MODULE_STATE const *src, char const *name, VkShaderStageFlagBits stageBits) {
John Zulauf14c355b2019-06-27 16:09:37 -0600230 auto range = src->entry_points.equal_range(name);
231 for (auto it = range.first; it != range.second; ++it) {
232 if (it->second.stage == stageBits) {
233 return src->at(it->second.offset);
Chris Forbes47567b72017-06-09 12:09:45 -0700234 }
235 }
Chris Forbes47567b72017-06-09 12:09:45 -0700236 return src->end();
237}
238
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600239static char const *StorageClassName(unsigned sc) {
Chris Forbes47567b72017-06-09 12:09:45 -0700240 switch (sc) {
241 case spv::StorageClassInput:
242 return "input";
243 case spv::StorageClassOutput:
244 return "output";
245 case spv::StorageClassUniformConstant:
246 return "const uniform";
247 case spv::StorageClassUniform:
248 return "uniform";
249 case spv::StorageClassWorkgroup:
250 return "workgroup local";
251 case spv::StorageClassCrossWorkgroup:
252 return "workgroup global";
253 case spv::StorageClassPrivate:
254 return "private global";
255 case spv::StorageClassFunction:
256 return "function";
257 case spv::StorageClassGeneric:
258 return "generic";
259 case spv::StorageClassAtomicCounter:
260 return "atomic counter";
261 case spv::StorageClassImage:
262 return "image";
263 case spv::StorageClassPushConstant:
264 return "push constant";
Chris Forbes9f89d752018-03-07 12:57:48 -0800265 case spv::StorageClassStorageBuffer:
266 return "storage buffer";
Chris Forbes47567b72017-06-09 12:09:45 -0700267 default:
268 return "unknown";
269 }
270}
271
272// Get the value of an integral constant
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600273unsigned GetConstantValue(SHADER_MODULE_STATE const *src, unsigned id) {
Chris Forbes47567b72017-06-09 12:09:45 -0700274 auto value = src->get_def(id);
275 assert(value != src->end());
276
277 if (value.opcode() != spv::OpConstant) {
278 // TODO: Either ensure that the specialization transform is already performed on a module we're
279 // considering here, OR -- specialize on the fly now.
280 return 1;
281 }
282
283 return value.word(3);
284}
285
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600286static void DescribeTypeInner(std::ostringstream &ss, SHADER_MODULE_STATE const *src, unsigned type) {
Chris Forbes47567b72017-06-09 12:09:45 -0700287 auto insn = src->get_def(type);
288 assert(insn != src->end());
289
290 switch (insn.opcode()) {
291 case spv::OpTypeBool:
292 ss << "bool";
293 break;
294 case spv::OpTypeInt:
295 ss << (insn.word(3) ? 's' : 'u') << "int" << insn.word(2);
296 break;
297 case spv::OpTypeFloat:
298 ss << "float" << insn.word(2);
299 break;
300 case spv::OpTypeVector:
301 ss << "vec" << insn.word(3) << " of ";
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600302 DescribeTypeInner(ss, src, insn.word(2));
Chris Forbes47567b72017-06-09 12:09:45 -0700303 break;
304 case spv::OpTypeMatrix:
305 ss << "mat" << insn.word(3) << " of ";
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600306 DescribeTypeInner(ss, src, insn.word(2));
Chris Forbes47567b72017-06-09 12:09:45 -0700307 break;
308 case spv::OpTypeArray:
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600309 ss << "arr[" << GetConstantValue(src, insn.word(3)) << "] of ";
310 DescribeTypeInner(ss, src, insn.word(2));
Chris Forbes47567b72017-06-09 12:09:45 -0700311 break;
Chris Forbes062f1222018-08-21 15:34:15 -0700312 case spv::OpTypeRuntimeArray:
313 ss << "runtime arr[] of ";
314 DescribeTypeInner(ss, src, insn.word(2));
315 break;
Chris Forbes47567b72017-06-09 12:09:45 -0700316 case spv::OpTypePointer:
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600317 ss << "ptr to " << StorageClassName(insn.word(2)) << " ";
318 DescribeTypeInner(ss, src, insn.word(3));
Chris Forbes47567b72017-06-09 12:09:45 -0700319 break;
320 case spv::OpTypeStruct: {
321 ss << "struct of (";
322 for (unsigned i = 2; i < insn.len(); i++) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600323 DescribeTypeInner(ss, src, insn.word(i));
Chris Forbes47567b72017-06-09 12:09:45 -0700324 if (i == insn.len() - 1) {
325 ss << ")";
326 } else {
327 ss << ", ";
328 }
329 }
330 break;
331 }
332 case spv::OpTypeSampler:
333 ss << "sampler";
334 break;
335 case spv::OpTypeSampledImage:
336 ss << "sampler+";
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600337 DescribeTypeInner(ss, src, insn.word(2));
Chris Forbes47567b72017-06-09 12:09:45 -0700338 break;
339 case spv::OpTypeImage:
340 ss << "image(dim=" << insn.word(3) << ", sampled=" << insn.word(7) << ")";
341 break;
Shannon McPherson0fa28232018-11-01 11:59:02 -0600342 case spv::OpTypeAccelerationStructureNV:
Jeff Bolz105d6492018-09-29 15:46:44 -0500343 ss << "accelerationStruture";
344 break;
Chris Forbes47567b72017-06-09 12:09:45 -0700345 default:
346 ss << "oddtype";
347 break;
348 }
349}
350
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600351static std::string DescribeType(SHADER_MODULE_STATE const *src, unsigned type) {
Chris Forbes47567b72017-06-09 12:09:45 -0700352 std::ostringstream ss;
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600353 DescribeTypeInner(ss, src, type);
Chris Forbes47567b72017-06-09 12:09:45 -0700354 return ss.str();
355}
356
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600357static bool IsNarrowNumericType(spirv_inst_iter type) {
Chris Forbes47567b72017-06-09 12:09:45 -0700358 if (type.opcode() != spv::OpTypeInt && type.opcode() != spv::OpTypeFloat) return false;
359 return type.word(2) < 64;
360}
361
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600362static bool TypesMatch(SHADER_MODULE_STATE const *a, SHADER_MODULE_STATE const *b, unsigned a_type, unsigned b_type, bool a_arrayed,
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600363 bool b_arrayed, bool relaxed) {
Chris Forbes47567b72017-06-09 12:09:45 -0700364 // Walk two type trees together, and complain about differences
365 auto a_insn = a->get_def(a_type);
366 auto b_insn = b->get_def(b_type);
367 assert(a_insn != a->end());
368 assert(b_insn != b->end());
369
Chris Forbes062f1222018-08-21 15:34:15 -0700370 // Ignore runtime-sized arrays-- they cannot appear in these interfaces.
371
Chris Forbes47567b72017-06-09 12:09:45 -0700372 if (a_arrayed && a_insn.opcode() == spv::OpTypeArray) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600373 return TypesMatch(a, b, a_insn.word(2), b_type, false, b_arrayed, relaxed);
Chris Forbes47567b72017-06-09 12:09:45 -0700374 }
375
376 if (b_arrayed && b_insn.opcode() == spv::OpTypeArray) {
377 // We probably just found the extra level of arrayness in b_type: compare the type inside it to a_type
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600378 return TypesMatch(a, b, a_type, b_insn.word(2), a_arrayed, false, relaxed);
Chris Forbes47567b72017-06-09 12:09:45 -0700379 }
380
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600381 if (a_insn.opcode() == spv::OpTypeVector && relaxed && IsNarrowNumericType(b_insn)) {
382 return TypesMatch(a, b, a_insn.word(2), b_type, a_arrayed, b_arrayed, false);
Chris Forbes47567b72017-06-09 12:09:45 -0700383 }
384
385 if (a_insn.opcode() != b_insn.opcode()) {
386 return false;
387 }
388
389 if (a_insn.opcode() == spv::OpTypePointer) {
390 // Match on pointee type. storage class is expected to differ
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600391 return TypesMatch(a, b, a_insn.word(3), b_insn.word(3), a_arrayed, b_arrayed, relaxed);
Chris Forbes47567b72017-06-09 12:09:45 -0700392 }
393
394 if (a_arrayed || b_arrayed) {
395 // If we havent resolved array-of-verts by here, we're not going to.
396 return false;
397 }
398
399 switch (a_insn.opcode()) {
400 case spv::OpTypeBool:
401 return true;
402 case spv::OpTypeInt:
403 // Match on width, signedness
404 return a_insn.word(2) == b_insn.word(2) && a_insn.word(3) == b_insn.word(3);
405 case spv::OpTypeFloat:
406 // Match on width
407 return a_insn.word(2) == b_insn.word(2);
408 case spv::OpTypeVector:
409 // Match on element type, count.
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600410 if (!TypesMatch(a, b, a_insn.word(2), b_insn.word(2), a_arrayed, b_arrayed, false)) return false;
411 if (relaxed && IsNarrowNumericType(a->get_def(a_insn.word(2)))) {
Chris Forbes47567b72017-06-09 12:09:45 -0700412 return a_insn.word(3) >= b_insn.word(3);
413 } else {
414 return a_insn.word(3) == b_insn.word(3);
415 }
416 case spv::OpTypeMatrix:
417 // Match on element type, count.
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600418 return TypesMatch(a, b, a_insn.word(2), b_insn.word(2), a_arrayed, b_arrayed, false) &&
Dave Houltona9df0ce2018-02-07 10:51:23 -0700419 a_insn.word(3) == b_insn.word(3);
Chris Forbes47567b72017-06-09 12:09:45 -0700420 case spv::OpTypeArray:
421 // Match on element type, count. these all have the same layout. we don't get here if b_arrayed. This differs from
422 // vector & matrix types in that the array size is the id of a constant instruction, * not a literal within OpTypeArray
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600423 return TypesMatch(a, b, a_insn.word(2), b_insn.word(2), a_arrayed, b_arrayed, false) &&
424 GetConstantValue(a, a_insn.word(3)) == GetConstantValue(b, b_insn.word(3));
Chris Forbes47567b72017-06-09 12:09:45 -0700425 case spv::OpTypeStruct:
426 // Match on all element types
Dave Houltona9df0ce2018-02-07 10:51:23 -0700427 {
428 if (a_insn.len() != b_insn.len()) {
429 return false; // Structs cannot match if member counts differ
Chris Forbes47567b72017-06-09 12:09:45 -0700430 }
Chris Forbes47567b72017-06-09 12:09:45 -0700431
Dave Houltona9df0ce2018-02-07 10:51:23 -0700432 for (unsigned i = 2; i < a_insn.len(); i++) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600433 if (!TypesMatch(a, b, a_insn.word(i), b_insn.word(i), a_arrayed, b_arrayed, false)) {
Dave Houltona9df0ce2018-02-07 10:51:23 -0700434 return false;
435 }
436 }
437
438 return true;
439 }
Chris Forbes47567b72017-06-09 12:09:45 -0700440 default:
441 // Remaining types are CLisms, or may not appear in the interfaces we are interested in. Just claim no match.
442 return false;
443 }
444}
445
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600446static unsigned GetLocationsConsumedByType(SHADER_MODULE_STATE const *src, unsigned type, bool strip_array_level) {
Chris Forbes47567b72017-06-09 12:09:45 -0700447 auto insn = src->get_def(type);
448 assert(insn != src->end());
449
450 switch (insn.opcode()) {
451 case spv::OpTypePointer:
452 // See through the ptr -- this is only ever at the toplevel for graphics shaders we're never actually passing
453 // pointers around.
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600454 return GetLocationsConsumedByType(src, insn.word(3), strip_array_level);
Chris Forbes47567b72017-06-09 12:09:45 -0700455 case spv::OpTypeArray:
456 if (strip_array_level) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600457 return GetLocationsConsumedByType(src, insn.word(2), false);
Chris Forbes47567b72017-06-09 12:09:45 -0700458 } else {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600459 return GetConstantValue(src, insn.word(3)) * GetLocationsConsumedByType(src, insn.word(2), false);
Chris Forbes47567b72017-06-09 12:09:45 -0700460 }
461 case spv::OpTypeMatrix:
462 // Num locations is the dimension * element size
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600463 return insn.word(3) * GetLocationsConsumedByType(src, insn.word(2), false);
Chris Forbes47567b72017-06-09 12:09:45 -0700464 case spv::OpTypeVector: {
465 auto scalar_type = src->get_def(insn.word(2));
466 auto bit_width =
467 (scalar_type.opcode() == spv::OpTypeInt || scalar_type.opcode() == spv::OpTypeFloat) ? scalar_type.word(2) : 32;
468
469 // Locations are 128-bit wide; 3- and 4-component vectors of 64 bit types require two.
470 return (bit_width * insn.word(3) + 127) / 128;
471 }
472 default:
473 // Everything else is just 1.
474 return 1;
475
476 // TODO: extend to handle 64bit scalar types, whose vectors may need multiple locations.
477 }
478}
479
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600480static unsigned GetComponentsConsumedByType(SHADER_MODULE_STATE const *src, unsigned type, bool strip_array_level) {
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +0200481 auto insn = src->get_def(type);
482 assert(insn != src->end());
483
484 switch (insn.opcode()) {
485 case spv::OpTypePointer:
486 // See through the ptr -- this is only ever at the toplevel for graphics shaders we're never actually passing
487 // pointers around.
488 return GetComponentsConsumedByType(src, insn.word(3), strip_array_level);
489 case spv::OpTypeStruct: {
490 uint32_t sum = 0;
491 for (uint32_t i = 2; i < insn.len(); i++) { // i=2 to skip word(0) and word(1)=ID of struct
492 sum += GetComponentsConsumedByType(src, insn.word(i), false);
493 }
494 return sum;
495 }
Jeff Bolze9ee3d82019-05-29 13:45:13 -0500496 case spv::OpTypeArray:
497 if (strip_array_level) {
498 return GetComponentsConsumedByType(src, insn.word(2), false);
499 } else {
500 return GetConstantValue(src, insn.word(3)) * GetComponentsConsumedByType(src, insn.word(2), false);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +0200501 }
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +0200502 case spv::OpTypeMatrix:
503 // Num locations is the dimension * element size
504 return insn.word(3) * GetComponentsConsumedByType(src, insn.word(2), false);
505 case spv::OpTypeVector: {
506 auto scalar_type = src->get_def(insn.word(2));
507 auto bit_width =
508 (scalar_type.opcode() == spv::OpTypeInt || scalar_type.opcode() == spv::OpTypeFloat) ? scalar_type.word(2) : 32;
509 // One component is 32-bit
510 return (bit_width * insn.word(3) + 31) / 32;
511 }
512 case spv::OpTypeFloat: {
513 auto bit_width = insn.word(2);
514 return (bit_width + 31) / 32;
515 }
516 case spv::OpTypeInt: {
517 auto bit_width = insn.word(2);
518 return (bit_width + 31) / 32;
519 }
520 case spv::OpConstant:
521 return GetComponentsConsumedByType(src, insn.word(1), false);
522 default:
523 return 0;
524 }
525}
526
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600527static unsigned GetLocationsConsumedByFormat(VkFormat format) {
Chris Forbes47567b72017-06-09 12:09:45 -0700528 switch (format) {
529 case VK_FORMAT_R64G64B64A64_SFLOAT:
530 case VK_FORMAT_R64G64B64A64_SINT:
531 case VK_FORMAT_R64G64B64A64_UINT:
532 case VK_FORMAT_R64G64B64_SFLOAT:
533 case VK_FORMAT_R64G64B64_SINT:
534 case VK_FORMAT_R64G64B64_UINT:
535 return 2;
536 default:
537 return 1;
538 }
539}
540
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600541static unsigned GetFormatType(VkFormat fmt) {
Dave Houltona9df0ce2018-02-07 10:51:23 -0700542 if (FormatIsSInt(fmt)) return FORMAT_TYPE_SINT;
543 if (FormatIsUInt(fmt)) return FORMAT_TYPE_UINT;
544 if (FormatIsDepthAndStencil(fmt)) return FORMAT_TYPE_FLOAT | FORMAT_TYPE_UINT;
545 if (fmt == VK_FORMAT_UNDEFINED) return 0;
Chris Forbes47567b72017-06-09 12:09:45 -0700546 // everything else -- UNORM/SNORM/FLOAT/USCALED/SSCALED is all float in the shader.
547 return FORMAT_TYPE_FLOAT;
548}
549
550// characterizes a SPIR-V type appearing in an interface to a FF stage, for comparison to a VkFormat's characterization above.
Chris Forbes062f1222018-08-21 15:34:15 -0700551// also used for input attachments, as we statically know their format.
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600552static unsigned GetFundamentalType(SHADER_MODULE_STATE const *src, unsigned type) {
Chris Forbes47567b72017-06-09 12:09:45 -0700553 auto insn = src->get_def(type);
554 assert(insn != src->end());
555
556 switch (insn.opcode()) {
557 case spv::OpTypeInt:
558 return insn.word(3) ? FORMAT_TYPE_SINT : FORMAT_TYPE_UINT;
559 case spv::OpTypeFloat:
560 return FORMAT_TYPE_FLOAT;
561 case spv::OpTypeVector:
Chris Forbes47567b72017-06-09 12:09:45 -0700562 case spv::OpTypeMatrix:
Chris Forbes47567b72017-06-09 12:09:45 -0700563 case spv::OpTypeArray:
Chris Forbes062f1222018-08-21 15:34:15 -0700564 case spv::OpTypeRuntimeArray:
565 case spv::OpTypeImage:
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600566 return GetFundamentalType(src, insn.word(2));
Chris Forbes47567b72017-06-09 12:09:45 -0700567 case spv::OpTypePointer:
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600568 return GetFundamentalType(src, insn.word(3));
Chris Forbes47567b72017-06-09 12:09:45 -0700569
570 default:
571 return 0;
572 }
573}
574
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600575static uint32_t GetShaderStageId(VkShaderStageFlagBits stage) {
Chris Forbes47567b72017-06-09 12:09:45 -0700576 uint32_t bit_pos = uint32_t(u_ffs(stage));
577 return bit_pos - 1;
578}
579
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600580static spirv_inst_iter GetStructType(SHADER_MODULE_STATE const *src, spirv_inst_iter def, bool is_array_of_verts) {
Chris Forbes47567b72017-06-09 12:09:45 -0700581 while (true) {
582 if (def.opcode() == spv::OpTypePointer) {
583 def = src->get_def(def.word(3));
584 } else if (def.opcode() == spv::OpTypeArray && is_array_of_verts) {
585 def = src->get_def(def.word(2));
586 is_array_of_verts = false;
587 } else if (def.opcode() == spv::OpTypeStruct) {
588 return def;
589 } else {
590 return src->end();
591 }
592 }
593}
594
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600595static bool CollectInterfaceBlockMembers(SHADER_MODULE_STATE const *src, std::map<location_t, interface_var> *out,
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800596 bool is_array_of_verts, uint32_t id, uint32_t type_id, bool is_patch,
597 int /*first_location*/) {
Chris Forbes47567b72017-06-09 12:09:45 -0700598 // Walk down the type_id presented, trying to determine whether it's actually an interface block.
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600599 auto type = GetStructType(src, src->get_def(type_id), is_array_of_verts && !is_patch);
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800600 if (type == src->end() || !(src->get_decorations(type.word(1)).flags & decoration_set::block_bit)) {
Chris Forbes47567b72017-06-09 12:09:45 -0700601 // This isn't an interface block.
Chris Forbesa313d772017-06-13 13:59:41 -0700602 return false;
Chris Forbes47567b72017-06-09 12:09:45 -0700603 }
604
605 std::unordered_map<unsigned, unsigned> member_components;
606 std::unordered_map<unsigned, unsigned> member_relaxed_precision;
Chris Forbesa313d772017-06-13 13:59:41 -0700607 std::unordered_map<unsigned, unsigned> member_patch;
Chris Forbes47567b72017-06-09 12:09:45 -0700608
609 // Walk all the OpMemberDecorate for type's result id -- first pass, collect components.
610 for (auto insn : *src) {
611 if (insn.opcode() == spv::OpMemberDecorate && insn.word(1) == type.word(1)) {
612 unsigned member_index = insn.word(2);
613
614 if (insn.word(3) == spv::DecorationComponent) {
615 unsigned component = insn.word(4);
616 member_components[member_index] = component;
617 }
618
619 if (insn.word(3) == spv::DecorationRelaxedPrecision) {
620 member_relaxed_precision[member_index] = 1;
621 }
Chris Forbesa313d772017-06-13 13:59:41 -0700622
623 if (insn.word(3) == spv::DecorationPatch) {
624 member_patch[member_index] = 1;
625 }
Chris Forbes47567b72017-06-09 12:09:45 -0700626 }
627 }
628
Chris Forbesa313d772017-06-13 13:59:41 -0700629 // TODO: correctly handle location assignment from outside
630
Chris Forbes47567b72017-06-09 12:09:45 -0700631 // Second pass -- produce the output, from Location decorations
632 for (auto insn : *src) {
633 if (insn.opcode() == spv::OpMemberDecorate && insn.word(1) == type.word(1)) {
634 unsigned member_index = insn.word(2);
635 unsigned member_type_id = type.word(2 + member_index);
636
637 if (insn.word(3) == spv::DecorationLocation) {
638 unsigned location = insn.word(4);
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600639 unsigned num_locations = GetLocationsConsumedByType(src, member_type_id, false);
Chris Forbes47567b72017-06-09 12:09:45 -0700640 auto component_it = member_components.find(member_index);
641 unsigned component = component_it == member_components.end() ? 0 : component_it->second;
642 bool is_relaxed_precision = member_relaxed_precision.find(member_index) != member_relaxed_precision.end();
Dave Houltona9df0ce2018-02-07 10:51:23 -0700643 bool member_is_patch = is_patch || member_patch.count(member_index) > 0;
Chris Forbes47567b72017-06-09 12:09:45 -0700644
645 for (unsigned int offset = 0; offset < num_locations; offset++) {
646 interface_var v = {};
647 v.id = id;
648 // TODO: member index in interface_var too?
649 v.type_id = member_type_id;
650 v.offset = offset;
Chris Forbesa313d772017-06-13 13:59:41 -0700651 v.is_patch = member_is_patch;
Chris Forbes47567b72017-06-09 12:09:45 -0700652 v.is_block_member = true;
653 v.is_relaxed_precision = is_relaxed_precision;
654 (*out)[std::make_pair(location + offset, component)] = v;
655 }
656 }
657 }
658 }
Chris Forbesa313d772017-06-13 13:59:41 -0700659
660 return true;
Chris Forbes47567b72017-06-09 12:09:45 -0700661}
662
Ari Suonpaa696b3432019-03-11 14:02:57 +0200663static std::vector<uint32_t> FindEntrypointInterfaces(spirv_inst_iter entrypoint) {
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800664 assert(entrypoint.opcode() == spv::OpEntryPoint);
665
Ari Suonpaa696b3432019-03-11 14:02:57 +0200666 std::vector<uint32_t> interfaces;
667 // Find the end of the entrypoint's name string. additional zero bytes follow the actual null terminator, to fill out the
668 // rest of the word - so we only need to look at the last byte in the word to determine which word contains the terminator.
669 uint32_t word = 3;
670 while (entrypoint.word(word) & 0xff000000u) {
671 ++word;
672 }
673 ++word;
674
675 for (; word < entrypoint.len(); word++) interfaces.push_back(entrypoint.word(word));
676
677 return interfaces;
678}
679
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600680static std::map<location_t, interface_var> CollectInterfaceByLocation(SHADER_MODULE_STATE const *src, spirv_inst_iter entrypoint,
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600681 spv::StorageClass sinterface, bool is_array_of_verts) {
Chris Forbes47567b72017-06-09 12:09:45 -0700682 // TODO: handle index=1 dual source outputs from FS -- two vars will have the same location, and we DON'T want to clobber.
683
Chris Forbes47567b72017-06-09 12:09:45 -0700684 std::map<location_t, interface_var> out;
685
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800686 for (uint32_t iid : FindEntrypointInterfaces(entrypoint)) {
687 auto insn = src->get_def(iid);
Chris Forbes47567b72017-06-09 12:09:45 -0700688 assert(insn != src->end());
689 assert(insn.opcode() == spv::OpVariable);
690
691 if (insn.word(3) == static_cast<uint32_t>(sinterface)) {
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800692 auto d = src->get_decorations(iid);
Chris Forbes47567b72017-06-09 12:09:45 -0700693 unsigned id = insn.word(2);
694 unsigned type = insn.word(1);
695
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800696 int location = d.location;
697 int builtin = d.builtin;
698 unsigned component = d.component;
699 bool is_patch = (d.flags & decoration_set::patch_bit) != 0;
700 bool is_relaxed_precision = (d.flags & decoration_set::relaxed_precision_bit) != 0;
Chris Forbes47567b72017-06-09 12:09:45 -0700701
Dave Houltona9df0ce2018-02-07 10:51:23 -0700702 if (builtin != -1)
703 continue;
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800704 else if (!CollectInterfaceBlockMembers(src, &out, is_array_of_verts, id, type, is_patch, location)) {
Chris Forbes47567b72017-06-09 12:09:45 -0700705 // A user-defined interface variable, with a location. Where a variable occupied multiple locations, emit
706 // one result for each.
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600707 unsigned num_locations = GetLocationsConsumedByType(src, type, is_array_of_verts && !is_patch);
Chris Forbes47567b72017-06-09 12:09:45 -0700708 for (unsigned int offset = 0; offset < num_locations; offset++) {
709 interface_var v = {};
710 v.id = id;
711 v.type_id = type;
712 v.offset = offset;
713 v.is_patch = is_patch;
714 v.is_relaxed_precision = is_relaxed_precision;
715 out[std::make_pair(location + offset, component)] = v;
716 }
Chris Forbes47567b72017-06-09 12:09:45 -0700717 }
718 }
719 }
720
721 return out;
722}
723
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600724static std::vector<uint32_t> CollectBuiltinBlockMembers(SHADER_MODULE_STATE const *src, spirv_inst_iter entrypoint,
Ari Suonpaa696b3432019-03-11 14:02:57 +0200725 uint32_t storageClass) {
726 std::vector<uint32_t> variables;
727 std::vector<uint32_t> builtinStructMembers;
728 std::vector<uint32_t> builtinDecorations;
729
730 for (auto insn : *src) {
731 switch (insn.opcode()) {
732 // Find all built-in member decorations
733 case spv::OpMemberDecorate:
734 if (insn.word(3) == spv::DecorationBuiltIn) {
735 builtinStructMembers.push_back(insn.word(1));
736 }
737 break;
738 // Find all built-in decorations
739 case spv::OpDecorate:
740 switch (insn.word(2)) {
741 case spv::DecorationBlock: {
742 uint32_t blockID = insn.word(1);
743 for (auto builtInBlockID : builtinStructMembers) {
744 // Check if one of the members of the block are built-in -> the block is built-in
745 if (blockID == builtInBlockID) {
746 builtinDecorations.push_back(blockID);
747 break;
748 }
749 }
750 break;
751 }
752 case spv::DecorationBuiltIn:
753 builtinDecorations.push_back(insn.word(1));
754 break;
755 default:
756 break;
757 }
758 break;
759 default:
760 break;
761 }
762 }
763
764 // Find all interface variables belonging to the entrypoint and matching the storage class
765 for (uint32_t id : FindEntrypointInterfaces(entrypoint)) {
766 auto def = src->get_def(id);
767 assert(def != src->end());
768 assert(def.opcode() == spv::OpVariable);
769
770 if (def.word(3) == storageClass) variables.push_back(def.word(1));
771 }
772
773 // Find all members belonging to the builtin block selected
774 std::vector<uint32_t> builtinBlockMembers;
775 for (auto &var : variables) {
776 auto def = src->get_def(src->get_def(var).word(3));
777
778 // It could be an array of IO blocks. The element type should be the struct defining the block contents
779 if (def.opcode() == spv::OpTypeArray) def = src->get_def(def.word(2));
780
781 // Now find all members belonging to the struct defining the IO block
782 if (def.opcode() == spv::OpTypeStruct) {
783 for (auto builtInID : builtinDecorations) {
784 if (builtInID == def.word(1)) {
785 for (int i = 2; i < (int)def.len(); i++)
786 builtinBlockMembers.push_back(spv::BuiltInMax); // Start with undefined builtin for each struct member.
787 // These shouldn't be left after replacing.
788 for (auto insn : *src) {
789 if (insn.opcode() == spv::OpMemberDecorate && insn.word(1) == builtInID &&
790 insn.word(3) == spv::DecorationBuiltIn) {
791 auto structIndex = insn.word(2);
792 assert(structIndex < builtinBlockMembers.size());
793 builtinBlockMembers[structIndex] = insn.word(4);
794 }
795 }
796 }
797 }
798 }
799 }
800
801 return builtinBlockMembers;
802}
803
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600804static std::vector<std::pair<uint32_t, interface_var>> CollectInterfaceByInputAttachmentIndex(
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600805 SHADER_MODULE_STATE const *src, std::unordered_set<uint32_t> const &accessible_ids) {
Chris Forbes47567b72017-06-09 12:09:45 -0700806 std::vector<std::pair<uint32_t, interface_var>> out;
807
808 for (auto insn : *src) {
809 if (insn.opcode() == spv::OpDecorate) {
810 if (insn.word(2) == spv::DecorationInputAttachmentIndex) {
811 auto attachment_index = insn.word(3);
812 auto id = insn.word(1);
813
814 if (accessible_ids.count(id)) {
815 auto def = src->get_def(id);
816 assert(def != src->end());
locke-lunarg9a16ebb2020-07-30 16:56:33 -0600817 if (def.opcode() == spv::OpVariable && def.word(3) == spv::StorageClassUniformConstant) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600818 auto num_locations = GetLocationsConsumedByType(src, def.word(1), false);
Chris Forbes47567b72017-06-09 12:09:45 -0700819 for (unsigned int offset = 0; offset < num_locations; offset++) {
820 interface_var v = {};
821 v.id = id;
822 v.type_id = def.word(1);
823 v.offset = offset;
824 out.emplace_back(attachment_index + offset, v);
825 }
826 }
827 }
828 }
829 }
830 }
831
832 return out;
833}
834
locke-lunarg6f760f12020-06-05 16:19:37 -0600835static bool IsWritableDescriptorType(SHADER_MODULE_STATE const *module, const spirv_inst_iter &id_it, bool is_storage_buffer) {
836 uint32_t type_id = id_it.word(1);
Chris Forbes8af24522018-03-07 11:37:45 -0800837 auto type = module->get_def(type_id);
838
839 // Strip off any array or ptrs. Where we remove array levels, adjust the descriptor count for each dimension.
Chris Forbes062f1222018-08-21 15:34:15 -0700840 while (type.opcode() == spv::OpTypeArray || type.opcode() == spv::OpTypePointer || type.opcode() == spv::OpTypeRuntimeArray) {
841 if (type.opcode() == spv::OpTypeArray || type.opcode() == spv::OpTypeRuntimeArray) {
Chris Forbes8d31e5d2018-10-08 17:19:15 -0700842 type = module->get_def(type.word(2)); // Element type
Chris Forbes8af24522018-03-07 11:37:45 -0800843 } else {
Chris Forbes8d31e5d2018-10-08 17:19:15 -0700844 type = module->get_def(type.word(3)); // Pointee type
Chris Forbes8af24522018-03-07 11:37:45 -0800845 }
846 }
Chris Forbes8af24522018-03-07 11:37:45 -0800847 switch (type.opcode()) {
848 case spv::OpTypeImage: {
849 auto dim = type.word(3);
850 auto sampled = type.word(7);
locke-lunarg6f760f12020-06-05 16:19:37 -0600851 if (sampled == 2 && dim != spv::DimSubpassData) {
852 std::vector<unsigned> imagwrite_members;
853 std::unordered_map<unsigned, unsigned> load_members;
854 std::unordered_map<unsigned, unsigned> accesschain_members;
855 unsigned int id = id_it.word(2);
856
857 for (auto insn : *module) {
858 switch (insn.opcode()) {
859 case spv::OpImageWrite: {
860 imagwrite_members.emplace_back(insn.word(1)); // Load id
861 break;
862 }
863 case spv::OpLoad: {
864 // 2: Load id, 3: object id or AccessChain id
865 load_members.insert(std::make_pair(insn.word(2), insn.word(3)));
866 break;
867 }
868 case spv::OpAccessChain: {
869 // 2: AccessChain id, 3: object id
870 if (insn.word(3) == id) {
871 accesschain_members.insert(std::make_pair(insn.word(2), insn.word(3)));
872 }
873 break;
874 }
875 default:
876 break;
877 }
878 }
879 if (imagwrite_members.empty() || load_members.empty()) {
880 return false;
881 }
882 for (auto load_id : imagwrite_members) {
883 auto load_it = load_members.find(load_id);
884 if (load_it == load_members.end()) {
885 continue;
886 }
887 if (load_it->second == id) {
888 return true;
889 }
890 auto accesschain_it = accesschain_members.find(load_it->second);
891 if (accesschain_it == accesschain_members.end()) {
892 continue;
893 }
894 return true;
895 }
896 }
897 return false;
Chris Forbes8af24522018-03-07 11:37:45 -0800898 }
899
Chris Forbes8d31e5d2018-10-08 17:19:15 -0700900 case spv::OpTypeStruct: {
901 std::unordered_set<unsigned> nonwritable_members;
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800902 if (module->get_decorations(type.word(1)).flags & decoration_set::buffer_block_bit) is_storage_buffer = true;
Chris Forbes8af24522018-03-07 11:37:45 -0800903 for (auto insn : *module) {
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800904 if (insn.opcode() == spv::OpMemberDecorate && insn.word(1) == type.word(1) &&
905 insn.word(3) == spv::DecorationNonWritable) {
Chris Forbes8d31e5d2018-10-08 17:19:15 -0700906 nonwritable_members.insert(insn.word(2));
Chris Forbes8af24522018-03-07 11:37:45 -0800907 }
908 }
Chris Forbes8d31e5d2018-10-08 17:19:15 -0700909
910 // A buffer is writable if it's either flavor of storage buffer, and has any member not decorated
911 // as nonwritable.
locke-lunarg6f760f12020-06-05 16:19:37 -0600912 if (is_storage_buffer && nonwritable_members.size() != type.len() - 2) {
913 std::vector<unsigned> store_members;
914 std::unordered_map<unsigned, unsigned> accesschain_members;
915 unsigned int id = id_it.word(2);
916
917 for (auto insn : *module) {
918 switch (insn.opcode()) {
919 case spv::OpStore:
920 case spv::OpAtomicStore: {
921 if (insn.word(1) == id) {
922 return true;
923 }
924 store_members.emplace_back(insn.word(1)); // object id or AccessChain id
925 break;
926 }
927 case spv::OpAccessChain: {
928 // 2: AccessChain id, 3: object id
929 if (insn.word(3) == id) {
930 accesschain_members.insert(std::make_pair(insn.word(2), insn.word(3)));
931 }
932 break;
933 }
934 default:
935 break;
936 }
937 }
938 if (store_members.empty() || accesschain_members.empty()) {
939 return false;
940 }
941 for (auto oid : store_members) {
942 auto accesschain_it = accesschain_members.find(oid);
943 if (accesschain_it == accesschain_members.end()) {
944 continue;
945 }
946 return true;
947 }
948 }
949 return false;
Chris Forbes8d31e5d2018-10-08 17:19:15 -0700950 }
Chris Forbes8af24522018-03-07 11:37:45 -0800951 }
952
953 return false;
954}
955
locke-lunargd9a069d2019-09-17 01:50:19 -0600956std::vector<std::pair<descriptor_slot_t, interface_var>> CollectInterfaceByDescriptorSlot(
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -0700957 SHADER_MODULE_STATE const *src, std::unordered_set<uint32_t> const &accessible_ids, bool *has_writable_descriptor) {
Chris Forbes47567b72017-06-09 12:09:45 -0700958 std::vector<std::pair<descriptor_slot_t, interface_var>> out;
959
960 for (auto id : accessible_ids) {
961 auto insn = src->get_def(id);
962 assert(insn != src->end());
963
964 if (insn.opcode() == spv::OpVariable &&
Chris Forbes9f89d752018-03-07 12:57:48 -0800965 (insn.word(3) == spv::StorageClassUniform || insn.word(3) == spv::StorageClassUniformConstant ||
966 insn.word(3) == spv::StorageClassStorageBuffer)) {
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800967 auto d = src->get_decorations(insn.word(2));
968 unsigned set = d.descriptor_set;
969 unsigned binding = d.binding;
Chris Forbes47567b72017-06-09 12:09:45 -0700970
971 interface_var v = {};
972 v.id = insn.word(2);
973 v.type_id = insn.word(1);
locke-lunarg654e3692020-06-04 17:19:15 -0600974 v.is_writable = false;
locke-lunarg9a16ebb2020-07-30 16:56:33 -0600975 v.input_index = -1;
Chris Forbes8af24522018-03-07 11:37:45 -0800976
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800977 if (!(d.flags & decoration_set::nonwritable_bit) &&
locke-lunarg6f760f12020-06-05 16:19:37 -0600978 IsWritableDescriptorType(src, insn, insn.word(3) == spv::StorageClassStorageBuffer)) {
Chris Forbes8af24522018-03-07 11:37:45 -0800979 *has_writable_descriptor = true;
locke-lunarg654e3692020-06-04 17:19:15 -0600980 v.is_writable = true;
Chris Forbes8af24522018-03-07 11:37:45 -0800981 }
locke-lunarg9a16ebb2020-07-30 16:56:33 -0600982 if (d.flags & decoration_set::input_attachment_index_bit) {
983 v.input_index = d.input_attachment_index;
984 }
locke-lunarg654e3692020-06-04 17:19:15 -0600985 out.emplace_back(std::make_pair(set, binding), v);
Chris Forbes47567b72017-06-09 12:09:45 -0700986 }
987 }
988
989 return out;
990}
991
locke-lunarg96dc9632020-06-10 17:22:18 -0600992std::unordered_set<uint32_t> CollectWritableOutputLocationinFS(const SHADER_MODULE_STATE &module,
993 const VkPipelineShaderStageCreateInfo &stage_info) {
994 std::unordered_set<uint32_t> location_list;
995 if (stage_info.stage != VK_SHADER_STAGE_FRAGMENT_BIT) return location_list;
996 const auto entrypoint = FindEntrypoint(&module, stage_info.pName, stage_info.stage);
997 const auto outputs = CollectInterfaceByLocation(&module, entrypoint, spv::StorageClassOutput, false);
998 std::unordered_set<unsigned> store_members;
999 std::unordered_map<unsigned, unsigned> accesschain_members;
1000
1001 for (auto insn : module) {
1002 switch (insn.opcode()) {
1003 case spv::OpStore:
1004 case spv::OpAtomicStore: {
1005 store_members.insert(insn.word(1)); // object id or AccessChain id
1006 break;
1007 }
1008 case spv::OpAccessChain: {
1009 // 2: AccessChain id, 3: object id
1010 if (insn.word(3)) accesschain_members.insert(std::make_pair(insn.word(2), insn.word(3)));
1011 break;
1012 }
1013 default:
1014 break;
1015 }
1016 }
1017 if (store_members.empty()) {
1018 return location_list;
1019 }
1020 for (auto output : outputs) {
1021 auto store_it = store_members.find(output.second.id);
1022 if (store_it != store_members.end()) {
1023 location_list.insert(output.first.first);
1024 store_members.erase(store_it);
1025 continue;
1026 }
1027 store_it = store_members.begin();
1028 while (store_it != store_members.end()) {
1029 auto accesschain_it = accesschain_members.find(*store_it);
1030 if (accesschain_it == accesschain_members.end()) {
1031 ++store_it;
1032 continue;
1033 }
1034 if (accesschain_it->second == output.second.id) {
1035 location_list.insert(output.first.first);
1036 store_members.erase(store_it);
1037 accesschain_members.erase(accesschain_it);
1038 break;
1039 }
1040 ++store_it;
1041 }
1042 }
1043 return location_list;
1044}
1045
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001046bool CoreChecks::ValidateViConsistency(VkPipelineVertexInputStateCreateInfo const *vi) const {
Chris Forbes47567b72017-06-09 12:09:45 -07001047 // Walk the binding descriptions, which describe the step rate and stride of each vertex buffer. Each binding should
1048 // be specified only once.
1049 std::unordered_map<uint32_t, VkVertexInputBindingDescription const *> bindings;
1050 bool skip = false;
1051
1052 for (unsigned i = 0; i < vi->vertexBindingDescriptionCount; i++) {
1053 auto desc = &vi->pVertexBindingDescriptions[i];
1054 auto &binding = bindings[desc->binding];
1055 if (binding) {
Dave Houlton78d09922018-05-17 15:48:45 -06001056 // TODO: "VUID-VkGraphicsPipelineCreateInfo-pStages-00742" perhaps?
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001057 skip |= LogError(device, kVUID_Core_Shader_InconsistentVi, "Duplicate vertex input binding descriptions for binding %d",
1058 desc->binding);
Chris Forbes47567b72017-06-09 12:09:45 -07001059 } else {
1060 binding = desc;
1061 }
1062 }
1063
1064 return skip;
1065}
1066
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001067bool CoreChecks::ValidateViAgainstVsInputs(VkPipelineVertexInputStateCreateInfo const *vi, SHADER_MODULE_STATE const *vs,
1068 spirv_inst_iter entrypoint) const {
Chris Forbes47567b72017-06-09 12:09:45 -07001069 bool skip = false;
1070
Petr Kraus25810d02019-08-27 17:41:15 +02001071 const auto inputs = CollectInterfaceByLocation(vs, entrypoint, spv::StorageClassInput, false);
Chris Forbes47567b72017-06-09 12:09:45 -07001072
1073 // Build index by location
Petr Kraus25810d02019-08-27 17:41:15 +02001074 std::map<uint32_t, const VkVertexInputAttributeDescription *> attribs;
Chris Forbes47567b72017-06-09 12:09:45 -07001075 if (vi) {
Petr Kraus25810d02019-08-27 17:41:15 +02001076 for (uint32_t i = 0; i < vi->vertexAttributeDescriptionCount; ++i) {
1077 const auto num_locations = GetLocationsConsumedByFormat(vi->pVertexAttributeDescriptions[i].format);
1078 for (uint32_t j = 0; j < num_locations; ++j) {
Chris Forbes47567b72017-06-09 12:09:45 -07001079 attribs[vi->pVertexAttributeDescriptions[i].location + j] = &vi->pVertexAttributeDescriptions[i];
1080 }
1081 }
1082 }
1083
Petr Kraus25810d02019-08-27 17:41:15 +02001084 struct AttribInputPair {
1085 const VkVertexInputAttributeDescription *attrib = nullptr;
1086 const interface_var *input = nullptr;
1087 };
1088 std::map<uint32_t, AttribInputPair> location_map;
1089 for (const auto &attrib_it : attribs) location_map[attrib_it.first].attrib = attrib_it.second;
1090 for (const auto &input_it : inputs) location_map[input_it.first.first].input = &input_it.second;
Chris Forbes47567b72017-06-09 12:09:45 -07001091
Jamie Madillc1f7ca82020-03-16 17:08:26 -04001092 for (const auto &location_it : location_map) {
Petr Kraus25810d02019-08-27 17:41:15 +02001093 const auto location = location_it.first;
1094 const auto attrib = location_it.second.attrib;
1095 const auto input = location_it.second.input;
Mark Lobodzinski7caa39c2018-07-25 15:48:34 -06001096
Petr Kraus25810d02019-08-27 17:41:15 +02001097 if (attrib && !input) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001098 skip |= LogPerformanceWarning(vs->vk_shader_module, kVUID_Core_Shader_OutputNotConsumed,
1099 "Vertex attribute at location %" PRIu32 " not consumed by vertex shader", location);
Petr Kraus25810d02019-08-27 17:41:15 +02001100 } else if (!attrib && input) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001101 skip |= LogError(vs->vk_shader_module, kVUID_Core_Shader_InputNotProduced,
1102 "Vertex shader consumes input at location %" PRIu32 " but not provided", location);
Petr Kraus25810d02019-08-27 17:41:15 +02001103 } else if (attrib && input) {
1104 const auto attrib_type = GetFormatType(attrib->format);
1105 const auto input_type = GetFundamentalType(vs, input->type_id);
Chris Forbes47567b72017-06-09 12:09:45 -07001106
1107 // Type checking
1108 if (!(attrib_type & input_type)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001109 skip |= LogError(vs->vk_shader_module, kVUID_Core_Shader_InterfaceTypeMismatch,
1110 "Attribute type of `%s` at location %" PRIu32 " does not match vertex shader input type of `%s`",
1111 string_VkFormat(attrib->format), location, DescribeType(vs, input->type_id).c_str());
Chris Forbes47567b72017-06-09 12:09:45 -07001112 }
Petr Kraus25810d02019-08-27 17:41:15 +02001113 } else { // !attrib && !input
1114 assert(false); // at least one exists in the map
Chris Forbes47567b72017-06-09 12:09:45 -07001115 }
1116 }
1117
1118 return skip;
1119}
1120
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001121bool CoreChecks::ValidateFsOutputsAgainstRenderPass(SHADER_MODULE_STATE const *fs, spirv_inst_iter entrypoint,
1122 PIPELINE_STATE const *pipeline, uint32_t subpass_index) const {
Petr Kraus25810d02019-08-27 17:41:15 +02001123 bool skip = false;
Chris Forbes8bca1652017-07-20 11:10:09 -07001124
Petr Kraus25810d02019-08-27 17:41:15 +02001125 const auto rpci = pipeline->rp_state->createInfo.ptr();
1126
Jeremy Hayes3699c7c2019-10-09 12:24:55 -06001127 struct Attachment {
1128 const VkAttachmentReference2KHR *reference = nullptr;
1129 const VkAttachmentDescription2KHR *attachment = nullptr;
1130 const interface_var *output = nullptr;
1131 };
1132 std::map<uint32_t, Attachment> location_map;
1133
Petr Kraus25810d02019-08-27 17:41:15 +02001134 const auto subpass = rpci->pSubpasses[subpass_index];
1135 for (uint32_t i = 0; i < subpass.colorAttachmentCount; ++i) {
Jeremy Hayes3699c7c2019-10-09 12:24:55 -06001136 auto const &reference = subpass.pColorAttachments[i];
1137 location_map[i].reference = &reference;
1138 if (reference.attachment != VK_ATTACHMENT_UNUSED &&
1139 rpci->pAttachments[reference.attachment].format != VK_FORMAT_UNDEFINED) {
1140 location_map[i].attachment = &rpci->pAttachments[reference.attachment];
Chris Forbes47567b72017-06-09 12:09:45 -07001141 }
1142 }
1143
Chris Forbes47567b72017-06-09 12:09:45 -07001144 // TODO: dual source blend index (spv::DecIndex, zero if not provided)
1145
Petr Kraus25810d02019-08-27 17:41:15 +02001146 const auto outputs = CollectInterfaceByLocation(fs, entrypoint, spv::StorageClassOutput, false);
Jeremy Hayes3699c7c2019-10-09 12:24:55 -06001147 for (const auto &output_it : outputs) {
1148 auto const location = output_it.first.first;
1149 location_map[location].output = &output_it.second;
1150 }
Chris Forbes47567b72017-06-09 12:09:45 -07001151
Petr Kraus25810d02019-08-27 17:41:15 +02001152 const bool alphaToCoverageEnabled = pipeline->graphicsPipelineCI.pMultisampleState != NULL &&
1153 pipeline->graphicsPipelineCI.pMultisampleState->alphaToCoverageEnable == VK_TRUE;
Chris Forbes47567b72017-06-09 12:09:45 -07001154
Jamie Madillc1f7ca82020-03-16 17:08:26 -04001155 for (const auto &location_it : location_map) {
Jeremy Hayes3699c7c2019-10-09 12:24:55 -06001156 const auto reference = location_it.second.reference;
1157 if (reference != nullptr && reference->attachment == VK_ATTACHMENT_UNUSED) {
1158 continue;
1159 }
1160
Petr Kraus25810d02019-08-27 17:41:15 +02001161 const auto location = location_it.first;
1162 const auto attachment = location_it.second.attachment;
1163 const auto output = location_it.second.output;
Petr Kraus25810d02019-08-27 17:41:15 +02001164 if (attachment && !output) {
1165 if (pipeline->attachments[location].colorWriteMask != 0) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001166 skip |= LogWarning(fs->vk_shader_module, kVUID_Core_Shader_InputNotProduced,
1167 "Attachment %" PRIu32
1168 " not written by fragment shader; undefined values will be written to attachment",
1169 location);
Petr Kraus25810d02019-08-27 17:41:15 +02001170 }
1171 } else if (!attachment && output) {
1172 if (!(alphaToCoverageEnabled && location == 0)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001173 skip |= LogWarning(fs->vk_shader_module, kVUID_Core_Shader_OutputNotConsumed,
1174 "fragment shader writes to output location %" PRIu32 " with no matching attachment", location);
Ari Suonpaa412b23b2019-02-26 07:56:58 +02001175 }
Petr Kraus25810d02019-08-27 17:41:15 +02001176 } else if (attachment && output) {
1177 const auto attachment_type = GetFormatType(attachment->format);
1178 const auto output_type = GetFundamentalType(fs, output->type_id);
Chris Forbes47567b72017-06-09 12:09:45 -07001179
1180 // Type checking
Petr Kraus25810d02019-08-27 17:41:15 +02001181 if (!(output_type & attachment_type)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001182 skip |=
1183 LogWarning(fs->vk_shader_module, kVUID_Core_Shader_InterfaceTypeMismatch,
1184 "Attachment %" PRIu32
1185 " of type `%s` does not match fragment shader output type of `%s`; resulting values are undefined",
1186 location, string_VkFormat(attachment->format), DescribeType(fs, output->type_id).c_str());
Chris Forbes47567b72017-06-09 12:09:45 -07001187 }
Petr Kraus25810d02019-08-27 17:41:15 +02001188 } else { // !attachment && !output
1189 assert(false); // at least one exists in the map
Chris Forbes47567b72017-06-09 12:09:45 -07001190 }
1191 }
1192
Petr Kraus25810d02019-08-27 17:41:15 +02001193 const auto output_zero = location_map.count(0) ? location_map[0].output : nullptr;
1194 bool locationZeroHasAlpha = output_zero && fs->get_def(output_zero->type_id) != fs->end() &&
1195 GetComponentsConsumedByType(fs, output_zero->type_id, false) == 4;
Ari Suonpaa412b23b2019-02-26 07:56:58 +02001196 if (alphaToCoverageEnabled && !locationZeroHasAlpha) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001197 skip |= LogError(fs->vk_shader_module, kVUID_Core_Shader_NoAlphaAtLocation0WithAlphaToCoverage,
1198 "fragment shader doesn't declare alpha output at location 0 even though alpha to coverage is enabled.");
Ari Suonpaa412b23b2019-02-26 07:56:58 +02001199 }
1200
Chris Forbes47567b72017-06-09 12:09:45 -07001201 return skip;
1202}
1203
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06001204// For PointSize analysis we need to know if the variable decorated with the PointSize built-in was actually written to.
1205// This function examines instructions in the static call tree for a write to this variable.
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06001206static bool IsPointSizeWritten(SHADER_MODULE_STATE const *src, spirv_inst_iter builtin_instr, spirv_inst_iter entrypoint) {
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06001207 auto type = builtin_instr.opcode();
1208 uint32_t target_id = builtin_instr.word(1);
1209 bool init_complete = false;
1210
1211 if (type == spv::OpMemberDecorate) {
1212 // Built-in is part of a structure -- examine instructions up to first function body to get initial IDs
1213 auto insn = entrypoint;
1214 while (!init_complete && (insn.opcode() != spv::OpFunction)) {
1215 switch (insn.opcode()) {
1216 case spv::OpTypePointer:
1217 if ((insn.word(3) == target_id) && (insn.word(2) == spv::StorageClassOutput)) {
1218 target_id = insn.word(1);
1219 }
1220 break;
1221 case spv::OpVariable:
1222 if (insn.word(1) == target_id) {
1223 target_id = insn.word(2);
1224 init_complete = true;
1225 }
1226 break;
1227 }
1228 insn++;
1229 }
1230 }
1231
Mark Lobodzinskif84b0b42018-09-11 14:54:32 -06001232 if (!init_complete && (type == spv::OpMemberDecorate)) return false;
1233
1234 bool found_write = false;
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06001235 std::unordered_set<uint32_t> worklist;
1236 worklist.insert(entrypoint.word(2));
1237
1238 // Follow instructions in call graph looking for writes to target
1239 while (!worklist.empty() && !found_write) {
1240 auto id_iter = worklist.begin();
1241 auto id = *id_iter;
1242 worklist.erase(id_iter);
1243
1244 auto insn = src->get_def(id);
1245 if (insn == src->end()) {
1246 continue;
1247 }
1248
1249 if (insn.opcode() == spv::OpFunction) {
1250 // Scan body of function looking for other function calls or items in our ID chain
1251 while (++insn, insn.opcode() != spv::OpFunctionEnd) {
1252 switch (insn.opcode()) {
1253 case spv::OpAccessChain:
1254 if (insn.word(3) == target_id) {
1255 if (type == spv::OpMemberDecorate) {
1256 auto value = GetConstantValue(src, insn.word(4));
1257 if (value == builtin_instr.word(2)) {
1258 target_id = insn.word(2);
1259 }
1260 } else {
1261 target_id = insn.word(2);
1262 }
1263 }
1264 break;
1265 case spv::OpStore:
1266 if (insn.word(1) == target_id) {
1267 found_write = true;
1268 }
1269 break;
1270 case spv::OpFunctionCall:
1271 worklist.insert(insn.word(3));
1272 break;
1273 }
1274 }
1275 }
1276 }
1277 return found_write;
1278}
1279
Chris Forbes47567b72017-06-09 12:09:45 -07001280// For some analyses, we need to know about all ids referenced by the static call tree of a particular entrypoint. This is
1281// important for identifying the set of shader resources actually used by an entrypoint, for example.
1282// Note: we only explore parts of the image which might actually contain ids we care about for the above analyses.
1283// - NOT the shader input/output interfaces.
1284//
1285// TODO: The set of interesting opcodes here was determined by eyeballing the SPIRV spec. It might be worth
1286// converting parts of this to be generated from the machine-readable spec instead.
locke-lunargd9a069d2019-09-17 01:50:19 -06001287std::unordered_set<uint32_t> MarkAccessibleIds(SHADER_MODULE_STATE const *src, spirv_inst_iter entrypoint) {
Chris Forbes47567b72017-06-09 12:09:45 -07001288 std::unordered_set<uint32_t> ids;
1289 std::unordered_set<uint32_t> worklist;
1290 worklist.insert(entrypoint.word(2));
1291
1292 while (!worklist.empty()) {
1293 auto id_iter = worklist.begin();
1294 auto id = *id_iter;
1295 worklist.erase(id_iter);
1296
1297 auto insn = src->get_def(id);
1298 if (insn == src->end()) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06001299 // ID is something we didn't collect in BuildDefIndex. that's OK -- we'll stumble across all kinds of things here
Chris Forbes47567b72017-06-09 12:09:45 -07001300 // that we may not care about.
1301 continue;
1302 }
1303
1304 // Try to add to the output set
1305 if (!ids.insert(id).second) {
1306 continue; // If we already saw this id, we don't want to walk it again.
1307 }
1308
1309 switch (insn.opcode()) {
1310 case spv::OpFunction:
1311 // Scan whole body of the function, enlisting anything interesting
1312 while (++insn, insn.opcode() != spv::OpFunctionEnd) {
1313 switch (insn.opcode()) {
1314 case spv::OpLoad:
1315 case spv::OpAtomicLoad:
1316 case spv::OpAtomicExchange:
1317 case spv::OpAtomicCompareExchange:
1318 case spv::OpAtomicCompareExchangeWeak:
1319 case spv::OpAtomicIIncrement:
1320 case spv::OpAtomicIDecrement:
1321 case spv::OpAtomicIAdd:
1322 case spv::OpAtomicISub:
1323 case spv::OpAtomicSMin:
1324 case spv::OpAtomicUMin:
1325 case spv::OpAtomicSMax:
1326 case spv::OpAtomicUMax:
1327 case spv::OpAtomicAnd:
1328 case spv::OpAtomicOr:
1329 case spv::OpAtomicXor:
1330 worklist.insert(insn.word(3)); // ptr
1331 break;
1332 case spv::OpStore:
1333 case spv::OpAtomicStore:
1334 worklist.insert(insn.word(1)); // ptr
1335 break;
1336 case spv::OpAccessChain:
1337 case spv::OpInBoundsAccessChain:
1338 worklist.insert(insn.word(3)); // base ptr
1339 break;
1340 case spv::OpSampledImage:
1341 case spv::OpImageSampleImplicitLod:
1342 case spv::OpImageSampleExplicitLod:
1343 case spv::OpImageSampleDrefImplicitLod:
1344 case spv::OpImageSampleDrefExplicitLod:
1345 case spv::OpImageSampleProjImplicitLod:
1346 case spv::OpImageSampleProjExplicitLod:
1347 case spv::OpImageSampleProjDrefImplicitLod:
1348 case spv::OpImageSampleProjDrefExplicitLod:
1349 case spv::OpImageFetch:
1350 case spv::OpImageGather:
1351 case spv::OpImageDrefGather:
1352 case spv::OpImageRead:
1353 case spv::OpImage:
1354 case spv::OpImageQueryFormat:
1355 case spv::OpImageQueryOrder:
1356 case spv::OpImageQuerySizeLod:
1357 case spv::OpImageQuerySize:
1358 case spv::OpImageQueryLod:
1359 case spv::OpImageQueryLevels:
1360 case spv::OpImageQuerySamples:
1361 case spv::OpImageSparseSampleImplicitLod:
1362 case spv::OpImageSparseSampleExplicitLod:
1363 case spv::OpImageSparseSampleDrefImplicitLod:
1364 case spv::OpImageSparseSampleDrefExplicitLod:
1365 case spv::OpImageSparseSampleProjImplicitLod:
1366 case spv::OpImageSparseSampleProjExplicitLod:
1367 case spv::OpImageSparseSampleProjDrefImplicitLod:
1368 case spv::OpImageSparseSampleProjDrefExplicitLod:
1369 case spv::OpImageSparseFetch:
1370 case spv::OpImageSparseGather:
1371 case spv::OpImageSparseDrefGather:
1372 case spv::OpImageTexelPointer:
1373 worklist.insert(insn.word(3)); // Image or sampled image
1374 break;
1375 case spv::OpImageWrite:
1376 worklist.insert(insn.word(1)); // Image -- different operand order to above
1377 break;
1378 case spv::OpFunctionCall:
1379 for (uint32_t i = 3; i < insn.len(); i++) {
1380 worklist.insert(insn.word(i)); // fn itself, and all args
1381 }
1382 break;
1383
1384 case spv::OpExtInst:
1385 for (uint32_t i = 5; i < insn.len(); i++) {
1386 worklist.insert(insn.word(i)); // Operands to ext inst
1387 }
1388 break;
1389 }
1390 }
1391 break;
1392 }
1393 }
1394
1395 return ids;
1396}
1397
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001398bool CoreChecks::ValidatePushConstantBlockAgainstPipeline(std::vector<VkPushConstantRange> const *push_constant_ranges,
1399 SHADER_MODULE_STATE const *src, spirv_inst_iter type,
1400 VkShaderStageFlagBits stage) const {
Chris Forbes47567b72017-06-09 12:09:45 -07001401 bool skip = false;
1402
1403 // Strip off ptrs etc
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06001404 type = GetStructType(src, type, false);
Chris Forbes47567b72017-06-09 12:09:45 -07001405 assert(type != src->end());
1406
1407 // Validate directly off the offsets. this isn't quite correct for arrays and matrices, but is a good first step.
1408 // TODO: arrays, matrices, weird sizes
1409 for (auto insn : *src) {
1410 if (insn.opcode() == spv::OpMemberDecorate && insn.word(1) == type.word(1)) {
1411 if (insn.word(3) == spv::DecorationOffset) {
Jeremy Hayesadf93862020-07-22 14:29:30 -06001412 auto const member = insn.word(2);
1413 auto const offset = insn.word(4);
1414 auto const size = 4; // Bytes; TODO: calculate this based on the type
Chris Forbes47567b72017-06-09 12:09:45 -07001415
1416 bool found_range = false;
1417 for (auto const &range : *push_constant_ranges) {
Jeremy Hayese883b362019-12-10 15:12:26 -07001418 if ((range.offset <= offset) && ((range.offset + range.size) >= (offset + size)) &&
1419 (range.stageFlags & stage)) {
Chris Forbes47567b72017-06-09 12:09:45 -07001420 found_range = true;
1421
Chris Forbes47567b72017-06-09 12:09:45 -07001422 break;
1423 }
1424 }
1425
1426 if (!found_range) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001427 skip |= LogError(device, kVUID_Core_Shader_PushConstantOutOfRange,
Jeremy Hayesadf93862020-07-22 14:29:30 -06001428 "Shader push-constant buffer member %u at offset %u is not declared in pipeline layout",
1429 member, offset);
Chris Forbes47567b72017-06-09 12:09:45 -07001430 }
1431 }
1432 }
1433 }
1434
1435 return skip;
1436}
1437
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001438bool CoreChecks::ValidatePushConstantUsage(std::vector<VkPushConstantRange> const *push_constant_ranges,
1439 SHADER_MODULE_STATE const *src, std::unordered_set<uint32_t> accessible_ids,
1440 VkShaderStageFlagBits stage) const {
Chris Forbes47567b72017-06-09 12:09:45 -07001441 bool skip = false;
1442
1443 for (auto id : accessible_ids) {
1444 auto def_insn = src->get_def(id);
1445 if (def_insn.opcode() == spv::OpVariable && def_insn.word(3) == spv::StorageClassPushConstant) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001446 skip |= ValidatePushConstantBlockAgainstPipeline(push_constant_ranges, src, src->get_def(def_insn.word(1)), stage);
Chris Forbes47567b72017-06-09 12:09:45 -07001447 }
1448 }
1449
1450 return skip;
1451}
1452
1453// Validate that data for each specialization entry is fully contained within the buffer.
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001454bool CoreChecks::ValidateSpecializationOffsets(VkPipelineShaderStageCreateInfo const *info) const {
Chris Forbes47567b72017-06-09 12:09:45 -07001455 bool skip = false;
1456
1457 VkSpecializationInfo const *spec = info->pSpecializationInfo;
1458
1459 if (spec) {
1460 for (auto i = 0u; i < spec->mapEntryCount; i++) {
Jeremy Hayes6c555c32019-09-09 17:14:09 -06001461 if (spec->pMapEntries[i].offset >= spec->dataSize) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001462 skip |= LogError(device, "VUID-VkSpecializationInfo-offset-00773",
1463 "Specialization entry %u (for constant id %u) references memory outside provided specialization "
1464 "data (bytes %u.." PRINTF_SIZE_T_SPECIFIER "; " PRINTF_SIZE_T_SPECIFIER " bytes provided)..",
1465 i, spec->pMapEntries[i].constantID, spec->pMapEntries[i].offset,
1466 spec->pMapEntries[i].offset + spec->dataSize - 1, spec->dataSize);
Jeremy Hayes6c555c32019-09-09 17:14:09 -06001467
1468 continue;
1469 }
Chris Forbes47567b72017-06-09 12:09:45 -07001470 if (spec->pMapEntries[i].offset + spec->pMapEntries[i].size > spec->dataSize) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001471 skip |= LogError(device, "VUID-VkSpecializationInfo-pMapEntries-00774",
1472 "Specialization entry %u (for constant id %u) references memory outside provided specialization "
1473 "data (bytes %u.." PRINTF_SIZE_T_SPECIFIER "; " PRINTF_SIZE_T_SPECIFIER " bytes provided)..",
1474 i, spec->pMapEntries[i].constantID, spec->pMapEntries[i].offset,
1475 spec->pMapEntries[i].offset + spec->pMapEntries[i].size - 1, spec->dataSize);
Chris Forbes47567b72017-06-09 12:09:45 -07001476 }
1477 }
1478 }
1479
1480 return skip;
1481}
1482
Jeff Bolz38b3ce72018-09-19 12:53:38 -05001483// TODO (jbolz): Can this return a const reference?
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06001484static std::set<uint32_t> TypeToDescriptorTypeSet(SHADER_MODULE_STATE const *module, uint32_t type_id, unsigned &descriptor_count) {
Chris Forbes47567b72017-06-09 12:09:45 -07001485 auto type = module->get_def(type_id);
Chris Forbes9f89d752018-03-07 12:57:48 -08001486 bool is_storage_buffer = false;
Chris Forbes47567b72017-06-09 12:09:45 -07001487 descriptor_count = 1;
Jeff Bolze54ae892018-09-08 12:16:29 -05001488 std::set<uint32_t> ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001489
1490 // Strip off any array or ptrs. Where we remove array levels, adjust the descriptor count for each dimension.
Jeff Bolzfdf96072018-04-10 14:32:18 -05001491 while (type.opcode() == spv::OpTypeArray || type.opcode() == spv::OpTypePointer || type.opcode() == spv::OpTypeRuntimeArray) {
1492 if (type.opcode() == spv::OpTypeRuntimeArray) {
1493 descriptor_count = 0;
1494 type = module->get_def(type.word(2));
1495 } else if (type.opcode() == spv::OpTypeArray) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06001496 descriptor_count *= GetConstantValue(module, type.word(3));
Chris Forbes47567b72017-06-09 12:09:45 -07001497 type = module->get_def(type.word(2));
1498 } else {
Chris Forbes9f89d752018-03-07 12:57:48 -08001499 if (type.word(2) == spv::StorageClassStorageBuffer) {
1500 is_storage_buffer = true;
1501 }
Chris Forbes47567b72017-06-09 12:09:45 -07001502 type = module->get_def(type.word(3));
1503 }
1504 }
1505
1506 switch (type.opcode()) {
1507 case spv::OpTypeStruct: {
1508 for (auto insn : *module) {
1509 if (insn.opcode() == spv::OpDecorate && insn.word(1) == type.word(1)) {
1510 if (insn.word(2) == spv::DecorationBlock) {
Chris Forbes9f89d752018-03-07 12:57:48 -08001511 if (is_storage_buffer) {
Jeff Bolze54ae892018-09-08 12:16:29 -05001512 ret.insert(VK_DESCRIPTOR_TYPE_STORAGE_BUFFER);
1513 ret.insert(VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC);
1514 return ret;
Chris Forbes9f89d752018-03-07 12:57:48 -08001515 } else {
Jeff Bolze54ae892018-09-08 12:16:29 -05001516 ret.insert(VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER);
1517 ret.insert(VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC);
1518 ret.insert(VK_DESCRIPTOR_TYPE_INLINE_UNIFORM_BLOCK_EXT);
1519 return ret;
Chris Forbes9f89d752018-03-07 12:57:48 -08001520 }
Chris Forbes47567b72017-06-09 12:09:45 -07001521 } else if (insn.word(2) == spv::DecorationBufferBlock) {
Jeff Bolze54ae892018-09-08 12:16:29 -05001522 ret.insert(VK_DESCRIPTOR_TYPE_STORAGE_BUFFER);
1523 ret.insert(VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC);
1524 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001525 }
1526 }
1527 }
1528
1529 // Invalid
Jeff Bolze54ae892018-09-08 12:16:29 -05001530 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001531 }
1532
1533 case spv::OpTypeSampler:
Jeff Bolze54ae892018-09-08 12:16:29 -05001534 ret.insert(VK_DESCRIPTOR_TYPE_SAMPLER);
1535 ret.insert(VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER);
1536 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001537
Chris Forbes73c00bf2018-06-22 16:28:06 -07001538 case spv::OpTypeSampledImage: {
1539 // Slight relaxation for some GLSL historical madness: samplerBuffer doesn't really have a sampler, and a texel
1540 // buffer descriptor doesn't really provide one. Allow this slight mismatch.
1541 auto image_type = module->get_def(type.word(2));
1542 auto dim = image_type.word(3);
1543 auto sampled = image_type.word(7);
1544 if (dim == spv::DimBuffer && sampled == 1) {
Jeff Bolze54ae892018-09-08 12:16:29 -05001545 ret.insert(VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER);
1546 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001547 }
Chris Forbes73c00bf2018-06-22 16:28:06 -07001548 }
Jeff Bolze54ae892018-09-08 12:16:29 -05001549 ret.insert(VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER);
1550 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001551
1552 case spv::OpTypeImage: {
1553 // Many descriptor types backing image types-- depends on dimension and whether the image will be used with a sampler.
1554 // SPIRV for Vulkan requires that sampled be 1 or 2 -- leaving the decision to runtime is unacceptable.
1555 auto dim = type.word(3);
1556 auto sampled = type.word(7);
1557
1558 if (dim == spv::DimSubpassData) {
Jeff Bolze54ae892018-09-08 12:16:29 -05001559 ret.insert(VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT);
1560 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001561 } else if (dim == spv::DimBuffer) {
1562 if (sampled == 1) {
Jeff Bolze54ae892018-09-08 12:16:29 -05001563 ret.insert(VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER);
1564 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001565 } else {
Jeff Bolze54ae892018-09-08 12:16:29 -05001566 ret.insert(VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER);
1567 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001568 }
1569 } else if (sampled == 1) {
Jeff Bolze54ae892018-09-08 12:16:29 -05001570 ret.insert(VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE);
1571 ret.insert(VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER);
1572 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001573 } else {
Jeff Bolze54ae892018-09-08 12:16:29 -05001574 ret.insert(VK_DESCRIPTOR_TYPE_STORAGE_IMAGE);
1575 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001576 }
1577 }
Shannon McPherson0fa28232018-11-01 11:59:02 -06001578 case spv::OpTypeAccelerationStructureNV:
Eric Werness30127fd2018-10-31 21:01:03 -07001579 ret.insert(VK_DESCRIPTOR_TYPE_ACCELERATION_STRUCTURE_NV);
Jeff Bolz105d6492018-09-29 15:46:44 -05001580 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001581
1582 // We shouldn't really see any other junk types -- but if we do, they're a mismatch.
1583 default:
Jeff Bolze54ae892018-09-08 12:16:29 -05001584 return ret; // Matches nothing
Chris Forbes47567b72017-06-09 12:09:45 -07001585 }
1586}
1587
Jeff Bolze54ae892018-09-08 12:16:29 -05001588static std::string string_descriptorTypes(const std::set<uint32_t> &descriptor_types) {
Chris Forbes73c00bf2018-06-22 16:28:06 -07001589 std::stringstream ss;
Jeff Bolze54ae892018-09-08 12:16:29 -05001590 for (auto it = descriptor_types.begin(); it != descriptor_types.end(); ++it) {
1591 if (ss.tellp()) ss << ", ";
1592 ss << string_VkDescriptorType(VkDescriptorType(*it));
Chris Forbes73c00bf2018-06-22 16:28:06 -07001593 }
1594 return ss.str();
1595}
1596
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001597bool CoreChecks::RequirePropertyFlag(VkBool32 check, char const *flag, char const *structure) const {
Jeff Bolzee743412019-06-20 22:24:32 -05001598 if (!check) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001599 if (LogError(device, kVUID_Core_Shader_ExceedDeviceLimit,
1600 "Shader requires flag %s set in %s but it is not set on the device", flag, structure)) {
Jeff Bolzee743412019-06-20 22:24:32 -05001601 return true;
1602 }
1603 }
1604
1605 return false;
1606}
1607
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001608bool CoreChecks::RequireFeature(VkBool32 feature, char const *feature_name) const {
Chris Forbes47567b72017-06-09 12:09:45 -07001609 if (!feature) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001610 if (LogError(device, kVUID_Core_Shader_FeatureNotEnabled, "Shader requires %s but is not enabled on the device",
1611 feature_name)) {
Chris Forbes47567b72017-06-09 12:09:45 -07001612 return true;
1613 }
1614 }
1615
1616 return false;
1617}
1618
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001619bool CoreChecks::RequireExtension(bool extension, char const *extension_name) const {
Chris Forbes47567b72017-06-09 12:09:45 -07001620 if (!extension) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001621 if (LogError(device, kVUID_Core_Shader_FeatureNotEnabled, "Shader requires extension %s but is not enabled on the device",
1622 extension_name)) {
Chris Forbes47567b72017-06-09 12:09:45 -07001623 return true;
1624 }
1625 }
1626
1627 return false;
1628}
1629
John Zulaufac4c6e12019-07-01 16:05:58 -06001630bool CoreChecks::ValidateShaderCapabilities(SHADER_MODULE_STATE const *src, VkShaderStageFlagBits stage) const {
Chris Forbes47567b72017-06-09 12:09:45 -07001631 bool skip = false;
1632
Mike Schuchardt8ed5ea02018-07-20 18:24:17 -06001633 struct FeaturePointer {
1634 // Callable object to test if this feature is enabled in the given aggregate feature struct
1635 const std::function<VkBool32(const DeviceFeatures &)> IsEnabled;
1636
1637 // Test if feature pointer is populated
1638 explicit operator bool() const { return static_cast<bool>(IsEnabled); }
1639
1640 // Default and nullptr constructor to create an empty FeaturePointer
1641 FeaturePointer() : IsEnabled(nullptr) {}
1642 FeaturePointer(std::nullptr_t ptr) : IsEnabled(nullptr) {}
1643
1644 // Constructors to populate FeaturePointer based on given pointer to member
1645 FeaturePointer(VkBool32 VkPhysicalDeviceFeatures::*ptr)
1646 : IsEnabled([=](const DeviceFeatures &features) { return features.core.*ptr; }) {}
Piers Daniell41b8c5d2020-01-10 15:42:00 -07001647 FeaturePointer(VkBool32 VkPhysicalDeviceVulkan11Features::*ptr)
1648 : IsEnabled([=](const DeviceFeatures &features) { return features.core11.*ptr; }) {}
1649 FeaturePointer(VkBool32 VkPhysicalDeviceVulkan12Features::*ptr)
1650 : IsEnabled([=](const DeviceFeatures &features) { return features.core12.*ptr; }) {}
Brett Lawsonbebfb6f2018-10-23 16:58:50 -07001651 FeaturePointer(VkBool32 VkPhysicalDeviceTransformFeedbackFeaturesEXT::*ptr)
1652 : IsEnabled([=](const DeviceFeatures &features) { return features.transform_feedback_features.*ptr; }) {}
Jeff Bolze4356752019-03-07 11:23:46 -06001653 FeaturePointer(VkBool32 VkPhysicalDeviceCooperativeMatrixFeaturesNV::*ptr)
1654 : IsEnabled([=](const DeviceFeatures &features) { return features.cooperative_matrix_features.*ptr; }) {}
Jason Macnakc5a621d2019-06-10 12:42:50 -07001655 FeaturePointer(VkBool32 VkPhysicalDeviceComputeShaderDerivativesFeaturesNV::*ptr)
1656 : IsEnabled([=](const DeviceFeatures &features) { return features.compute_shader_derivatives_features.*ptr; }) {}
Jason Macnak325e8b52019-06-10 13:33:10 -07001657 FeaturePointer(VkBool32 VkPhysicalDeviceFragmentShaderBarycentricFeaturesNV::*ptr)
1658 : IsEnabled([=](const DeviceFeatures &features) { return features.fragment_shader_barycentric_features.*ptr; }) {}
Jason Macnakd7fddf82019-06-13 09:52:49 -07001659 FeaturePointer(VkBool32 VkPhysicalDeviceShaderImageFootprintFeaturesNV::*ptr)
1660 : IsEnabled([=](const DeviceFeatures &features) { return features.shader_image_footprint_features.*ptr; }) {}
Jeff Bolz38f6cb52019-06-30 16:26:44 -05001661 FeaturePointer(VkBool32 VkPhysicalDeviceFragmentShaderInterlockFeaturesEXT::*ptr)
1662 : IsEnabled([=](const DeviceFeatures &features) { return features.fragment_shader_interlock_features.*ptr; }) {}
Jeff Bolza38fd3b2019-07-21 11:42:11 -05001663 FeaturePointer(VkBool32 VkPhysicalDeviceShaderDemoteToHelperInvocationFeaturesEXT::*ptr)
1664 : IsEnabled([=](const DeviceFeatures &features) { return features.demote_to_helper_invocation_features.*ptr; }) {}
Jeff Bolz443c2ca2020-03-19 12:11:51 -05001665 FeaturePointer(VkBool32 VkPhysicalDeviceRayTracingFeaturesKHR::*ptr)
1666 : IsEnabled([=](const DeviceFeatures &features) { return features.ray_tracing_features.*ptr; }) {}
Mike Schuchardt8ed5ea02018-07-20 18:24:17 -06001667 };
1668
Chris Forbes47567b72017-06-09 12:09:45 -07001669 struct CapabilityInfo {
1670 char const *name;
Mike Schuchardt8ed5ea02018-07-20 18:24:17 -06001671 FeaturePointer feature;
Tony-LunarG2ec96bb2019-11-26 13:43:02 -07001672 ExtEnabled DeviceExtensions::*extension;
Chris Forbes47567b72017-06-09 12:09:45 -07001673 };
1674
Chris Forbes47567b72017-06-09 12:09:45 -07001675 // clang-format off
Dave Houltoneb10ea82017-12-22 12:21:50 -07001676 static const std::unordered_multimap<uint32_t, CapabilityInfo> capabilities = {
Chris Forbes47567b72017-06-09 12:09:45 -07001677 // Capabilities always supported by a Vulkan 1.0 implementation -- no
1678 // feature bits.
1679 {spv::CapabilityMatrix, {nullptr}},
1680 {spv::CapabilityShader, {nullptr}},
1681 {spv::CapabilityInputAttachment, {nullptr}},
1682 {spv::CapabilitySampled1D, {nullptr}},
1683 {spv::CapabilityImage1D, {nullptr}},
1684 {spv::CapabilitySampledBuffer, {nullptr}},
Toni Merilehtib13a4a22019-05-21 12:58:44 +03001685 {spv::CapabilityStorageImageExtendedFormats, {nullptr}},
Chris Forbes47567b72017-06-09 12:09:45 -07001686 {spv::CapabilityImageQuery, {nullptr}},
1687 {spv::CapabilityDerivativeControl, {nullptr}},
1688
1689 // Capabilities that are optionally supported, but require a feature to
1690 // be enabled on the device
Mike Schuchardt8ed5ea02018-07-20 18:24:17 -06001691 {spv::CapabilityGeometry, {"VkPhysicalDeviceFeatures::geometryShader", &VkPhysicalDeviceFeatures::geometryShader}},
1692 {spv::CapabilityTessellation, {"VkPhysicalDeviceFeatures::tessellationShader", &VkPhysicalDeviceFeatures::tessellationShader}},
1693 {spv::CapabilityFloat64, {"VkPhysicalDeviceFeatures::shaderFloat64", &VkPhysicalDeviceFeatures::shaderFloat64}},
1694 {spv::CapabilityInt64, {"VkPhysicalDeviceFeatures::shaderInt64", &VkPhysicalDeviceFeatures::shaderInt64}},
1695 {spv::CapabilityTessellationPointSize, {"VkPhysicalDeviceFeatures::shaderTessellationAndGeometryPointSize", &VkPhysicalDeviceFeatures::shaderTessellationAndGeometryPointSize}},
1696 {spv::CapabilityGeometryPointSize, {"VkPhysicalDeviceFeatures::shaderTessellationAndGeometryPointSize", &VkPhysicalDeviceFeatures::shaderTessellationAndGeometryPointSize}},
1697 {spv::CapabilityImageGatherExtended, {"VkPhysicalDeviceFeatures::shaderImageGatherExtended", &VkPhysicalDeviceFeatures::shaderImageGatherExtended}},
1698 {spv::CapabilityStorageImageMultisample, {"VkPhysicalDeviceFeatures::shaderStorageImageMultisample", &VkPhysicalDeviceFeatures::shaderStorageImageMultisample}},
1699 {spv::CapabilityUniformBufferArrayDynamicIndexing, {"VkPhysicalDeviceFeatures::shaderUniformBufferArrayDynamicIndexing", &VkPhysicalDeviceFeatures::shaderUniformBufferArrayDynamicIndexing}},
1700 {spv::CapabilitySampledImageArrayDynamicIndexing, {"VkPhysicalDeviceFeatures::shaderSampledImageArrayDynamicIndexing", &VkPhysicalDeviceFeatures::shaderSampledImageArrayDynamicIndexing}},
1701 {spv::CapabilityStorageBufferArrayDynamicIndexing, {"VkPhysicalDeviceFeatures::shaderStorageBufferArrayDynamicIndexing", &VkPhysicalDeviceFeatures::shaderStorageBufferArrayDynamicIndexing}},
1702 {spv::CapabilityStorageImageArrayDynamicIndexing, {"VkPhysicalDeviceFeatures::shaderStorageImageArrayDynamicIndexing", &VkPhysicalDeviceFeatures::shaderStorageBufferArrayDynamicIndexing}},
1703 {spv::CapabilityClipDistance, {"VkPhysicalDeviceFeatures::shaderClipDistance", &VkPhysicalDeviceFeatures::shaderClipDistance}},
1704 {spv::CapabilityCullDistance, {"VkPhysicalDeviceFeatures::shaderCullDistance", &VkPhysicalDeviceFeatures::shaderCullDistance}},
1705 {spv::CapabilityImageCubeArray, {"VkPhysicalDeviceFeatures::imageCubeArray", &VkPhysicalDeviceFeatures::imageCubeArray}},
1706 {spv::CapabilitySampleRateShading, {"VkPhysicalDeviceFeatures::sampleRateShading", &VkPhysicalDeviceFeatures::sampleRateShading}},
1707 {spv::CapabilitySparseResidency, {"VkPhysicalDeviceFeatures::shaderResourceResidency", &VkPhysicalDeviceFeatures::shaderResourceResidency}},
1708 {spv::CapabilityMinLod, {"VkPhysicalDeviceFeatures::shaderResourceMinLod", &VkPhysicalDeviceFeatures::shaderResourceMinLod}},
1709 {spv::CapabilitySampledCubeArray, {"VkPhysicalDeviceFeatures::imageCubeArray", &VkPhysicalDeviceFeatures::imageCubeArray}},
1710 {spv::CapabilityImageMSArray, {"VkPhysicalDeviceFeatures::shaderStorageImageMultisample", &VkPhysicalDeviceFeatures::shaderStorageImageMultisample}},
Mike Schuchardt8ed5ea02018-07-20 18:24:17 -06001711 {spv::CapabilityInterpolationFunction, {"VkPhysicalDeviceFeatures::sampleRateShading", &VkPhysicalDeviceFeatures::sampleRateShading}},
1712 {spv::CapabilityStorageImageReadWithoutFormat, {"VkPhysicalDeviceFeatures::shaderStorageImageReadWithoutFormat", &VkPhysicalDeviceFeatures::shaderStorageImageReadWithoutFormat}},
1713 {spv::CapabilityStorageImageWriteWithoutFormat, {"VkPhysicalDeviceFeatures::shaderStorageImageWriteWithoutFormat", &VkPhysicalDeviceFeatures::shaderStorageImageWriteWithoutFormat}},
1714 {spv::CapabilityMultiViewport, {"VkPhysicalDeviceFeatures::multiViewport", &VkPhysicalDeviceFeatures::multiViewport}},
Jeff Bolzfdf96072018-04-10 14:32:18 -05001715
Mike Schuchardt8ed5ea02018-07-20 18:24:17 -06001716 {spv::CapabilityShaderNonUniformEXT, {VK_EXT_DESCRIPTOR_INDEXING_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_ext_descriptor_indexing}},
Piers Daniell41b8c5d2020-01-10 15:42:00 -07001717 {spv::CapabilityRuntimeDescriptorArrayEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::runtimeDescriptorArray", &VkPhysicalDeviceVulkan12Features::runtimeDescriptorArray}},
1718 {spv::CapabilityInputAttachmentArrayDynamicIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderInputAttachmentArrayDynamicIndexing", &VkPhysicalDeviceVulkan12Features::shaderInputAttachmentArrayDynamicIndexing}},
1719 {spv::CapabilityUniformTexelBufferArrayDynamicIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderUniformTexelBufferArrayDynamicIndexing", &VkPhysicalDeviceVulkan12Features::shaderUniformTexelBufferArrayDynamicIndexing}},
1720 {spv::CapabilityStorageTexelBufferArrayDynamicIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderStorageTexelBufferArrayDynamicIndexing", &VkPhysicalDeviceVulkan12Features::shaderStorageTexelBufferArrayDynamicIndexing}},
1721 {spv::CapabilityUniformBufferArrayNonUniformIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderUniformBufferArrayNonUniformIndexing", &VkPhysicalDeviceVulkan12Features::shaderUniformBufferArrayNonUniformIndexing}},
1722 {spv::CapabilitySampledImageArrayNonUniformIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderSampledImageArrayNonUniformIndexing", &VkPhysicalDeviceVulkan12Features::shaderSampledImageArrayNonUniformIndexing}},
1723 {spv::CapabilityStorageBufferArrayNonUniformIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderStorageBufferArrayNonUniformIndexing", &VkPhysicalDeviceVulkan12Features::shaderStorageBufferArrayNonUniformIndexing}},
1724 {spv::CapabilityStorageImageArrayNonUniformIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderStorageImageArrayNonUniformIndexing", &VkPhysicalDeviceVulkan12Features::shaderStorageImageArrayNonUniformIndexing}},
1725 {spv::CapabilityInputAttachmentArrayNonUniformIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderInputAttachmentArrayNonUniformIndexing", &VkPhysicalDeviceVulkan12Features::shaderInputAttachmentArrayNonUniformIndexing}},
1726 {spv::CapabilityUniformTexelBufferArrayNonUniformIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderUniformTexelBufferArrayNonUniformIndexing", &VkPhysicalDeviceVulkan12Features::shaderUniformTexelBufferArrayNonUniformIndexing}},
1727 {spv::CapabilityStorageTexelBufferArrayNonUniformIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderStorageTexelBufferArrayNonUniformIndexing", &VkPhysicalDeviceVulkan12Features::shaderStorageTexelBufferArrayNonUniformIndexing}},
Chris Forbes47567b72017-06-09 12:09:45 -07001728
1729 // Capabilities that require an extension
Mike Schuchardt8ed5ea02018-07-20 18:24:17 -06001730 {spv::CapabilityDrawParameters, {VK_KHR_SHADER_DRAW_PARAMETERS_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_khr_shader_draw_parameters}},
1731 {spv::CapabilityGeometryShaderPassthroughNV, {VK_NV_GEOMETRY_SHADER_PASSTHROUGH_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_nv_geometry_shader_passthrough}},
1732 {spv::CapabilitySampleMaskOverrideCoverageNV, {VK_NV_SAMPLE_MASK_OVERRIDE_COVERAGE_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_nv_sample_mask_override_coverage}},
1733 {spv::CapabilityShaderViewportIndexLayerEXT, {VK_EXT_SHADER_VIEWPORT_INDEX_LAYER_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_ext_shader_viewport_index_layer}},
1734 {spv::CapabilityShaderViewportIndexLayerNV, {VK_NV_VIEWPORT_ARRAY2_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_nv_viewport_array2}},
1735 {spv::CapabilityShaderViewportMaskNV, {VK_NV_VIEWPORT_ARRAY2_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_nv_viewport_array2}},
1736 {spv::CapabilitySubgroupBallotKHR, {VK_EXT_SHADER_SUBGROUP_BALLOT_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_ext_shader_subgroup_ballot }},
1737 {spv::CapabilitySubgroupVoteKHR, {VK_EXT_SHADER_SUBGROUP_VOTE_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_ext_shader_subgroup_vote }},
Jason Macnakb7d091c2019-06-10 11:13:11 -07001738 {spv::CapabilityGroupNonUniformPartitionedNV, {VK_NV_SHADER_SUBGROUP_PARTITIONED_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_nv_shader_subgroup_partitioned}},
aqnuep7033c702018-09-11 18:03:29 +02001739 {spv::CapabilityInt64Atomics, {VK_KHR_SHADER_ATOMIC_INT64_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_khr_shader_atomic_int64 }},
amhaganfa0b34d2019-10-15 16:03:53 -04001740 {spv::CapabilityShaderClockKHR, {VK_KHR_SHADER_CLOCK_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_khr_shader_clock }},
Alexander Galazin3bd8e342018-06-14 15:49:07 +02001741
Jason Macnakc5a621d2019-06-10 12:42:50 -07001742 {spv::CapabilityComputeDerivativeGroupQuadsNV, {"VkPhysicalDeviceComputeShaderDerivativesFeaturesNV::computeDerivativeGroupQuads", &VkPhysicalDeviceComputeShaderDerivativesFeaturesNV::computeDerivativeGroupQuads, &DeviceExtensions::vk_nv_compute_shader_derivatives}},
1743 {spv::CapabilityComputeDerivativeGroupLinearNV, {"VkPhysicalDeviceComputeShaderDerivativesFeaturesNV::computeDerivativeGroupLinear", &VkPhysicalDeviceComputeShaderDerivativesFeaturesNV::computeDerivativeGroupLinear, &DeviceExtensions::vk_nv_compute_shader_derivatives}},
Jason Macnakf7019582019-06-13 10:07:26 -07001744 {spv::CapabilityFragmentBarycentricNV, {"VkPhysicalDeviceFragmentShaderBarycentricFeaturesNV::fragmentShaderBarycentric", &VkPhysicalDeviceFragmentShaderBarycentricFeaturesNV::fragmentShaderBarycentric, &DeviceExtensions::vk_nv_fragment_shader_barycentric}},
Jason Macnakc5a621d2019-06-10 12:42:50 -07001745
Piers Daniell41b8c5d2020-01-10 15:42:00 -07001746 {spv::CapabilityStorageBuffer8BitAccess, {"VkPhysicalDevice8BitStorageFeaturesKHR::storageBuffer8BitAccess", &VkPhysicalDeviceVulkan12Features::storageBuffer8BitAccess, &DeviceExtensions::vk_khr_8bit_storage}},
1747 {spv::CapabilityUniformAndStorageBuffer8BitAccess, {"VkPhysicalDevice8BitStorageFeaturesKHR::uniformAndStorageBuffer8BitAccess", &VkPhysicalDeviceVulkan12Features::uniformAndStorageBuffer8BitAccess, &DeviceExtensions::vk_khr_8bit_storage}},
1748 {spv::CapabilityStoragePushConstant8, {"VkPhysicalDevice8BitStorageFeaturesKHR::storagePushConstant8", &VkPhysicalDeviceVulkan12Features::storagePushConstant8, &DeviceExtensions::vk_khr_8bit_storage}},
Brett Lawsonbebfb6f2018-10-23 16:58:50 -07001749
Jason Macnakf7019582019-06-13 10:07:26 -07001750 {spv::CapabilityTransformFeedback, { "VkPhysicalDeviceTransformFeedbackFeaturesEXT::transformFeedback", &VkPhysicalDeviceTransformFeedbackFeaturesEXT::transformFeedback, &DeviceExtensions::vk_ext_transform_feedback}},
1751 {spv::CapabilityGeometryStreams, { "VkPhysicalDeviceTransformFeedbackFeaturesEXT::geometryStreams", &VkPhysicalDeviceTransformFeedbackFeaturesEXT::geometryStreams, &DeviceExtensions::vk_ext_transform_feedback}},
Jose-Emilio Munoz-Lopez1109b452018-08-21 09:44:07 +01001752
Piers Daniell41b8c5d2020-01-10 15:42:00 -07001753 {spv::CapabilityFloat16, {"VkPhysicalDeviceFloat16Int8FeaturesKHR::shaderFloat16", &VkPhysicalDeviceVulkan12Features::shaderFloat16, &DeviceExtensions::vk_khr_shader_float16_int8}},
1754 {spv::CapabilityInt8, {"VkPhysicalDeviceFloat16Int8FeaturesKHR::shaderInt8", &VkPhysicalDeviceVulkan12Features::shaderInt8, &DeviceExtensions::vk_khr_shader_float16_int8}},
Jeff Bolze4356752019-03-07 11:23:46 -06001755
Jason Macnakd7fddf82019-06-13 09:52:49 -07001756 {spv::CapabilityImageFootprintNV, {"VkPhysicalDeviceShaderImageFootprintFeaturesNV::imageFootprint", &VkPhysicalDeviceShaderImageFootprintFeaturesNV::imageFootprint, &DeviceExtensions::vk_nv_shader_image_footprint}},
1757
Jeff Bolze4356752019-03-07 11:23:46 -06001758 {spv::CapabilityCooperativeMatrixNV, {"VkPhysicalDeviceCooperativeMatrixFeaturesNV::cooperativeMatrix", &VkPhysicalDeviceCooperativeMatrixFeaturesNV::cooperativeMatrix, &DeviceExtensions::vk_nv_cooperative_matrix}},
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00001759
Graeme Leese41e6b842019-08-02 10:49:14 +01001760 {spv::CapabilitySignedZeroInfNanPreserve, {"VkPhysicalDeviceFloatControlsPropertiesKHR::shaderSignedZeroInfNanPreserve", nullptr, &DeviceExtensions::vk_khr_shader_float_controls}},
1761 {spv::CapabilityDenormPreserve, {"VkPhysicalDeviceFloatControlsPropertiesKHR::shaderDenormPreserve", nullptr, &DeviceExtensions::vk_khr_shader_float_controls}},
1762 {spv::CapabilityDenormFlushToZero, {"VkPhysicalDeviceFloatControlsPropertiesKHR::shaderDenormFlushToZero", nullptr, &DeviceExtensions::vk_khr_shader_float_controls}},
1763 {spv::CapabilityRoundingModeRTE, {"VkPhysicalDeviceFloatControlsPropertiesKHR::shaderRoundingModeRTE", nullptr, &DeviceExtensions::vk_khr_shader_float_controls}},
1764 {spv::CapabilityRoundingModeRTZ, {"VkPhysicalDeviceFloatControlsPropertiesKHR::shaderRoundingModeRTZ", nullptr, &DeviceExtensions::vk_khr_shader_float_controls}},
Jeff Bolz38f6cb52019-06-30 16:26:44 -05001765
1766 {spv::CapabilityFragmentShaderSampleInterlockEXT, {"VkPhysicalDeviceFragmentShaderInterlockFeaturesEXT::fragmentShaderSampleInterlock", &VkPhysicalDeviceFragmentShaderInterlockFeaturesEXT::fragmentShaderSampleInterlock, &DeviceExtensions::vk_ext_fragment_shader_interlock}},
1767 {spv::CapabilityFragmentShaderPixelInterlockEXT, {"VkPhysicalDeviceFragmentShaderInterlockFeaturesEXT::fragmentShaderPixelInterlock", &VkPhysicalDeviceFragmentShaderInterlockFeaturesEXT::fragmentShaderPixelInterlock, &DeviceExtensions::vk_ext_fragment_shader_interlock}},
1768 {spv::CapabilityFragmentShaderShadingRateInterlockEXT, {"VkPhysicalDeviceFragmentShaderInterlockFeaturesEXT::fragmentShaderShadingRateInterlock", &VkPhysicalDeviceFragmentShaderInterlockFeaturesEXT::fragmentShaderShadingRateInterlock, &DeviceExtensions::vk_ext_fragment_shader_interlock}},
Jeff Bolza38fd3b2019-07-21 11:42:11 -05001769 {spv::CapabilityDemoteToHelperInvocationEXT, {"VkPhysicalDeviceShaderDemoteToHelperInvocationFeaturesEXT::shaderDemoteToHelperInvocation", &VkPhysicalDeviceShaderDemoteToHelperInvocationFeaturesEXT::shaderDemoteToHelperInvocation, &DeviceExtensions::vk_ext_shader_demote_to_helper_invocation}},
Jeff Bolz4563f2a2019-12-10 13:30:30 -06001770
Piers Daniell41b8c5d2020-01-10 15:42:00 -07001771 {spv::CapabilityPhysicalStorageBufferAddresses, {"VkPhysicalDeviceBufferDeviceAddressFeatures::bufferDeviceAddress", &VkPhysicalDeviceVulkan12Features::bufferDeviceAddress, &DeviceExtensions::vk_ext_buffer_device_address}},
Jeff Bolz4563f2a2019-12-10 13:30:30 -06001772 // Should be non-EXT token, but Android SPIRV-Headers are out of date, and the token value is the same anyway
Piers Daniell41b8c5d2020-01-10 15:42:00 -07001773 {spv::CapabilityPhysicalStorageBufferAddressesEXT, {"VkPhysicalDeviceBufferDeviceAddressFeaturesEXT::bufferDeviceAddress", &VkPhysicalDeviceVulkan12Features::bufferDeviceAddress, &DeviceExtensions::vk_khr_buffer_device_address}},
Jeff Bolz443c2ca2020-03-19 12:11:51 -05001774
1775 {spv::CapabilityRayTracingProvisionalKHR, {"VkPhysicalDeviceRayTracingFeaturesKHR::rayTracing", &VkPhysicalDeviceRayTracingFeaturesKHR::rayTracing, &DeviceExtensions::vk_khr_ray_tracing}},
1776 {spv::CapabilityRayQueryProvisionalKHR, {"VkPhysicalDeviceRayTracingFeaturesKHR::rayQuery", &VkPhysicalDeviceRayTracingFeaturesKHR::rayQuery, &DeviceExtensions::vk_khr_ray_tracing}},
1777 {spv::CapabilityRayTraversalPrimitiveCullingProvisionalKHR, {"VkPhysicalDeviceRayTracingFeaturesKHR::rayTracingPrimitiveCulling", &VkPhysicalDeviceRayTracingFeaturesKHR::rayTracingPrimitiveCulling, &DeviceExtensions::vk_khr_ray_tracing}},
Chris Forbes47567b72017-06-09 12:09:45 -07001778 };
1779 // clang-format on
1780
1781 for (auto insn : *src) {
1782 if (insn.opcode() == spv::OpCapability) {
Dave Houltoneb10ea82017-12-22 12:21:50 -07001783 size_t n = capabilities.count(insn.word(1));
1784 if (1 == n) { // key occurs exactly once
1785 auto it = capabilities.find(insn.word(1));
1786 if (it != capabilities.end()) {
1787 if (it->second.feature) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001788 skip |= RequireFeature(it->second.feature.IsEnabled(enabled_features), it->second.name);
Dave Houltoneb10ea82017-12-22 12:21:50 -07001789 }
1790 if (it->second.extension) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001791 skip |= RequireExtension(IsExtEnabled((device_extensions.*(it->second.extension))), it->second.name);
Dave Houltoneb10ea82017-12-22 12:21:50 -07001792 }
Chris Forbes47567b72017-06-09 12:09:45 -07001793 }
Dave Houltoneb10ea82017-12-22 12:21:50 -07001794 } else if (1 < n) { // key occurs multiple times, at least one must be enabled
1795 bool needs_feature = false, has_feature = false;
1796 bool needs_ext = false, has_ext = false;
1797 std::string feature_names = "(one of) [ ";
1798 std::string extension_names = feature_names;
1799 auto caps = capabilities.equal_range(insn.word(1));
1800 for (auto it = caps.first; it != caps.second; ++it) {
1801 if (it->second.feature) {
1802 needs_feature = true;
Mark Lobodzinskid7b03cc2019-04-19 14:23:10 -06001803 has_feature = has_feature || it->second.feature.IsEnabled(enabled_features);
Dave Houltoneb10ea82017-12-22 12:21:50 -07001804 feature_names += it->second.name;
1805 feature_names += " ";
1806 }
1807 if (it->second.extension) {
1808 needs_ext = true;
Mark Lobodzinskif45e45f2019-04-19 14:15:39 -06001809 has_ext = has_ext || device_extensions.*(it->second.extension);
Dave Houltoneb10ea82017-12-22 12:21:50 -07001810 extension_names += it->second.name;
1811 extension_names += " ";
1812 }
1813 }
1814 if (needs_feature) {
1815 feature_names += "]";
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001816 skip |= RequireFeature(has_feature, feature_names.c_str());
Dave Houltoneb10ea82017-12-22 12:21:50 -07001817 }
1818 if (needs_ext) {
1819 extension_names += "]";
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001820 skip |= RequireExtension(has_ext, extension_names.c_str());
Chris Forbes47567b72017-06-09 12:09:45 -07001821 }
Graeme Leesec82dbe02019-08-02 10:44:21 +01001822 }
1823
1824 { // Do group non-uniform checks
Piers Daniell41b8c5d2020-01-10 15:42:00 -07001825 const VkSubgroupFeatureFlags supportedOperations = phys_dev_props_core11.subgroupSupportedOperations;
1826 const VkSubgroupFeatureFlags supportedStages = phys_dev_props_core11.subgroupSupportedStages;
Jeff Bolzee743412019-06-20 22:24:32 -05001827
1828 switch (insn.word(1)) {
1829 default:
1830 break;
1831 case spv::CapabilityGroupNonUniform:
1832 case spv::CapabilityGroupNonUniformVote:
1833 case spv::CapabilityGroupNonUniformArithmetic:
1834 case spv::CapabilityGroupNonUniformBallot:
1835 case spv::CapabilityGroupNonUniformShuffle:
1836 case spv::CapabilityGroupNonUniformShuffleRelative:
1837 case spv::CapabilityGroupNonUniformClustered:
1838 case spv::CapabilityGroupNonUniformQuad:
1839 case spv::CapabilityGroupNonUniformPartitionedNV:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001840 RequirePropertyFlag(supportedStages & stage, string_VkShaderStageFlagBits(stage),
Jeff Bolzee743412019-06-20 22:24:32 -05001841 "VkPhysicalDeviceSubgroupProperties::supportedStages");
1842 break;
1843 }
1844
1845 switch (insn.word(1)) {
1846 default:
1847 break;
1848 case spv::CapabilityGroupNonUniform:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001849 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_BASIC_BIT, "VK_SUBGROUP_FEATURE_BASIC_BIT",
Jeff Bolzee743412019-06-20 22:24:32 -05001850 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
1851 break;
1852 case spv::CapabilityGroupNonUniformVote:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001853 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_VOTE_BIT, "VK_SUBGROUP_FEATURE_VOTE_BIT",
Jeff Bolzee743412019-06-20 22:24:32 -05001854 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
1855 break;
1856 case spv::CapabilityGroupNonUniformArithmetic:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001857 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_ARITHMETIC_BIT,
Jeff Bolzee743412019-06-20 22:24:32 -05001858 "VK_SUBGROUP_FEATURE_ARITHMETIC_BIT",
1859 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
1860 break;
1861 case spv::CapabilityGroupNonUniformBallot:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001862 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_BALLOT_BIT, "VK_SUBGROUP_FEATURE_BALLOT_BIT",
Jeff Bolzee743412019-06-20 22:24:32 -05001863 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
1864 break;
1865 case spv::CapabilityGroupNonUniformShuffle:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001866 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_SHUFFLE_BIT,
Jeff Bolzee743412019-06-20 22:24:32 -05001867 "VK_SUBGROUP_FEATURE_SHUFFLE_BIT",
1868 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
1869 break;
1870 case spv::CapabilityGroupNonUniformShuffleRelative:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001871 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_SHUFFLE_RELATIVE_BIT,
Jeff Bolzee743412019-06-20 22:24:32 -05001872 "VK_SUBGROUP_FEATURE_SHUFFLE_RELATIVE_BIT",
1873 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
1874 break;
1875 case spv::CapabilityGroupNonUniformClustered:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001876 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_CLUSTERED_BIT,
Jeff Bolzee743412019-06-20 22:24:32 -05001877 "VK_SUBGROUP_FEATURE_CLUSTERED_BIT",
1878 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
1879 break;
1880 case spv::CapabilityGroupNonUniformQuad:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001881 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_QUAD_BIT, "VK_SUBGROUP_FEATURE_QUAD_BIT",
Jeff Bolzee743412019-06-20 22:24:32 -05001882 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
1883 break;
1884 case spv::CapabilityGroupNonUniformPartitionedNV:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001885 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_PARTITIONED_BIT_NV,
Jeff Bolzee743412019-06-20 22:24:32 -05001886 "VK_SUBGROUP_FEATURE_PARTITIONED_BIT_NV",
1887 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
1888 break;
1889 }
Chris Forbes47567b72017-06-09 12:09:45 -07001890 }
baldurk4095f932020-02-16 13:24:42 +00001891 } else if (insn.opcode() == spv::OpExtension) {
1892 std::string extension_name = (char const *)&insn.word(1);
1893
1894 if (extension_name == "SPV_KHR_non_semantic_info") {
1895 skip |= RequireExtension(IsExtEnabled(device_extensions.vk_khr_shader_non_semantic_info),
1896 VK_KHR_SHADER_NON_SEMANTIC_INFO_EXTENSION_NAME);
1897 }
Chris Forbes47567b72017-06-09 12:09:45 -07001898 }
1899 }
1900
Jeff Bolzee743412019-06-20 22:24:32 -05001901 return skip;
1902}
1903
John Zulaufac4c6e12019-07-01 16:05:58 -06001904bool CoreChecks::ValidateShaderStageWritableDescriptor(VkShaderStageFlagBits stage, bool has_writable_descriptor) const {
Jeff Bolzee743412019-06-20 22:24:32 -05001905 bool skip = false;
1906
Chris Forbes349b3132018-03-07 11:38:08 -08001907 if (has_writable_descriptor) {
1908 switch (stage) {
1909 case VK_SHADER_STAGE_COMPUTE_BIT:
Jeff Bolz148d94e2018-12-13 21:25:56 -06001910 case VK_SHADER_STAGE_RAYGEN_BIT_NV:
1911 case VK_SHADER_STAGE_ANY_HIT_BIT_NV:
1912 case VK_SHADER_STAGE_CLOSEST_HIT_BIT_NV:
1913 case VK_SHADER_STAGE_MISS_BIT_NV:
1914 case VK_SHADER_STAGE_INTERSECTION_BIT_NV:
1915 case VK_SHADER_STAGE_CALLABLE_BIT_NV:
1916 case VK_SHADER_STAGE_TASK_BIT_NV:
1917 case VK_SHADER_STAGE_MESH_BIT_NV:
Chris Forbes349b3132018-03-07 11:38:08 -08001918 /* No feature requirements for writes and atomics from compute
Jeff Bolz148d94e2018-12-13 21:25:56 -06001919 * raytracing, or mesh stages */
Chris Forbes349b3132018-03-07 11:38:08 -08001920 break;
1921 case VK_SHADER_STAGE_FRAGMENT_BIT:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001922 skip |= RequireFeature(enabled_features.core.fragmentStoresAndAtomics, "fragmentStoresAndAtomics");
Chris Forbes349b3132018-03-07 11:38:08 -08001923 break;
1924 default:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001925 skip |= RequireFeature(enabled_features.core.vertexPipelineStoresAndAtomics, "vertexPipelineStoresAndAtomics");
Chris Forbes349b3132018-03-07 11:38:08 -08001926 break;
1927 }
1928 }
1929
Chris Forbes47567b72017-06-09 12:09:45 -07001930 return skip;
1931}
1932
Jeff Bolz526f2d52019-09-18 13:18:08 -05001933bool CoreChecks::ValidateShaderStageGroupNonUniform(SHADER_MODULE_STATE const *module, VkShaderStageFlagBits stage) const {
Jeff Bolzee743412019-06-20 22:24:32 -05001934 bool skip = false;
1935
Piers Daniell41b8c5d2020-01-10 15:42:00 -07001936 auto const subgroup_props = phys_dev_props_core11;
Jeff Bolzee743412019-06-20 22:24:32 -05001937
Jeff Bolz526f2d52019-09-18 13:18:08 -05001938 for (auto inst : *module) {
Jeff Bolzee743412019-06-20 22:24:32 -05001939 // Check the quad operations.
1940 switch (inst.opcode()) {
1941 default:
1942 break;
1943 case spv::OpGroupNonUniformQuadBroadcast:
1944 case spv::OpGroupNonUniformQuadSwap:
1945 if ((stage != VK_SHADER_STAGE_FRAGMENT_BIT) && (stage != VK_SHADER_STAGE_COMPUTE_BIT)) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001946 skip |= RequireFeature(subgroup_props.subgroupQuadOperationsInAllStages,
Jeff Bolzee743412019-06-20 22:24:32 -05001947 "VkPhysicalDeviceSubgroupProperties::quadOperationsInAllStages");
1948 }
1949 break;
1950 }
Jeff Bolz526f2d52019-09-18 13:18:08 -05001951
Piers Daniell41b8c5d2020-01-10 15:42:00 -07001952 if (!enabled_features.core12.shaderSubgroupExtendedTypes) {
Jeff Bolz526f2d52019-09-18 13:18:08 -05001953 switch (inst.opcode()) {
1954 default:
1955 break;
1956 case spv::OpGroupNonUniformAllEqual:
1957 case spv::OpGroupNonUniformBroadcast:
1958 case spv::OpGroupNonUniformBroadcastFirst:
1959 case spv::OpGroupNonUniformShuffle:
1960 case spv::OpGroupNonUniformShuffleXor:
1961 case spv::OpGroupNonUniformShuffleUp:
1962 case spv::OpGroupNonUniformShuffleDown:
1963 case spv::OpGroupNonUniformIAdd:
1964 case spv::OpGroupNonUniformFAdd:
1965 case spv::OpGroupNonUniformIMul:
1966 case spv::OpGroupNonUniformFMul:
1967 case spv::OpGroupNonUniformSMin:
1968 case spv::OpGroupNonUniformUMin:
1969 case spv::OpGroupNonUniformFMin:
1970 case spv::OpGroupNonUniformSMax:
1971 case spv::OpGroupNonUniformUMax:
1972 case spv::OpGroupNonUniformFMax:
1973 case spv::OpGroupNonUniformBitwiseAnd:
1974 case spv::OpGroupNonUniformBitwiseOr:
1975 case spv::OpGroupNonUniformBitwiseXor:
1976 case spv::OpGroupNonUniformLogicalAnd:
1977 case spv::OpGroupNonUniformLogicalOr:
1978 case spv::OpGroupNonUniformLogicalXor:
1979 case spv::OpGroupNonUniformQuadBroadcast:
1980 case spv::OpGroupNonUniformQuadSwap: {
1981 auto type = module->get_def(inst.word(1));
1982
1983 if (type.opcode() == spv::OpTypeVector) {
1984 // Get the element type
1985 type = module->get_def(type.word(2));
1986 }
1987
1988 if (type.opcode() == spv::OpTypeBool) {
1989 break;
1990 }
1991
1992 // Both OpTypeInt and OpTypeFloat the width is in the 2nd word.
1993 const uint32_t width = type.word(2);
1994
1995 if ((type.opcode() == spv::OpTypeFloat && width == 16) ||
1996 (type.opcode() == spv::OpTypeInt && (width == 8 || width == 16 || width == 64))) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001997 skip |= RequireFeature(enabled_features.core12.shaderSubgroupExtendedTypes,
Tony-LunarGa74d3fe2019-11-22 15:43:20 -07001998 "VkPhysicalDeviceShaderSubgroupExtendedTypesFeatures::shaderSubgroupExtendedTypes");
Jeff Bolz526f2d52019-09-18 13:18:08 -05001999 }
2000 break;
2001 }
2002 }
2003 }
Jeff Bolzee743412019-06-20 22:24:32 -05002004 }
2005
2006 return skip;
2007}
2008
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06002009bool CoreChecks::ValidateShaderStageInputOutputLimits(SHADER_MODULE_STATE const *src, VkPipelineShaderStageCreateInfo const *pStage,
John Zulaufac4c6e12019-07-01 16:05:58 -06002010 const PIPELINE_STATE *pipeline, spirv_inst_iter entrypoint) const {
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002011 if (pStage->stage == VK_SHADER_STAGE_COMPUTE_BIT || pStage->stage == VK_SHADER_STAGE_ALL_GRAPHICS ||
2012 pStage->stage == VK_SHADER_STAGE_ALL) {
2013 return false;
2014 }
2015
2016 bool skip = false;
Mark Lobodzinski518eadc2019-03-09 12:07:30 -07002017 auto const &limits = phys_dev_props.limits;
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002018
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002019 std::set<uint32_t> patchIDs;
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002020 struct Variable {
2021 uint32_t baseTypePtrID;
2022 uint32_t ID;
2023 uint32_t storageClass;
2024 };
2025 std::vector<Variable> variables;
2026
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002027 uint32_t numVertices = 0;
2028
Jeff Bolzf234bf82019-11-04 14:07:15 -06002029 auto entrypointVariables = FindEntrypointInterfaces(entrypoint);
2030
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002031 for (auto insn : *src) {
2032 switch (insn.opcode()) {
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002033 // Find all Patch decorations
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002034 case spv::OpDecorate:
2035 switch (insn.word(2)) {
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002036 case spv::DecorationPatch: {
2037 patchIDs.insert(insn.word(1));
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002038 break;
2039 }
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002040 default:
2041 break;
2042 }
2043 break;
2044 // Find all input and output variables
2045 case spv::OpVariable: {
2046 Variable var = {};
2047 var.storageClass = insn.word(3);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002048 if ((var.storageClass == spv::StorageClassInput || var.storageClass == spv::StorageClassOutput) &&
2049 // Only include variables in the entrypoint's interface
2050 find(entrypointVariables.begin(), entrypointVariables.end(), insn.word(2)) != entrypointVariables.end()) {
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002051 var.baseTypePtrID = insn.word(1);
2052 var.ID = insn.word(2);
2053 variables.push_back(var);
2054 }
2055 break;
2056 }
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002057 case spv::OpExecutionMode:
2058 if (insn.word(1) == entrypoint.word(2)) {
2059 switch (insn.word(2)) {
2060 default:
2061 break;
2062 case spv::ExecutionModeOutputVertices:
2063 numVertices = insn.word(3);
2064 break;
2065 }
2066 }
2067 break;
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002068 default:
2069 break;
2070 }
2071 }
2072
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002073 bool strip_output_array_level =
2074 (pStage->stage == VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT || pStage->stage == VK_SHADER_STAGE_MESH_BIT_NV);
2075 bool strip_input_array_level =
2076 (pStage->stage == VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT ||
2077 pStage->stage == VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT || pStage->stage == VK_SHADER_STAGE_GEOMETRY_BIT);
2078
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002079 uint32_t numCompIn = 0, numCompOut = 0;
Jeff Bolzf234bf82019-11-04 14:07:15 -06002080 int maxCompIn = 0, maxCompOut = 0;
2081
2082 auto inputs = CollectInterfaceByLocation(src, entrypoint, spv::StorageClassInput, strip_input_array_level);
2083 auto outputs = CollectInterfaceByLocation(src, entrypoint, spv::StorageClassOutput, strip_output_array_level);
2084
2085 // Find max component location used for input variables.
2086 for (auto &var : inputs) {
2087 int location = var.first.first;
2088 int component = var.first.second;
2089 interface_var &iv = var.second;
2090
2091 // Only need to look at the first location, since we use the type's whole size
2092 if (iv.offset != 0) {
2093 continue;
2094 }
2095
2096 if (iv.is_patch) {
2097 continue;
2098 }
2099
2100 int numComponents = GetComponentsConsumedByType(src, iv.type_id, strip_input_array_level);
2101 maxCompIn = std::max(maxCompIn, location * 4 + component + numComponents);
2102 }
2103
2104 // Find max component location used for output variables.
2105 for (auto &var : outputs) {
2106 int location = var.first.first;
2107 int component = var.first.second;
2108 interface_var &iv = var.second;
2109
2110 // Only need to look at the first location, since we use the type's whole size
2111 if (iv.offset != 0) {
2112 continue;
2113 }
2114
2115 if (iv.is_patch) {
2116 continue;
2117 }
2118
2119 int numComponents = GetComponentsConsumedByType(src, iv.type_id, strip_output_array_level);
2120 maxCompOut = std::max(maxCompOut, location * 4 + component + numComponents);
2121 }
2122
2123 // XXX TODO: Would be nice to rewrite this to use CollectInterfaceByLocation (or something similar),
2124 // but that doesn't include builtins.
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002125 for (auto &var : variables) {
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002126 // Check if the variable is a patch. Patches can also be members of blocks,
2127 // but if they are then the top-level arrayness has already been stripped
2128 // by the time GetComponentsConsumedByType gets to it.
2129 bool isPatch = patchIDs.find(var.ID) != patchIDs.end();
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002130
2131 if (var.storageClass == spv::StorageClassInput) {
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002132 numCompIn += GetComponentsConsumedByType(src, var.baseTypePtrID, strip_input_array_level && !isPatch);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002133 } else { // var.storageClass == spv::StorageClassOutput
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002134 numCompOut += GetComponentsConsumedByType(src, var.baseTypePtrID, strip_output_array_level && !isPatch);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002135 }
2136 }
2137
2138 switch (pStage->stage) {
2139 case VK_SHADER_STAGE_VERTEX_BIT:
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002140 if (numCompOut > limits.maxVertexOutputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002141 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2142 "Invalid Pipeline CreateInfo State: Vertex shader exceeds "
2143 "VkPhysicalDeviceLimits::maxVertexOutputComponents of %u "
2144 "components by %u components",
2145 limits.maxVertexOutputComponents, numCompOut - limits.maxVertexOutputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002146 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002147 if (maxCompOut > (int)limits.maxVertexOutputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002148 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2149 "Invalid Pipeline CreateInfo State: Vertex shader output variable uses location that "
2150 "exceeds component limit VkPhysicalDeviceLimits::maxVertexOutputComponents (%u)",
2151 limits.maxVertexOutputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002152 }
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002153 break;
2154
2155 case VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT:
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002156 if (numCompIn > limits.maxTessellationControlPerVertexInputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002157 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2158 "Invalid Pipeline CreateInfo State: Tessellation control shader exceeds "
2159 "VkPhysicalDeviceLimits::maxTessellationControlPerVertexInputComponents of %u "
2160 "components by %u components",
2161 limits.maxTessellationControlPerVertexInputComponents,
2162 numCompIn - limits.maxTessellationControlPerVertexInputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002163 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002164 if (maxCompIn > (int)limits.maxTessellationControlPerVertexInputComponents) {
2165 skip |=
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002166 LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2167 "Invalid Pipeline CreateInfo State: Tessellation control shader input variable uses location that "
2168 "exceeds component limit VkPhysicalDeviceLimits::maxTessellationControlPerVertexInputComponents (%u)",
2169 limits.maxTessellationControlPerVertexInputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002170 }
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002171 if (numCompOut > limits.maxTessellationControlPerVertexOutputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002172 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2173 "Invalid Pipeline CreateInfo State: Tessellation control shader exceeds "
2174 "VkPhysicalDeviceLimits::maxTessellationControlPerVertexOutputComponents of %u "
2175 "components by %u components",
2176 limits.maxTessellationControlPerVertexOutputComponents,
2177 numCompOut - limits.maxTessellationControlPerVertexOutputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002178 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002179 if (maxCompOut > (int)limits.maxTessellationControlPerVertexOutputComponents) {
2180 skip |=
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002181 LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2182 "Invalid Pipeline CreateInfo State: Tessellation control shader output variable uses location that "
2183 "exceeds component limit VkPhysicalDeviceLimits::maxTessellationControlPerVertexOutputComponents (%u)",
2184 limits.maxTessellationControlPerVertexOutputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002185 }
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002186 break;
2187
2188 case VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT:
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002189 if (numCompIn > limits.maxTessellationEvaluationInputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002190 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2191 "Invalid Pipeline CreateInfo State: Tessellation evaluation shader exceeds "
2192 "VkPhysicalDeviceLimits::maxTessellationEvaluationInputComponents of %u "
2193 "components by %u components",
2194 limits.maxTessellationEvaluationInputComponents,
2195 numCompIn - limits.maxTessellationEvaluationInputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002196 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002197 if (maxCompIn > (int)limits.maxTessellationEvaluationInputComponents) {
2198 skip |=
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002199 LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2200 "Invalid Pipeline CreateInfo State: Tessellation evaluation shader input variable uses location that "
2201 "exceeds component limit VkPhysicalDeviceLimits::maxTessellationEvaluationInputComponents (%u)",
2202 limits.maxTessellationEvaluationInputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002203 }
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002204 if (numCompOut > limits.maxTessellationEvaluationOutputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002205 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2206 "Invalid Pipeline CreateInfo State: Tessellation evaluation shader exceeds "
2207 "VkPhysicalDeviceLimits::maxTessellationEvaluationOutputComponents of %u "
2208 "components by %u components",
2209 limits.maxTessellationEvaluationOutputComponents,
2210 numCompOut - limits.maxTessellationEvaluationOutputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002211 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002212 if (maxCompOut > (int)limits.maxTessellationEvaluationOutputComponents) {
2213 skip |=
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002214 LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2215 "Invalid Pipeline CreateInfo State: Tessellation evaluation shader output variable uses location that "
2216 "exceeds component limit VkPhysicalDeviceLimits::maxTessellationEvaluationOutputComponents (%u)",
2217 limits.maxTessellationEvaluationOutputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002218 }
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002219 break;
2220
2221 case VK_SHADER_STAGE_GEOMETRY_BIT:
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002222 if (numCompIn > limits.maxGeometryInputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002223 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2224 "Invalid Pipeline CreateInfo State: Geometry shader exceeds "
2225 "VkPhysicalDeviceLimits::maxGeometryInputComponents of %u "
2226 "components by %u components",
2227 limits.maxGeometryInputComponents, numCompIn - limits.maxGeometryInputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002228 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002229 if (maxCompIn > (int)limits.maxGeometryInputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002230 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2231 "Invalid Pipeline CreateInfo State: Geometry shader input variable uses location that "
2232 "exceeds component limit VkPhysicalDeviceLimits::maxGeometryInputComponents (%u)",
2233 limits.maxGeometryInputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002234 }
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002235 if (numCompOut > limits.maxGeometryOutputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002236 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2237 "Invalid Pipeline CreateInfo State: Geometry shader exceeds "
2238 "VkPhysicalDeviceLimits::maxGeometryOutputComponents of %u "
2239 "components by %u components",
2240 limits.maxGeometryOutputComponents, numCompOut - limits.maxGeometryOutputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002241 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002242 if (maxCompOut > (int)limits.maxGeometryOutputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002243 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2244 "Invalid Pipeline CreateInfo State: Geometry shader output variable uses location that "
2245 "exceeds component limit VkPhysicalDeviceLimits::maxGeometryOutputComponents (%u)",
2246 limits.maxGeometryOutputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002247 }
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002248 if (numCompOut * numVertices > limits.maxGeometryTotalOutputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002249 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2250 "Invalid Pipeline CreateInfo State: Geometry shader exceeds "
2251 "VkPhysicalDeviceLimits::maxGeometryTotalOutputComponents of %u "
2252 "components by %u components",
2253 limits.maxGeometryTotalOutputComponents,
2254 numCompOut * numVertices - limits.maxGeometryTotalOutputComponents);
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002255 }
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002256 break;
2257
2258 case VK_SHADER_STAGE_FRAGMENT_BIT:
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002259 if (numCompIn > limits.maxFragmentInputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002260 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2261 "Invalid Pipeline CreateInfo State: Fragment shader exceeds "
2262 "VkPhysicalDeviceLimits::maxFragmentInputComponents of %u "
2263 "components by %u components",
2264 limits.maxFragmentInputComponents, numCompIn - limits.maxFragmentInputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002265 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002266 if (maxCompIn > (int)limits.maxFragmentInputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002267 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2268 "Invalid Pipeline CreateInfo State: Fragment shader input variable uses location that "
2269 "exceeds component limit VkPhysicalDeviceLimits::maxFragmentInputComponents (%u)",
2270 limits.maxFragmentInputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002271 }
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002272 break;
2273
Jeff Bolz148d94e2018-12-13 21:25:56 -06002274 case VK_SHADER_STAGE_RAYGEN_BIT_NV:
2275 case VK_SHADER_STAGE_ANY_HIT_BIT_NV:
2276 case VK_SHADER_STAGE_CLOSEST_HIT_BIT_NV:
2277 case VK_SHADER_STAGE_MISS_BIT_NV:
2278 case VK_SHADER_STAGE_INTERSECTION_BIT_NV:
2279 case VK_SHADER_STAGE_CALLABLE_BIT_NV:
2280 case VK_SHADER_STAGE_TASK_BIT_NV:
2281 case VK_SHADER_STAGE_MESH_BIT_NV:
2282 break;
2283
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002284 default:
2285 assert(false); // This should never happen
2286 }
2287 return skip;
2288}
2289
sfricke-samsungdc96f302020-03-18 20:42:10 -07002290bool CoreChecks::ValidateShaderStageMaxResources(VkShaderStageFlagBits stage, const PIPELINE_STATE *pipeline) const {
2291 bool skip = false;
2292 uint32_t total_resources = 0;
2293
2294 // Only currently testing for graphics and compute pipelines
2295 // TODO: Add check and support for Ray Tracing pipeline VUID 03428
2296 if ((stage & (VK_SHADER_STAGE_ALL_GRAPHICS | VK_SHADER_STAGE_COMPUTE_BIT)) == 0) {
2297 return false;
2298 }
2299
2300 if (stage == VK_SHADER_STAGE_FRAGMENT_BIT) {
2301 // "For the fragment shader stage the framebuffer color attachments also count against this limit"
2302 total_resources += pipeline->rp_state->createInfo.pSubpasses[pipeline->graphicsPipelineCI.subpass].colorAttachmentCount;
2303 }
2304
2305 // TODO: This reuses a lot of GetDescriptorCountMaxPerStage but currently would need to make it agnostic in a way to handle
2306 // input from CreatePipeline and CreatePipelineLayout level
2307 for (auto set_layout : pipeline->pipeline_layout->set_layouts) {
2308 if ((set_layout->GetCreateFlags() & VK_DESCRIPTOR_SET_LAYOUT_CREATE_UPDATE_AFTER_BIND_POOL_BIT) != 0) {
2309 continue;
2310 }
2311
2312 for (uint32_t binding_idx = 0; binding_idx < set_layout->GetBindingCount(); binding_idx++) {
2313 const VkDescriptorSetLayoutBinding *binding = set_layout->GetDescriptorSetLayoutBindingPtrFromIndex(binding_idx);
2314 // Bindings with a descriptorCount of 0 are "reserved" and should be skipped
2315 if (((stage & binding->stageFlags) != 0) && (binding->descriptorCount > 0)) {
2316 // Check only descriptor types listed in maxPerStageResources description in spec
2317 switch (binding->descriptorType) {
2318 case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
2319 case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
2320 case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
2321 case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
2322 case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER:
2323 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
2324 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER:
2325 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
2326 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC:
2327 case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
2328 total_resources += binding->descriptorCount;
2329 break;
2330 default:
2331 break;
2332 }
2333 }
2334 }
2335 }
2336
2337 if (total_resources > phys_dev_props.limits.maxPerStageResources) {
2338 const char *vuid = (stage == VK_SHADER_STAGE_COMPUTE_BIT) ? "VUID-VkComputePipelineCreateInfo-layout-01687"
2339 : "VUID-VkGraphicsPipelineCreateInfo-layout-01688";
2340 skip |= LogError(pipeline->pipeline, vuid,
2341 "Invalid Pipeline CreateInfo State: Shader Stage %s exceeds component limit "
2342 "VkPhysicalDeviceLimits::maxPerStageResources (%u)",
2343 string_VkShaderStageFlagBits(stage), phys_dev_props.limits.maxPerStageResources);
2344 }
2345
2346 return skip;
2347}
2348
Jeff Bolze4356752019-03-07 11:23:46 -06002349// copy the specialization constant value into buf, if it is present
2350void GetSpecConstantValue(VkPipelineShaderStageCreateInfo const *pStage, uint32_t spec_id, void *buf) {
2351 VkSpecializationInfo const *spec = pStage->pSpecializationInfo;
2352
2353 if (spec && spec_id < spec->mapEntryCount) {
2354 memcpy(buf, (uint8_t *)spec->pData + spec->pMapEntries[spec_id].offset, spec->pMapEntries[spec_id].size);
2355 }
2356}
2357
2358// Fill in value with the constant or specialization constant value, if available.
2359// Returns true if the value has been accurately filled out.
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06002360static bool GetIntConstantValue(spirv_inst_iter insn, SHADER_MODULE_STATE const *src, VkPipelineShaderStageCreateInfo const *pStage,
Jeff Bolze4356752019-03-07 11:23:46 -06002361 const std::unordered_map<uint32_t, uint32_t> &id_to_spec_id, uint32_t *value) {
2362 auto type_id = src->get_def(insn.word(1));
2363 if (type_id.opcode() != spv::OpTypeInt || type_id.word(2) != 32) {
2364 return false;
2365 }
2366 switch (insn.opcode()) {
2367 case spv::OpSpecConstant:
2368 *value = insn.word(3);
2369 GetSpecConstantValue(pStage, id_to_spec_id.at(insn.word(2)), value);
2370 return true;
2371 case spv::OpConstant:
2372 *value = insn.word(3);
2373 return true;
2374 default:
2375 return false;
2376 }
2377}
2378
2379// Map SPIR-V type to VK_COMPONENT_TYPE enum
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06002380VkComponentTypeNV GetComponentType(spirv_inst_iter insn, SHADER_MODULE_STATE const *src) {
Jeff Bolze4356752019-03-07 11:23:46 -06002381 switch (insn.opcode()) {
2382 case spv::OpTypeInt:
2383 switch (insn.word(2)) {
2384 case 8:
2385 return insn.word(3) != 0 ? VK_COMPONENT_TYPE_SINT8_NV : VK_COMPONENT_TYPE_UINT8_NV;
2386 case 16:
2387 return insn.word(3) != 0 ? VK_COMPONENT_TYPE_SINT16_NV : VK_COMPONENT_TYPE_UINT16_NV;
2388 case 32:
2389 return insn.word(3) != 0 ? VK_COMPONENT_TYPE_SINT32_NV : VK_COMPONENT_TYPE_UINT32_NV;
2390 case 64:
2391 return insn.word(3) != 0 ? VK_COMPONENT_TYPE_SINT64_NV : VK_COMPONENT_TYPE_UINT64_NV;
2392 default:
2393 return VK_COMPONENT_TYPE_MAX_ENUM_NV;
2394 }
2395 case spv::OpTypeFloat:
2396 switch (insn.word(2)) {
2397 case 16:
2398 return VK_COMPONENT_TYPE_FLOAT16_NV;
2399 case 32:
2400 return VK_COMPONENT_TYPE_FLOAT32_NV;
2401 case 64:
2402 return VK_COMPONENT_TYPE_FLOAT64_NV;
2403 default:
2404 return VK_COMPONENT_TYPE_MAX_ENUM_NV;
2405 }
2406 default:
2407 return VK_COMPONENT_TYPE_MAX_ENUM_NV;
2408 }
2409}
2410
2411// Validate SPV_NV_cooperative_matrix behavior that can't be statically validated
2412// in SPIRV-Tools (e.g. due to specialization constant usage).
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06002413bool CoreChecks::ValidateCooperativeMatrix(SHADER_MODULE_STATE const *src, VkPipelineShaderStageCreateInfo const *pStage,
John Zulaufac4c6e12019-07-01 16:05:58 -06002414 const PIPELINE_STATE *pipeline) const {
Jeff Bolze4356752019-03-07 11:23:46 -06002415 bool skip = false;
2416
2417 // Map SPIR-V result ID to specialization constant id (SpecId decoration value)
2418 std::unordered_map<uint32_t, uint32_t> id_to_spec_id;
2419 // Map SPIR-V result ID to the ID of its type.
2420 std::unordered_map<uint32_t, uint32_t> id_to_type_id;
2421
2422 struct CoopMatType {
2423 uint32_t scope, rows, cols;
2424 VkComponentTypeNV component_type;
2425 bool all_constant;
2426
2427 CoopMatType() : scope(0), rows(0), cols(0), component_type(VK_COMPONENT_TYPE_MAX_ENUM_NV), all_constant(false) {}
2428
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06002429 void Init(uint32_t id, SHADER_MODULE_STATE const *src, VkPipelineShaderStageCreateInfo const *pStage,
Jeff Bolze4356752019-03-07 11:23:46 -06002430 const std::unordered_map<uint32_t, uint32_t> &id_to_spec_id) {
2431 spirv_inst_iter insn = src->get_def(id);
2432 uint32_t component_type_id = insn.word(2);
2433 uint32_t scope_id = insn.word(3);
2434 uint32_t rows_id = insn.word(4);
2435 uint32_t cols_id = insn.word(5);
2436 auto component_type_iter = src->get_def(component_type_id);
2437 auto scope_iter = src->get_def(scope_id);
2438 auto rows_iter = src->get_def(rows_id);
2439 auto cols_iter = src->get_def(cols_id);
2440
2441 all_constant = true;
2442 if (!GetIntConstantValue(scope_iter, src, pStage, id_to_spec_id, &scope)) {
2443 all_constant = false;
2444 }
2445 if (!GetIntConstantValue(rows_iter, src, pStage, id_to_spec_id, &rows)) {
2446 all_constant = false;
2447 }
2448 if (!GetIntConstantValue(cols_iter, src, pStage, id_to_spec_id, &cols)) {
2449 all_constant = false;
2450 }
2451 component_type = GetComponentType(component_type_iter, src);
2452 }
2453 };
2454
2455 bool seen_coopmat_capability = false;
2456
2457 for (auto insn : *src) {
2458 // Whitelist instructions whose result can be a cooperative matrix type, and
2459 // keep track of their types. It would be nice if SPIRV-Headers generated code
2460 // to identify which instructions have a result type and result id. Lacking that,
2461 // this whitelist is based on the set of instructions that
2462 // SPV_NV_cooperative_matrix says can be used with cooperative matrix types.
2463 switch (insn.opcode()) {
2464 case spv::OpLoad:
2465 case spv::OpCooperativeMatrixLoadNV:
2466 case spv::OpCooperativeMatrixMulAddNV:
2467 case spv::OpSNegate:
2468 case spv::OpFNegate:
2469 case spv::OpIAdd:
2470 case spv::OpFAdd:
2471 case spv::OpISub:
2472 case spv::OpFSub:
2473 case spv::OpFDiv:
2474 case spv::OpSDiv:
2475 case spv::OpUDiv:
2476 case spv::OpMatrixTimesScalar:
2477 case spv::OpConstantComposite:
2478 case spv::OpCompositeConstruct:
2479 case spv::OpConvertFToU:
2480 case spv::OpConvertFToS:
2481 case spv::OpConvertSToF:
2482 case spv::OpConvertUToF:
2483 case spv::OpUConvert:
2484 case spv::OpSConvert:
2485 case spv::OpFConvert:
2486 id_to_type_id[insn.word(2)] = insn.word(1);
2487 break;
2488 default:
2489 break;
2490 }
2491
2492 switch (insn.opcode()) {
2493 case spv::OpDecorate:
2494 if (insn.word(2) == spv::DecorationSpecId) {
2495 id_to_spec_id[insn.word(1)] = insn.word(3);
2496 }
2497 break;
2498 case spv::OpCapability:
2499 if (insn.word(1) == spv::CapabilityCooperativeMatrixNV) {
2500 seen_coopmat_capability = true;
2501
2502 if (!(pStage->stage & phys_dev_ext_props.cooperative_matrix_props.cooperativeMatrixSupportedStages)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002503 skip |= LogError(
2504 pipeline->pipeline, kVUID_Core_Shader_CooperativeMatrixSupportedStages,
2505 "OpTypeCooperativeMatrixNV used in shader stage not in cooperativeMatrixSupportedStages (= %u)",
2506 phys_dev_ext_props.cooperative_matrix_props.cooperativeMatrixSupportedStages);
Jeff Bolze4356752019-03-07 11:23:46 -06002507 }
2508 }
2509 break;
2510 case spv::OpMemoryModel:
2511 // If the capability isn't enabled, don't bother with the rest of this function.
2512 // OpMemoryModel is the first required instruction after all OpCapability instructions.
2513 if (!seen_coopmat_capability) {
2514 return skip;
2515 }
2516 break;
2517 case spv::OpTypeCooperativeMatrixNV: {
2518 CoopMatType M;
2519 M.Init(insn.word(1), src, pStage, id_to_spec_id);
2520
2521 if (M.all_constant) {
2522 // Validate that the type parameters are all supported for one of the
2523 // operands of a cooperative matrix property.
2524 bool valid = false;
2525 for (unsigned i = 0; i < cooperative_matrix_properties.size(); ++i) {
2526 if (cooperative_matrix_properties[i].AType == M.component_type &&
2527 cooperative_matrix_properties[i].MSize == M.rows && cooperative_matrix_properties[i].KSize == M.cols &&
2528 cooperative_matrix_properties[i].scope == M.scope) {
2529 valid = true;
2530 break;
2531 }
2532 if (cooperative_matrix_properties[i].BType == M.component_type &&
2533 cooperative_matrix_properties[i].KSize == M.rows && cooperative_matrix_properties[i].NSize == M.cols &&
2534 cooperative_matrix_properties[i].scope == M.scope) {
2535 valid = true;
2536 break;
2537 }
2538 if (cooperative_matrix_properties[i].CType == M.component_type &&
2539 cooperative_matrix_properties[i].MSize == M.rows && cooperative_matrix_properties[i].NSize == M.cols &&
2540 cooperative_matrix_properties[i].scope == M.scope) {
2541 valid = true;
2542 break;
2543 }
2544 if (cooperative_matrix_properties[i].DType == M.component_type &&
2545 cooperative_matrix_properties[i].MSize == M.rows && cooperative_matrix_properties[i].NSize == M.cols &&
2546 cooperative_matrix_properties[i].scope == M.scope) {
2547 valid = true;
2548 break;
2549 }
2550 }
2551 if (!valid) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002552 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_CooperativeMatrixType,
2553 "OpTypeCooperativeMatrixNV (result id = %u) operands don't match a supported matrix type",
2554 insn.word(1));
Jeff Bolze4356752019-03-07 11:23:46 -06002555 }
2556 }
2557 break;
2558 }
2559 case spv::OpCooperativeMatrixMulAddNV: {
2560 CoopMatType A, B, C, D;
2561 if (id_to_type_id.find(insn.word(2)) == id_to_type_id.end() ||
2562 id_to_type_id.find(insn.word(3)) == id_to_type_id.end() ||
2563 id_to_type_id.find(insn.word(4)) == id_to_type_id.end() ||
2564 id_to_type_id.find(insn.word(5)) == id_to_type_id.end()) {
Mike Schuchardte48dc142019-04-18 09:12:03 -07002565 // Couldn't find type of matrix
2566 assert(false);
Jeff Bolze4356752019-03-07 11:23:46 -06002567 break;
2568 }
2569 D.Init(id_to_type_id[insn.word(2)], src, pStage, id_to_spec_id);
2570 A.Init(id_to_type_id[insn.word(3)], src, pStage, id_to_spec_id);
2571 B.Init(id_to_type_id[insn.word(4)], src, pStage, id_to_spec_id);
2572 C.Init(id_to_type_id[insn.word(5)], src, pStage, id_to_spec_id);
2573
2574 if (A.all_constant && B.all_constant && C.all_constant && D.all_constant) {
2575 // Validate that the type parameters are all supported for the same
2576 // cooperative matrix property.
2577 bool valid = false;
2578 for (unsigned i = 0; i < cooperative_matrix_properties.size(); ++i) {
2579 if (cooperative_matrix_properties[i].AType == A.component_type &&
2580 cooperative_matrix_properties[i].MSize == A.rows && cooperative_matrix_properties[i].KSize == A.cols &&
2581 cooperative_matrix_properties[i].scope == A.scope &&
2582
2583 cooperative_matrix_properties[i].BType == B.component_type &&
2584 cooperative_matrix_properties[i].KSize == B.rows && cooperative_matrix_properties[i].NSize == B.cols &&
2585 cooperative_matrix_properties[i].scope == B.scope &&
2586
2587 cooperative_matrix_properties[i].CType == C.component_type &&
2588 cooperative_matrix_properties[i].MSize == C.rows && cooperative_matrix_properties[i].NSize == C.cols &&
2589 cooperative_matrix_properties[i].scope == C.scope &&
2590
2591 cooperative_matrix_properties[i].DType == D.component_type &&
2592 cooperative_matrix_properties[i].MSize == D.rows && cooperative_matrix_properties[i].NSize == D.cols &&
2593 cooperative_matrix_properties[i].scope == D.scope) {
2594 valid = true;
2595 break;
2596 }
2597 }
2598 if (!valid) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002599 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_CooperativeMatrixMulAdd,
2600 "OpCooperativeMatrixMulAddNV (result id = %u) operands don't match a supported matrix "
2601 "VkCooperativeMatrixPropertiesNV",
2602 insn.word(2));
Jeff Bolze4356752019-03-07 11:23:46 -06002603 }
2604 }
2605 break;
2606 }
2607 default:
2608 break;
2609 }
2610 }
2611
2612 return skip;
2613}
2614
John Zulaufac4c6e12019-07-01 16:05:58 -06002615bool CoreChecks::ValidateExecutionModes(SHADER_MODULE_STATE const *src, spirv_inst_iter entrypoint) const {
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002616 auto entrypoint_id = entrypoint.word(2);
2617
Attilio Provenzanof6c0e852019-04-09 11:01:18 +01002618 // The first denorm execution mode encountered, along with its bit width.
2619 // Used to check if SeparateDenormSettings is respected.
2620 std::pair<spv::ExecutionMode, uint32_t> first_denorm_execution_mode = std::make_pair(spv::ExecutionModeMax, 0);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002621
Attilio Provenzanof6c0e852019-04-09 11:01:18 +01002622 // The first rounding mode encountered, along with its bit width.
2623 // Used to check if SeparateRoundingModeSettings is respected.
2624 std::pair<spv::ExecutionMode, uint32_t> first_rounding_mode = std::make_pair(spv::ExecutionModeMax, 0);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002625
2626 bool skip = false;
2627
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002628 uint32_t verticesOut = 0;
2629 uint32_t invocations = 0;
2630
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002631 for (auto insn : *src) {
2632 if (insn.opcode() == spv::OpExecutionMode && insn.word(1) == entrypoint_id) {
2633 auto mode = insn.word(2);
2634 switch (mode) {
2635 case spv::ExecutionModeSignedZeroInfNanPreserve: {
2636 auto bit_width = insn.word(3);
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002637 if ((bit_width == 16 && !phys_dev_props_core12.shaderSignedZeroInfNanPreserveFloat16) ||
2638 (bit_width == 32 && !phys_dev_props_core12.shaderSignedZeroInfNanPreserveFloat32) ||
2639 (bit_width == 64 && !phys_dev_props_core12.shaderSignedZeroInfNanPreserveFloat64)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002640 skip |= LogError(
2641 device, kVUID_Core_Shader_FeatureNotEnabled,
2642 "Shader requires SignedZeroInfNanPreserve for bit width %d but it is not enabled on the device",
2643 bit_width);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002644 }
2645 break;
2646 }
2647
2648 case spv::ExecutionModeDenormPreserve: {
2649 auto bit_width = insn.word(3);
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002650 if ((bit_width == 16 && !phys_dev_props_core12.shaderDenormPreserveFloat16) ||
2651 (bit_width == 32 && !phys_dev_props_core12.shaderDenormPreserveFloat32) ||
2652 (bit_width == 64 && !phys_dev_props_core12.shaderDenormPreserveFloat64)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002653 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2654 "Shader requires DenormPreserve for bit width %d but it is not enabled on the device",
2655 bit_width);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002656 }
2657
Attilio Provenzanof6c0e852019-04-09 11:01:18 +01002658 if (first_denorm_execution_mode.first == spv::ExecutionModeMax) {
2659 // Register the first denorm execution mode found
2660 first_denorm_execution_mode = std::make_pair(static_cast<spv::ExecutionMode>(mode), bit_width);
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002661 } else if (first_denorm_execution_mode.first != mode && first_denorm_execution_mode.second != bit_width) {
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002662 switch (phys_dev_props_core12.denormBehaviorIndependence) {
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002663 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR:
2664 if (first_rounding_mode.second != 32 && bit_width != 32) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002665 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2666 "Shader uses different denorm execution modes for 16 and 64-bit but "
2667 "denormBehaviorIndependence is "
2668 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002669 }
2670 break;
2671
2672 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_ALL_KHR:
2673 break;
2674
2675 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR:
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002676 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2677 "Shader uses different denorm execution modes for different bit widths but "
2678 "denormBehaviorIndependence is "
2679 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002680 break;
2681
2682 default:
2683 break;
2684 }
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002685 }
2686 break;
2687 }
2688
2689 case spv::ExecutionModeDenormFlushToZero: {
2690 auto bit_width = insn.word(3);
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002691 if ((bit_width == 16 && !phys_dev_props_core12.shaderDenormFlushToZeroFloat16) ||
2692 (bit_width == 32 && !phys_dev_props_core12.shaderDenormFlushToZeroFloat32) ||
2693 (bit_width == 64 && !phys_dev_props_core12.shaderDenormFlushToZeroFloat64)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002694 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2695 "Shader requires DenormFlushToZero for bit width %d but it is not enabled on the device",
2696 bit_width);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002697 }
2698
Attilio Provenzanof6c0e852019-04-09 11:01:18 +01002699 if (first_denorm_execution_mode.first == spv::ExecutionModeMax) {
2700 // Register the first denorm execution mode found
2701 first_denorm_execution_mode = std::make_pair(static_cast<spv::ExecutionMode>(mode), bit_width);
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002702 } else if (first_denorm_execution_mode.first != mode && first_denorm_execution_mode.second != bit_width) {
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002703 switch (phys_dev_props_core12.denormBehaviorIndependence) {
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002704 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR:
2705 if (first_rounding_mode.second != 32 && bit_width != 32) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002706 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2707 "Shader uses different denorm execution modes for 16 and 64-bit but "
2708 "denormBehaviorIndependence is "
2709 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002710 }
2711 break;
2712
2713 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_ALL_KHR:
2714 break;
2715
2716 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR:
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002717 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2718 "Shader uses different denorm execution modes for different bit widths but "
2719 "denormBehaviorIndependence is "
2720 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002721 break;
2722
2723 default:
2724 break;
2725 }
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002726 }
2727 break;
2728 }
2729
2730 case spv::ExecutionModeRoundingModeRTE: {
2731 auto bit_width = insn.word(3);
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002732 if ((bit_width == 16 && !phys_dev_props_core12.shaderRoundingModeRTEFloat16) ||
2733 (bit_width == 32 && !phys_dev_props_core12.shaderRoundingModeRTEFloat32) ||
2734 (bit_width == 64 && !phys_dev_props_core12.shaderRoundingModeRTEFloat64)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002735 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2736 "Shader requires RoundingModeRTE for bit width %d but it is not enabled on the device",
2737 bit_width);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002738 }
2739
Attilio Provenzanof6c0e852019-04-09 11:01:18 +01002740 if (first_rounding_mode.first == spv::ExecutionModeMax) {
2741 // Register the first rounding mode found
2742 first_rounding_mode = std::make_pair(static_cast<spv::ExecutionMode>(mode), bit_width);
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002743 } else if (first_rounding_mode.first != mode && first_rounding_mode.second != bit_width) {
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002744 switch (phys_dev_props_core12.roundingModeIndependence) {
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002745 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR:
2746 if (first_rounding_mode.second != 32 && bit_width != 32) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002747 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2748 "Shader uses different rounding modes for 16 and 64-bit but "
2749 "roundingModeIndependence is "
2750 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002751 }
2752 break;
2753
2754 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_ALL_KHR:
2755 break;
2756
2757 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR:
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002758 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2759 "Shader uses different rounding modes for different bit widths but "
2760 "roundingModeIndependence is "
2761 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002762 break;
2763
2764 default:
2765 break;
2766 }
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002767 }
2768 break;
2769 }
2770
2771 case spv::ExecutionModeRoundingModeRTZ: {
2772 auto bit_width = insn.word(3);
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002773 if ((bit_width == 16 && !phys_dev_props_core12.shaderRoundingModeRTZFloat16) ||
2774 (bit_width == 32 && !phys_dev_props_core12.shaderRoundingModeRTZFloat32) ||
2775 (bit_width == 64 && !phys_dev_props_core12.shaderRoundingModeRTZFloat64)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002776 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2777 "Shader requires RoundingModeRTZ for bit width %d but it is not enabled on the device",
2778 bit_width);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002779 }
2780
Attilio Provenzanof6c0e852019-04-09 11:01:18 +01002781 if (first_rounding_mode.first == spv::ExecutionModeMax) {
2782 // Register the first rounding mode found
2783 first_rounding_mode = std::make_pair(static_cast<spv::ExecutionMode>(mode), bit_width);
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002784 } else if (first_rounding_mode.first != mode && first_rounding_mode.second != bit_width) {
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002785 switch (phys_dev_props_core12.roundingModeIndependence) {
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002786 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR:
2787 if (first_rounding_mode.second != 32 && bit_width != 32) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002788 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2789 "Shader uses different rounding modes for 16 and 64-bit but "
2790 "roundingModeIndependence is "
2791 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002792 }
2793 break;
2794
2795 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_ALL_KHR:
2796 break;
2797
2798 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR:
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002799 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2800 "Shader uses different rounding modes for different bit widths but "
2801 "roundingModeIndependence is "
2802 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002803 break;
2804
2805 default:
2806 break;
2807 }
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002808 }
2809 break;
2810 }
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002811
2812 case spv::ExecutionModeOutputVertices: {
2813 verticesOut = insn.word(3);
2814 break;
2815 }
2816
2817 case spv::ExecutionModeInvocations: {
2818 invocations = insn.word(3);
2819 break;
2820 }
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002821 }
2822 }
2823 }
2824
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002825 if (entrypoint.word(1) == spv::ExecutionModelGeometry) {
2826 if (verticesOut == 0 || verticesOut > phys_dev_props.limits.maxGeometryOutputVertices) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002827 skip |= LogError(device, "VUID-VkPipelineShaderStageCreateInfo-stage-00714",
2828 "Geometry shader entry point must have an OpExecutionMode instruction that "
2829 "specifies a maximum output vertex count that is greater than 0 and less "
2830 "than or equal to maxGeometryOutputVertices. "
2831 "OutputVertices=%d, maxGeometryOutputVertices=%d",
2832 verticesOut, phys_dev_props.limits.maxGeometryOutputVertices);
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002833 }
2834
2835 if (invocations == 0 || invocations > phys_dev_props.limits.maxGeometryShaderInvocations) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002836 skip |= LogError(device, "VUID-VkPipelineShaderStageCreateInfo-stage-00715",
2837 "Geometry shader entry point must have an OpExecutionMode instruction that "
2838 "specifies an invocation count that is greater than 0 and less "
2839 "than or equal to maxGeometryShaderInvocations. "
2840 "Invocations=%d, maxGeometryShaderInvocations=%d",
2841 invocations, phys_dev_props.limits.maxGeometryShaderInvocations);
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002842 }
2843 }
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002844 return skip;
2845}
2846
locke-lunargd9a069d2019-09-17 01:50:19 -06002847uint32_t DescriptorTypeToReqs(SHADER_MODULE_STATE const *module, uint32_t type_id) {
Chris Forbes47567b72017-06-09 12:09:45 -07002848 auto type = module->get_def(type_id);
2849
2850 while (true) {
2851 switch (type.opcode()) {
2852 case spv::OpTypeArray:
Chris Forbes062f1222018-08-21 15:34:15 -07002853 case spv::OpTypeRuntimeArray:
Chris Forbes47567b72017-06-09 12:09:45 -07002854 case spv::OpTypeSampledImage:
2855 type = module->get_def(type.word(2));
2856 break;
2857 case spv::OpTypePointer:
2858 type = module->get_def(type.word(3));
2859 break;
2860 case spv::OpTypeImage: {
2861 auto dim = type.word(3);
2862 auto arrayed = type.word(5);
2863 auto msaa = type.word(6);
2864
Chris Forbes74ba2232018-08-27 15:19:27 -07002865 uint32_t bits = 0;
2866 switch (GetFundamentalType(module, type.word(2))) {
2867 case FORMAT_TYPE_FLOAT:
2868 bits = DESCRIPTOR_REQ_COMPONENT_TYPE_FLOAT;
2869 break;
2870 case FORMAT_TYPE_UINT:
2871 bits = DESCRIPTOR_REQ_COMPONENT_TYPE_UINT;
2872 break;
2873 case FORMAT_TYPE_SINT:
2874 bits = DESCRIPTOR_REQ_COMPONENT_TYPE_SINT;
2875 break;
2876 default:
2877 break;
2878 }
2879
Chris Forbes47567b72017-06-09 12:09:45 -07002880 switch (dim) {
2881 case spv::Dim1D:
Chris Forbes74ba2232018-08-27 15:19:27 -07002882 bits |= arrayed ? DESCRIPTOR_REQ_VIEW_TYPE_1D_ARRAY : DESCRIPTOR_REQ_VIEW_TYPE_1D;
2883 return bits;
Chris Forbes47567b72017-06-09 12:09:45 -07002884 case spv::Dim2D:
Chris Forbes74ba2232018-08-27 15:19:27 -07002885 bits |= msaa ? DESCRIPTOR_REQ_MULTI_SAMPLE : DESCRIPTOR_REQ_SINGLE_SAMPLE;
2886 bits |= arrayed ? DESCRIPTOR_REQ_VIEW_TYPE_2D_ARRAY : DESCRIPTOR_REQ_VIEW_TYPE_2D;
2887 return bits;
Chris Forbes47567b72017-06-09 12:09:45 -07002888 case spv::Dim3D:
Chris Forbes74ba2232018-08-27 15:19:27 -07002889 bits |= DESCRIPTOR_REQ_VIEW_TYPE_3D;
2890 return bits;
Chris Forbes47567b72017-06-09 12:09:45 -07002891 case spv::DimCube:
Chris Forbes74ba2232018-08-27 15:19:27 -07002892 bits |= arrayed ? DESCRIPTOR_REQ_VIEW_TYPE_CUBE_ARRAY : DESCRIPTOR_REQ_VIEW_TYPE_CUBE;
2893 return bits;
Chris Forbes47567b72017-06-09 12:09:45 -07002894 case spv::DimSubpassData:
Chris Forbes74ba2232018-08-27 15:19:27 -07002895 bits |= msaa ? DESCRIPTOR_REQ_MULTI_SAMPLE : DESCRIPTOR_REQ_SINGLE_SAMPLE;
2896 return bits;
Chris Forbes47567b72017-06-09 12:09:45 -07002897 default: // buffer, etc.
Chris Forbes74ba2232018-08-27 15:19:27 -07002898 return bits;
Chris Forbes47567b72017-06-09 12:09:45 -07002899 }
2900 }
2901 default:
2902 return 0;
2903 }
2904 }
2905}
2906
2907// For given pipelineLayout verify that the set_layout_node at slot.first
2908// has the requested binding at slot.second and return ptr to that binding
Mark Lobodzinskica6ebe32019-04-25 11:43:37 -06002909static VkDescriptorSetLayoutBinding const *GetDescriptorBinding(PIPELINE_LAYOUT_STATE const *pipelineLayout,
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06002910 descriptor_slot_t slot) {
Chris Forbes47567b72017-06-09 12:09:45 -07002911 if (!pipelineLayout) return nullptr;
2912
2913 if (slot.first >= pipelineLayout->set_layouts.size()) return nullptr;
2914
2915 return pipelineLayout->set_layouts[slot.first]->GetDescriptorSetLayoutBindingPtrFromBinding(slot.second);
2916}
2917
Sam Wallsd7ab6db2020-06-19 20:41:54 +01002918int32_t GetShaderResourceDimensionality(const SHADER_MODULE_STATE *module, const interface_var &resource) {
2919 if (module == nullptr) return -1;
2920
2921 auto type = module->get_def(resource.type_id);
2922 while (true) {
2923 switch (type.opcode()) {
2924 case spv::OpTypeSampledImage:
2925 type = module->get_def(type.word(2));
2926 break;
2927 case spv::OpTypePointer:
2928 type = module->get_def(type.word(3));
2929 break;
2930 case spv::OpTypeImage:
2931 return type.word(3);
2932 default:
2933 return -1;
2934 }
2935 }
2936}
2937
2938bool FindLocalSize(SHADER_MODULE_STATE const *src, uint32_t &local_size_x, uint32_t &local_size_y, uint32_t &local_size_z) {
Locke1ec6d952019-04-02 11:57:21 -06002939 for (auto insn : *src) {
2940 if (insn.opcode() == spv::OpEntryPoint) {
2941 auto executionModel = insn.word(1);
2942 auto entrypointStageBits = ExecutionModelToShaderStageFlagBits(executionModel);
2943 if (entrypointStageBits == VK_SHADER_STAGE_COMPUTE_BIT) {
2944 auto entrypoint_id = insn.word(2);
2945 for (auto insn1 : *src) {
2946 if (insn1.opcode() == spv::OpExecutionMode && insn1.word(1) == entrypoint_id &&
2947 insn1.word(2) == spv::ExecutionModeLocalSize) {
2948 local_size_x = insn1.word(3);
2949 local_size_y = insn1.word(4);
2950 local_size_z = insn1.word(5);
2951 return true;
2952 }
2953 }
2954 }
2955 }
2956 }
2957 return false;
2958}
2959
locke-lunargd9a069d2019-09-17 01:50:19 -06002960void ProcessExecutionModes(SHADER_MODULE_STATE const *src, const spirv_inst_iter &entrypoint, PIPELINE_STATE *pipeline) {
Jeff Bolz105d6492018-09-29 15:46:44 -05002961 auto entrypoint_id = entrypoint.word(2);
Chris Forbes0771b672018-03-22 21:13:46 -07002962 bool is_point_mode = false;
2963
2964 for (auto insn : *src) {
2965 if (insn.opcode() == spv::OpExecutionMode && insn.word(1) == entrypoint_id) {
2966 switch (insn.word(2)) {
2967 case spv::ExecutionModePointMode:
2968 // In tessellation shaders, PointMode is separate and trumps the tessellation topology.
2969 is_point_mode = true;
2970 break;
2971
2972 case spv::ExecutionModeOutputPoints:
2973 pipeline->topology_at_rasterizer = VK_PRIMITIVE_TOPOLOGY_POINT_LIST;
2974 break;
2975
2976 case spv::ExecutionModeIsolines:
2977 case spv::ExecutionModeOutputLineStrip:
2978 pipeline->topology_at_rasterizer = VK_PRIMITIVE_TOPOLOGY_LINE_STRIP;
2979 break;
2980
2981 case spv::ExecutionModeTriangles:
2982 case spv::ExecutionModeQuads:
2983 case spv::ExecutionModeOutputTriangleStrip:
2984 pipeline->topology_at_rasterizer = VK_PRIMITIVE_TOPOLOGY_TRIANGLE_STRIP;
2985 break;
2986 }
2987 }
2988 }
2989
2990 if (is_point_mode) pipeline->topology_at_rasterizer = VK_PRIMITIVE_TOPOLOGY_POINT_LIST;
2991}
2992
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06002993// If PointList topology is specified in the pipeline, verify that a shader geometry stage writes PointSize
2994// o If there is only a vertex shader : gl_PointSize must be written when using points
2995// o If there is a geometry or tessellation shader:
2996// - If shaderTessellationAndGeometryPointSize feature is enabled:
2997// * gl_PointSize must be written in the final geometry stage
2998// - If shaderTessellationAndGeometryPointSize feature is disabled:
2999// * gl_PointSize must NOT be written and a default of 1.0 is assumed
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06003000bool CoreChecks::ValidatePointListShaderState(const PIPELINE_STATE *pipeline, SHADER_MODULE_STATE const *src,
John Zulaufac4c6e12019-07-01 16:05:58 -06003001 spirv_inst_iter entrypoint, VkShaderStageFlagBits stage) const {
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003002 if (pipeline->topology_at_rasterizer != VK_PRIMITIVE_TOPOLOGY_POINT_LIST) {
3003 return false;
3004 }
3005
3006 bool pointsize_written = false;
3007 bool skip = false;
3008
3009 // Search for PointSize built-in decorations
3010 std::vector<uint32_t> pointsize_builtin_offsets;
3011 spirv_inst_iter insn = entrypoint;
3012 while (!pointsize_written && (insn.opcode() != spv::OpFunction)) {
3013 if (insn.opcode() == spv::OpMemberDecorate) {
3014 if (insn.word(3) == spv::DecorationBuiltIn) {
3015 if (insn.word(4) == spv::BuiltInPointSize) {
3016 pointsize_written = IsPointSizeWritten(src, insn, entrypoint);
3017 }
3018 }
3019 } else if (insn.opcode() == spv::OpDecorate) {
3020 if (insn.word(2) == spv::DecorationBuiltIn) {
3021 if (insn.word(3) == spv::BuiltInPointSize) {
3022 pointsize_written = IsPointSizeWritten(src, insn, entrypoint);
3023 }
3024 }
3025 }
3026
3027 insn++;
3028 }
3029
3030 if ((stage == VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT || stage == VK_SHADER_STAGE_GEOMETRY_BIT) &&
Mark Lobodzinskid7b03cc2019-04-19 14:23:10 -06003031 !enabled_features.core.shaderTessellationAndGeometryPointSize) {
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003032 if (pointsize_written) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003033 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_PointSizeBuiltInOverSpecified,
3034 "Pipeline topology is set to POINT_LIST and geometry or tessellation shaders write PointSize which "
3035 "is prohibited when the shaderTessellationAndGeometryPointSize feature is not enabled.");
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003036 }
3037 } else if (!pointsize_written) {
3038 skip |=
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003039 LogError(pipeline->pipeline, kVUID_Core_Shader_MissingPointSizeBuiltIn,
3040 "Pipeline topology is set to POINT_LIST, but PointSize is not written to in the shader corresponding to %s.",
3041 string_VkShaderStageFlagBits(stage));
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003042 }
3043 return skip;
3044}
John Zulauf14c355b2019-06-27 16:09:37 -06003045
3046bool CoreChecks::ValidatePipelineShaderStage(VkPipelineShaderStageCreateInfo const *pStage, const PIPELINE_STATE *pipeline,
3047 const PIPELINE_STATE::StageState &stage_state, const SHADER_MODULE_STATE *module,
John Zulaufac4c6e12019-07-01 16:05:58 -06003048 const spirv_inst_iter &entrypoint, bool check_point_size) const {
John Zulauf14c355b2019-06-27 16:09:37 -06003049 bool skip = false;
3050
3051 // Check the module
3052 if (!module->has_valid_spirv) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003053 skip |= LogError(device, "VUID-VkPipelineShaderStageCreateInfo-module-parameter",
3054 "%s does not contain valid spirv for stage %s.",
3055 report_data->FormatHandle(module->vk_shader_module).c_str(), string_VkShaderStageFlagBits(pStage->stage));
John Zulauf14c355b2019-06-27 16:09:37 -06003056 }
3057
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003058 // If specialization-constant values are given and specialization-constant instructions are present in the shader, the
3059 // specializations should be applied and validated.
3060 if (pStage->pSpecializationInfo != nullptr && pStage->pSpecializationInfo->mapEntryCount > 0 &&
3061 pStage->pSpecializationInfo->pMapEntries != nullptr && module->has_specialization_constants) {
3062 // Gather the specialization-constant values.
3063 auto const &specialization_info = pStage->pSpecializationInfo;
Jeremy Hayes521221d2020-01-15 16:48:49 -07003064 auto const &specialization_data = reinterpret_cast<uint8_t const *>(specialization_info->pData);
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003065 std::unordered_map<uint32_t, std::vector<uint32_t>> id_value_map;
3066 id_value_map.reserve(specialization_info->mapEntryCount);
3067 for (auto i = 0u; i < specialization_info->mapEntryCount; ++i) {
3068 auto const &map_entry = specialization_info->pMapEntries[i];
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003069
Jeremy Hayes521221d2020-01-15 16:48:49 -07003070 // Expect only scalar types.
3071 assert(map_entry.size == 1 || map_entry.size == 2 || map_entry.size == 4 || map_entry.size == 8);
3072 auto entry = id_value_map.emplace(map_entry.constantID, std::vector<uint32_t>(map_entry.size > 4 ? 2 : 1));
3073 memcpy(entry.first->second.data(), specialization_data + map_entry.offset, map_entry.size);
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003074 }
3075
3076 // Apply the specialization-constant values and revalidate the shader module.
Tony-LunarG8a51b7d2020-07-01 15:57:23 -06003077 spv_target_env spirv_environment = PickSpirvEnv(api_version, (device_extensions.vk_khr_spirv_1_4 != kNotEnabled));
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003078 spvtools::Optimizer optimizer(spirv_environment);
3079 spvtools::MessageConsumer consumer = [&skip, &module, &pStage, this](spv_message_level_t level, const char *source,
3080 const spv_position_t &position, const char *message) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003081 skip |= LogError(
3082 device, "VUID-VkPipelineShaderStageCreateInfo-module-parameter", "%s does not contain valid spirv for stage %s. %s",
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003083 report_data->FormatHandle(module->vk_shader_module).c_str(), string_VkShaderStageFlagBits(pStage->stage), message);
3084 };
3085 optimizer.SetMessageConsumer(consumer);
3086 optimizer.RegisterPass(spvtools::CreateSetSpecConstantDefaultValuePass(id_value_map));
3087 optimizer.RegisterPass(spvtools::CreateFreezeSpecConstantValuePass());
3088 std::vector<uint32_t> specialized_spirv;
3089 auto const optimized =
3090 optimizer.Run(module->words.data(), module->words.size(), &specialized_spirv, spvtools::ValidatorOptions(), true);
3091 assert(optimized == true);
3092
3093 if (optimized) {
3094 spv_context ctx = spvContextCreate(spirv_environment);
3095 spv_const_binary_t binary{specialized_spirv.data(), specialized_spirv.size()};
3096 spv_diagnostic diag = nullptr;
Tony-LunarG9fe69a42020-07-23 15:09:37 -06003097 spvtools::ValidatorOptions options;
3098 AdjustValidatorOptions(device_extensions, enabled_features, options);
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003099 auto const spv_valid = spvValidateWithOptions(ctx, options, &binary, &diag);
3100 if (spv_valid != SPV_SUCCESS) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003101 skip |= LogError(device, "VUID-VkPipelineShaderStageCreateInfo-module-parameter",
3102 "After specialization was applied, %s does not contain valid spirv for stage %s.",
3103 report_data->FormatHandle(module->vk_shader_module).c_str(),
3104 string_VkShaderStageFlagBits(pStage->stage));
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003105 }
3106
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003107 spvDiagnosticDestroy(diag);
3108 spvContextDestroy(ctx);
3109 }
3110 }
3111
John Zulauf14c355b2019-06-27 16:09:37 -06003112 // Check the entrypoint
3113 if (entrypoint == module->end()) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003114 skip |=
3115 LogError(device, "VUID-VkPipelineShaderStageCreateInfo-pName-00707", "No entrypoint found named `%s` for stage %s..",
3116 pStage->pName, string_VkShaderStageFlagBits(pStage->stage));
John Zulauf14c355b2019-06-27 16:09:37 -06003117 }
3118 if (skip) return true; // no point continuing beyond here, any analysis is just going to be garbage.
3119
3120 // Mark accessible ids
3121 auto &accessible_ids = stage_state.accessible_ids;
3122
Chris Forbes47567b72017-06-09 12:09:45 -07003123 // Validate descriptor set layout against what the entrypoint actually uses
John Zulauf14c355b2019-06-27 16:09:37 -06003124 bool has_writable_descriptor = stage_state.has_writable_descriptor;
3125 auto &descriptor_uses = stage_state.descriptor_uses;
Chris Forbes47567b72017-06-09 12:09:45 -07003126
Chris Forbes349b3132018-03-07 11:38:08 -08003127 // Validate shader capabilities against enabled device features
Jeff Bolzee743412019-06-20 22:24:32 -05003128 skip |= ValidateShaderCapabilities(module, pStage->stage);
3129 skip |= ValidateShaderStageWritableDescriptor(pStage->stage, has_writable_descriptor);
Jeff Bolze9ee3d82019-05-29 13:45:13 -05003130 skip |= ValidateShaderStageInputOutputLimits(module, pStage, pipeline, entrypoint);
sfricke-samsungdc96f302020-03-18 20:42:10 -07003131 skip |= ValidateShaderStageMaxResources(pStage->stage, pipeline);
Jeff Bolz526f2d52019-09-18 13:18:08 -05003132 skip |= ValidateShaderStageGroupNonUniform(module, pStage->stage);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00003133 skip |= ValidateExecutionModes(module, entrypoint);
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07003134 skip |= ValidateSpecializationOffsets(pStage);
3135 skip |= ValidatePushConstantUsage(pipeline->pipeline_layout->push_constant_ranges.get(), module, accessible_ids, pStage->stage);
Jeff Bolze54ae892018-09-08 12:16:29 -05003136 if (check_point_size && !pipeline->graphicsPipelineCI.pRasterizationState->rasterizerDiscardEnable) {
Mark Lobodzinski518eadc2019-03-09 12:07:30 -07003137 skip |= ValidatePointListShaderState(pipeline, module, entrypoint, pStage->stage);
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003138 }
Jeff Bolze4356752019-03-07 11:23:46 -06003139 skip |= ValidateCooperativeMatrix(module, pStage, pipeline);
Chris Forbes47567b72017-06-09 12:09:45 -07003140
locke-lunarg9a16ebb2020-07-30 16:56:33 -06003141 std::string vuid_layout_mismatch;
3142 if (pipeline->graphicsPipelineCI.sType == VK_STRUCTURE_TYPE_GRAPHICS_PIPELINE_CREATE_INFO) {
3143 vuid_layout_mismatch = "VUID-VkGraphicsPipelineCreateInfo-layout-00756";
3144 } else if (pipeline->computePipelineCI.sType == VK_STRUCTURE_TYPE_COMPUTE_PIPELINE_CREATE_INFO) {
3145 vuid_layout_mismatch = "VUID-VkComputePipelineCreateInfo-layout-00703";
3146 } else if (pipeline->raytracingPipelineCI.sType == VK_STRUCTURE_TYPE_RAY_TRACING_PIPELINE_CREATE_INFO_KHR) {
3147 vuid_layout_mismatch = "VUID-VkRayTracingPipelineCreateInfoKHR-layout-03427";
3148 } else if (pipeline->raytracingPipelineCI.sType == VK_STRUCTURE_TYPE_RAY_TRACING_PIPELINE_CREATE_INFO_NV) {
3149 vuid_layout_mismatch = "VUID-VkRayTracingPipelineCreateInfoNV-layout-03427";
3150 }
3151
Chris Forbes47567b72017-06-09 12:09:45 -07003152 // Validate descriptor use
3153 for (auto use : descriptor_uses) {
Chris Forbes47567b72017-06-09 12:09:45 -07003154 // Verify given pipelineLayout has requested setLayout with requested binding
Jeff Bolze7fc67b2019-10-04 12:29:31 -05003155 const auto &binding = GetDescriptorBinding(pipeline->pipeline_layout.get(), use.first);
Chris Forbes47567b72017-06-09 12:09:45 -07003156 unsigned required_descriptor_count;
Jeff Bolze54ae892018-09-08 12:16:29 -05003157 std::set<uint32_t> descriptor_types = TypeToDescriptorTypeSet(module, use.second.type_id, required_descriptor_count);
Chris Forbes47567b72017-06-09 12:09:45 -07003158
3159 if (!binding) {
locke-lunarg9a16ebb2020-07-30 16:56:33 -06003160 skip |= LogError(device, vuid_layout_mismatch,
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003161 "Shader uses descriptor slot %u.%u (expected `%s`) but not declared in pipeline layout",
3162 use.first.first, use.first.second, string_descriptorTypes(descriptor_types).c_str());
Chris Forbes47567b72017-06-09 12:09:45 -07003163 } else if (~binding->stageFlags & pStage->stage) {
locke-lunarg9a16ebb2020-07-30 16:56:33 -06003164 skip |= LogError(device, vuid_layout_mismatch,
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003165 "Shader uses descriptor slot %u.%u but descriptor not accessible from stage %s", use.first.first,
3166 use.first.second, string_VkShaderStageFlagBits(pStage->stage));
Jeff Bolze54ae892018-09-08 12:16:29 -05003167 } else if (descriptor_types.find(binding->descriptorType) == descriptor_types.end()) {
locke-lunarg9a16ebb2020-07-30 16:56:33 -06003168 skip |= LogError(device, vuid_layout_mismatch,
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003169 "Type mismatch on descriptor slot %u.%u (expected `%s`) but descriptor of type %s", use.first.first,
3170 use.first.second, string_descriptorTypes(descriptor_types).c_str(),
3171 string_VkDescriptorType(binding->descriptorType));
Chris Forbes47567b72017-06-09 12:09:45 -07003172 } else if (binding->descriptorCount < required_descriptor_count) {
locke-lunarg9a16ebb2020-07-30 16:56:33 -06003173 skip |= LogError(device, vuid_layout_mismatch,
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003174 "Shader expects at least %u descriptors for binding %u.%u but only %u provided",
3175 required_descriptor_count, use.first.first, use.first.second, binding->descriptorCount);
Chris Forbes47567b72017-06-09 12:09:45 -07003176 }
3177 }
3178
3179 // Validate use of input attachments against subpass structure
3180 if (pStage->stage == VK_SHADER_STAGE_FRAGMENT_BIT) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003181 auto input_attachment_uses = CollectInterfaceByInputAttachmentIndex(module, accessible_ids);
Chris Forbes47567b72017-06-09 12:09:45 -07003182
Petr Krause91f7a12017-12-14 20:57:36 +01003183 auto rpci = pipeline->rp_state->createInfo.ptr();
Chris Forbes47567b72017-06-09 12:09:45 -07003184 auto subpass = pipeline->graphicsPipelineCI.subpass;
3185
3186 for (auto use : input_attachment_uses) {
3187 auto input_attachments = rpci->pSubpasses[subpass].pInputAttachments;
3188 auto index = (input_attachments && use.first < rpci->pSubpasses[subpass].inputAttachmentCount)
Dave Houltona9df0ce2018-02-07 10:51:23 -07003189 ? input_attachments[use.first].attachment
3190 : VK_ATTACHMENT_UNUSED;
Chris Forbes47567b72017-06-09 12:09:45 -07003191
3192 if (index == VK_ATTACHMENT_UNUSED) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003193 skip |= LogError(device, kVUID_Core_Shader_MissingInputAttachment,
3194 "Shader consumes input attachment index %d but not provided in subpass", use.first);
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003195 } else if (!(GetFormatType(rpci->pAttachments[index].format) & GetFundamentalType(module, use.second.type_id))) {
Chris Forbes47567b72017-06-09 12:09:45 -07003196 skip |=
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003197 LogError(device, kVUID_Core_Shader_InputAttachmentTypeMismatch,
3198 "Subpass input attachment %u format of %s does not match type used in shader `%s`", use.first,
3199 string_VkFormat(rpci->pAttachments[index].format), DescribeType(module, use.second.type_id).c_str());
Chris Forbes47567b72017-06-09 12:09:45 -07003200 }
3201 }
3202 }
Lockeaa8fdc02019-04-02 11:59:20 -06003203 if (pStage->stage == VK_SHADER_STAGE_COMPUTE_BIT) {
3204 skip |= ValidateComputeWorkGroupSizes(module);
3205 }
Chris Forbes47567b72017-06-09 12:09:45 -07003206 return skip;
3207}
3208
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07003209bool CoreChecks::ValidateInterfaceBetweenStages(SHADER_MODULE_STATE const *producer, spirv_inst_iter producer_entrypoint,
3210 shader_stage_attributes const *producer_stage, SHADER_MODULE_STATE const *consumer,
3211 spirv_inst_iter consumer_entrypoint,
3212 shader_stage_attributes const *consumer_stage) const {
Chris Forbes47567b72017-06-09 12:09:45 -07003213 bool skip = false;
3214
3215 auto outputs =
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003216 CollectInterfaceByLocation(producer, producer_entrypoint, spv::StorageClassOutput, producer_stage->arrayed_output);
3217 auto inputs = CollectInterfaceByLocation(consumer, consumer_entrypoint, spv::StorageClassInput, consumer_stage->arrayed_input);
Chris Forbes47567b72017-06-09 12:09:45 -07003218
3219 auto a_it = outputs.begin();
3220 auto b_it = inputs.begin();
3221
3222 // Maps sorted by key (location); walk them together to find mismatches
3223 while ((outputs.size() > 0 && a_it != outputs.end()) || (inputs.size() && b_it != inputs.end())) {
3224 bool a_at_end = outputs.size() == 0 || a_it == outputs.end();
3225 bool b_at_end = inputs.size() == 0 || b_it == inputs.end();
3226 auto a_first = a_at_end ? std::make_pair(0u, 0u) : a_it->first;
3227 auto b_first = b_at_end ? std::make_pair(0u, 0u) : b_it->first;
3228
3229 if (b_at_end || ((!a_at_end) && (a_first < b_first))) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003230 skip |= LogPerformanceWarning(producer->vk_shader_module, kVUID_Core_Shader_OutputNotConsumed,
3231 "%s writes to output location %u.%u which is not consumed by %s", producer_stage->name,
3232 a_first.first, a_first.second, consumer_stage->name);
Chris Forbes47567b72017-06-09 12:09:45 -07003233 a_it++;
3234 } else if (a_at_end || a_first > b_first) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003235 skip |= LogError(consumer->vk_shader_module, kVUID_Core_Shader_InputNotProduced,
3236 "%s consumes input location %u.%u which is not written by %s", consumer_stage->name, b_first.first,
3237 b_first.second, producer_stage->name);
Chris Forbes47567b72017-06-09 12:09:45 -07003238 b_it++;
3239 } else {
3240 // subtleties of arrayed interfaces:
3241 // - if is_patch, then the member is not arrayed, even though the interface may be.
3242 // - if is_block_member, then the extra array level of an arrayed interface is not
3243 // expressed in the member type -- it's expressed in the block type.
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003244 if (!TypesMatch(producer, consumer, a_it->second.type_id, b_it->second.type_id,
3245 producer_stage->arrayed_output && !a_it->second.is_patch && !a_it->second.is_block_member,
3246 consumer_stage->arrayed_input && !b_it->second.is_patch && !b_it->second.is_block_member, true)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003247 skip |= LogError(producer->vk_shader_module, kVUID_Core_Shader_InterfaceTypeMismatch,
3248 "Type mismatch on location %u.%u: '%s' vs '%s'", a_first.first, a_first.second,
3249 DescribeType(producer, a_it->second.type_id).c_str(),
3250 DescribeType(consumer, b_it->second.type_id).c_str());
Chris Forbes47567b72017-06-09 12:09:45 -07003251 }
3252 if (a_it->second.is_patch != b_it->second.is_patch) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003253 skip |= LogError(producer->vk_shader_module, kVUID_Core_Shader_InterfaceTypeMismatch,
3254 "Decoration mismatch on location %u.%u: is per-%s in %s stage but per-%s in %s stage",
3255 a_first.first, a_first.second, a_it->second.is_patch ? "patch" : "vertex", producer_stage->name,
3256 b_it->second.is_patch ? "patch" : "vertex", consumer_stage->name);
Chris Forbes47567b72017-06-09 12:09:45 -07003257 }
3258 if (a_it->second.is_relaxed_precision != b_it->second.is_relaxed_precision) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003259 skip |= LogError(producer->vk_shader_module, kVUID_Core_Shader_InterfaceTypeMismatch,
3260 "Decoration mismatch on location %u.%u: %s and %s stages differ in precision", a_first.first,
3261 a_first.second, producer_stage->name, consumer_stage->name);
Chris Forbes47567b72017-06-09 12:09:45 -07003262 }
3263 a_it++;
3264 b_it++;
3265 }
3266 }
3267
Ari Suonpaa696b3432019-03-11 14:02:57 +02003268 if (consumer_stage->stage != VK_SHADER_STAGE_FRAGMENT_BIT) {
3269 auto builtins_producer = CollectBuiltinBlockMembers(producer, producer_entrypoint, spv::StorageClassOutput);
3270 auto builtins_consumer = CollectBuiltinBlockMembers(consumer, consumer_entrypoint, spv::StorageClassInput);
3271
3272 if (!builtins_producer.empty() && !builtins_consumer.empty()) {
3273 if (builtins_producer.size() != builtins_consumer.size()) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003274 skip |= LogError(producer->vk_shader_module, kVUID_Core_Shader_InterfaceTypeMismatch,
3275 "Number of elements inside builtin block differ between stages (%s %d vs %s %d).",
3276 producer_stage->name, (int)builtins_producer.size(), consumer_stage->name,
3277 (int)builtins_consumer.size());
Ari Suonpaa696b3432019-03-11 14:02:57 +02003278 } else {
3279 auto it_producer = builtins_producer.begin();
3280 auto it_consumer = builtins_consumer.begin();
3281 while (it_producer != builtins_producer.end() && it_consumer != builtins_consumer.end()) {
3282 if (*it_producer != *it_consumer) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003283 skip |= LogError(producer->vk_shader_module, kVUID_Core_Shader_InterfaceTypeMismatch,
3284 "Builtin variable inside block doesn't match between %s and %s.", producer_stage->name,
3285 consumer_stage->name);
Ari Suonpaa696b3432019-03-11 14:02:57 +02003286 break;
3287 }
3288 it_producer++;
3289 it_consumer++;
3290 }
3291 }
3292 }
3293 }
3294
Chris Forbes47567b72017-06-09 12:09:45 -07003295 return skip;
3296}
3297
John Zulauf14c355b2019-06-27 16:09:37 -06003298static inline uint32_t DetermineFinalGeomStage(const PIPELINE_STATE *pipeline, const VkGraphicsPipelineCreateInfo *pCreateInfo) {
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003299 uint32_t stage_mask = 0;
3300 if (pipeline->topology_at_rasterizer == VK_PRIMITIVE_TOPOLOGY_POINT_LIST) {
3301 for (uint32_t i = 0; i < pCreateInfo->stageCount; i++) {
3302 stage_mask |= pCreateInfo->pStages[i].stage;
3303 }
3304 // Determine which shader in which PointSize should be written (the final geometry stage)
Jeff Bolz105d6492018-09-29 15:46:44 -05003305 if (stage_mask & VK_SHADER_STAGE_MESH_BIT_NV) {
3306 stage_mask = VK_SHADER_STAGE_MESH_BIT_NV;
3307 } else if (stage_mask & VK_SHADER_STAGE_GEOMETRY_BIT) {
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003308 stage_mask = VK_SHADER_STAGE_GEOMETRY_BIT;
3309 } else if (stage_mask & VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT) {
3310 stage_mask = VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT;
3311 } else if (stage_mask & VK_SHADER_STAGE_VERTEX_BIT) {
3312 stage_mask = VK_SHADER_STAGE_VERTEX_BIT;
Mark Lobodzinski2c984cc2018-07-31 09:57:46 -06003313 }
3314 }
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003315 return stage_mask;
Mark Lobodzinski2c984cc2018-07-31 09:57:46 -06003316}
3317
Chris Forbes47567b72017-06-09 12:09:45 -07003318// Validate that the shaders used by the given pipeline and store the active_slots
3319// that are actually used by the pipeline into pPipeline->active_slots
John Zulaufac4c6e12019-07-01 16:05:58 -06003320bool CoreChecks::ValidateGraphicsPipelineShaderState(const PIPELINE_STATE *pipeline) const {
Chris Forbesa400a8a2017-07-20 13:10:24 -07003321 auto pCreateInfo = pipeline->graphicsPipelineCI.ptr();
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003322 int vertex_stage = GetShaderStageId(VK_SHADER_STAGE_VERTEX_BIT);
3323 int fragment_stage = GetShaderStageId(VK_SHADER_STAGE_FRAGMENT_BIT);
Chris Forbes47567b72017-06-09 12:09:45 -07003324
John Zulauf14c355b2019-06-27 16:09:37 -06003325 const SHADER_MODULE_STATE *shaders[32];
Chris Forbes47567b72017-06-09 12:09:45 -07003326 memset(shaders, 0, sizeof(shaders));
Jeff Bolz7e35c392018-09-04 15:30:41 -05003327 spirv_inst_iter entrypoints[32];
Chris Forbes47567b72017-06-09 12:09:45 -07003328 memset(entrypoints, 0, sizeof(entrypoints));
3329 bool skip = false;
3330
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003331 uint32_t pointlist_stage_mask = DetermineFinalGeomStage(pipeline, pCreateInfo);
3332
Chris Forbes47567b72017-06-09 12:09:45 -07003333 for (uint32_t i = 0; i < pCreateInfo->stageCount; i++) {
3334 auto pStage = &pCreateInfo->pStages[i];
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003335 auto stage_id = GetShaderStageId(pStage->stage);
John Zulauf14c355b2019-06-27 16:09:37 -06003336 shaders[stage_id] = GetShaderModuleState(pStage->module);
3337 entrypoints[stage_id] = FindEntrypoint(shaders[stage_id], pStage->pName, pStage->stage);
3338 skip |= ValidatePipelineShaderStage(pStage, pipeline, pipeline->stage_state[i], shaders[stage_id], entrypoints[stage_id],
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003339 (pointlist_stage_mask == pStage->stage));
Chris Forbes47567b72017-06-09 12:09:45 -07003340 }
3341
3342 // if the shader stages are no good individually, cross-stage validation is pointless.
3343 if (skip) return true;
3344
3345 auto vi = pCreateInfo->pVertexInputState;
3346
3347 if (vi) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07003348 skip |= ValidateViConsistency(vi);
Chris Forbes47567b72017-06-09 12:09:45 -07003349 }
3350
3351 if (shaders[vertex_stage] && shaders[vertex_stage]->has_valid_spirv) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07003352 skip |= ValidateViAgainstVsInputs(vi, shaders[vertex_stage], entrypoints[vertex_stage]);
Chris Forbes47567b72017-06-09 12:09:45 -07003353 }
3354
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003355 int producer = GetShaderStageId(VK_SHADER_STAGE_VERTEX_BIT);
3356 int consumer = GetShaderStageId(VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT);
Chris Forbes47567b72017-06-09 12:09:45 -07003357
3358 while (!shaders[producer] && producer != fragment_stage) {
3359 producer++;
3360 consumer++;
3361 }
3362
3363 for (; producer != fragment_stage && consumer <= fragment_stage; consumer++) {
3364 assert(shaders[producer]);
Chris Forbesdbb43fc2018-02-16 16:59:23 -08003365 if (shaders[consumer]) {
3366 if (shaders[consumer]->has_valid_spirv && shaders[producer]->has_valid_spirv) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07003367 skip |= ValidateInterfaceBetweenStages(shaders[producer], entrypoints[producer], &shader_stage_attribs[producer],
3368 shaders[consumer], entrypoints[consumer], &shader_stage_attribs[consumer]);
Chris Forbesdbb43fc2018-02-16 16:59:23 -08003369 }
Chris Forbes47567b72017-06-09 12:09:45 -07003370
3371 producer = consumer;
3372 }
3373 }
3374
3375 if (shaders[fragment_stage] && shaders[fragment_stage]->has_valid_spirv) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07003376 skip |= ValidateFsOutputsAgainstRenderPass(shaders[fragment_stage], entrypoints[fragment_stage], pipeline,
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003377 pCreateInfo->subpass);
Chris Forbes47567b72017-06-09 12:09:45 -07003378 }
3379
3380 return skip;
3381}
3382
sfricke-samsunge72a85e2020-02-29 21:48:37 -08003383bool CoreChecks::ValidateComputePipelineShaderState(PIPELINE_STATE *pipeline) const {
John Zulauf14c355b2019-06-27 16:09:37 -06003384 const auto &stage = *pipeline->computePipelineCI.stage.ptr();
Chris Forbes47567b72017-06-09 12:09:45 -07003385
John Zulauf14c355b2019-06-27 16:09:37 -06003386 const SHADER_MODULE_STATE *module = GetShaderModuleState(stage.module);
3387 const spirv_inst_iter entrypoint = FindEntrypoint(module, stage.pName, stage.stage);
Chris Forbes47567b72017-06-09 12:09:45 -07003388
John Zulauf14c355b2019-06-27 16:09:37 -06003389 return ValidatePipelineShaderStage(&stage, pipeline, pipeline->stage_state[0], module, entrypoint, false);
Chris Forbes47567b72017-06-09 12:09:45 -07003390}
Chris Forbes4ae55b32017-06-09 14:42:56 -07003391
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003392bool CoreChecks::ValidateRayTracingPipeline(PIPELINE_STATE *pipeline, bool isKHR) const {
John Zulaufe4474e72019-07-01 17:28:27 -06003393 bool skip = false;
Jason Macnak15f95e82019-08-21 21:52:02 -04003394
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003395 if (isKHR) {
3396 if (pipeline->raytracingPipelineCI.maxRecursionDepth > phys_dev_ext_props.ray_tracing_propsKHR.maxRecursionDepth) {
3397 skip |= LogError(device, "VUID-VkRayTracingPipelineCreateInfoKHR-maxRecursionDepth-03464", ": %d > %d",
3398 pipeline->raytracingPipelineCI.maxRecursionDepth,
3399 phys_dev_ext_props.ray_tracing_propsKHR.maxRecursionDepth);
3400 }
sourav parmar83c31b12020-05-06 12:30:54 -07003401 for (uint32_t i = 0; i < pipeline->raytracingPipelineCI.libraries.libraryCount; ++i) {
3402 const PIPELINE_STATE *pLibrary_pipelinestate = GetPipelineState(pipeline->raytracingPipelineCI.libraries.pLibraries[i]);
3403 if (pLibrary_pipelinestate->raytracingPipelineCI.maxRecursionDepth !=
3404 pipeline->raytracingPipelineCI.maxRecursionDepth) {
3405 skip |= LogError(
3406 device, "VUID-VkRayTracingPipelineCreateInfoKHR-pLibraries-03467",
3407 "vkCreateRayTracingPipelinesKHR: Each element (%d) of the pLibraries member of libraries must have been"
3408 "created with the value of maxRecursionDepth (%d) equal to that in this pipeline (%d) .",
3409 i, pLibrary_pipelinestate->raytracingPipelineCI.maxRecursionDepth,
3410 pipeline->raytracingPipelineCI.maxRecursionDepth);
3411 }
3412 if (pLibrary_pipelinestate->raytracingPipelineCI.pLibraryInterface->maxAttributeSize !=
3413 pipeline->raytracingPipelineCI.pLibraryInterface->maxAttributeSize ||
3414 pLibrary_pipelinestate->raytracingPipelineCI.pLibraryInterface->maxPayloadSize !=
3415 pipeline->raytracingPipelineCI.pLibraryInterface->maxPayloadSize ||
3416 pLibrary_pipelinestate->raytracingPipelineCI.pLibraryInterface->maxCallableSize !=
3417 pipeline->raytracingPipelineCI.pLibraryInterface->maxCallableSize) {
3418 skip |=
3419 LogError(device, "VUID-VkRayTracingPipelineCreateInfoKHR-pLibraries-03469",
3420 "vkCreateRayTracingPipelinesKHR: Each element of the pLibraries member of libraries must have been "
3421 "created with values of the maxPayloadSize,"
3422 "maxAttributeSize, and maxCallableSize members of pLibraryInterface equal to those in this pipeline.");
3423 }
3424 }
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003425 } else {
3426 if (pipeline->raytracingPipelineCI.maxRecursionDepth > phys_dev_ext_props.ray_tracing_propsNV.maxRecursionDepth) {
3427 skip |= LogError(device, "VUID-VkRayTracingPipelineCreateInfoNV-maxRecursionDepth-03457", ": %d > %d",
3428 pipeline->raytracingPipelineCI.maxRecursionDepth,
3429 phys_dev_ext_props.ray_tracing_propsNV.maxRecursionDepth);
3430 }
Jason Macnak15f95e82019-08-21 21:52:02 -04003431 }
Jason Macnak15f95e82019-08-21 21:52:02 -04003432 const auto *stages = pipeline->raytracingPipelineCI.ptr()->pStages;
3433 const auto *groups = pipeline->raytracingPipelineCI.ptr()->pGroups;
3434
3435 uint32_t raygen_stages_found = 0;
John Zulaufe4474e72019-07-01 17:28:27 -06003436 for (uint32_t stage_index = 0; stage_index < pipeline->raytracingPipelineCI.stageCount; stage_index++) {
Jason Macnak15f95e82019-08-21 21:52:02 -04003437 const auto &stage = stages[stage_index];
Jeff Bolzfbe51582018-09-13 10:01:35 -05003438
John Zulaufe4474e72019-07-01 17:28:27 -06003439 const SHADER_MODULE_STATE *module = GetShaderModuleState(stage.module);
3440 const spirv_inst_iter entrypoint = FindEntrypoint(module, stage.pName, stage.stage);
Jeff Bolzfbe51582018-09-13 10:01:35 -05003441
John Zulaufe4474e72019-07-01 17:28:27 -06003442 skip |= ValidatePipelineShaderStage(&stage, pipeline, pipeline->stage_state[stage_index], module, entrypoint, false);
Jason Macnak15f95e82019-08-21 21:52:02 -04003443
3444 if (stage.stage == VK_SHADER_STAGE_RAYGEN_BIT_NV) {
3445 raygen_stages_found++;
3446 }
3447 }
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003448 if (raygen_stages_found == 0) {
3449 skip |= LogError(
3450 device,
3451 isKHR ? "VUID-VkRayTracingPipelineCreateInfoKHR-stage-03425" : "VUID-VkRayTracingPipelineCreateInfoNV-stage-03425",
3452 " : zero raygen stages specified");
Jason Macnak15f95e82019-08-21 21:52:02 -04003453 }
3454
3455 for (uint32_t group_index = 0; group_index < pipeline->raytracingPipelineCI.groupCount; group_index++) {
3456 const auto &group = groups[group_index];
3457
3458 if (group.type == VK_RAY_TRACING_SHADER_GROUP_TYPE_GENERAL_NV) {
3459 if (group.generalShader >= pipeline->raytracingPipelineCI.stageCount ||
3460 (stages[group.generalShader].stage != VK_SHADER_STAGE_RAYGEN_BIT_NV &&
3461 stages[group.generalShader].stage != VK_SHADER_STAGE_MISS_BIT_NV &&
3462 stages[group.generalShader].stage != VK_SHADER_STAGE_CALLABLE_BIT_NV)) {
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003463 skip |= LogError(device,
3464 isKHR ? "VUID-VkRayTracingShaderGroupCreateInfoKHR-type-03474"
3465 : "VUID-VkRayTracingShaderGroupCreateInfoNV-type-02413",
3466 ": pGroups[%d]", group_index);
Jason Macnak15f95e82019-08-21 21:52:02 -04003467 }
3468 if (group.anyHitShader != VK_SHADER_UNUSED_NV || group.closestHitShader != VK_SHADER_UNUSED_NV ||
3469 group.intersectionShader != VK_SHADER_UNUSED_NV) {
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003470 skip |= LogError(device,
3471 isKHR ? "VUID-VkRayTracingShaderGroupCreateInfoKHR-type-03475"
3472 : "VUID-VkRayTracingShaderGroupCreateInfoNV-type-02414",
3473 ": pGroups[%d]", group_index);
Jason Macnak15f95e82019-08-21 21:52:02 -04003474 }
3475 } else if (group.type == VK_RAY_TRACING_SHADER_GROUP_TYPE_PROCEDURAL_HIT_GROUP_NV) {
3476 if (group.intersectionShader >= pipeline->raytracingPipelineCI.stageCount ||
3477 stages[group.intersectionShader].stage != VK_SHADER_STAGE_INTERSECTION_BIT_NV) {
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003478 skip |= LogError(device,
3479 isKHR ? "VUID-VkRayTracingShaderGroupCreateInfoKHR-type-03476"
3480 : "VUID-VkRayTracingShaderGroupCreateInfoNV-type-02415",
3481 ": pGroups[%d]", group_index);
Jason Macnak15f95e82019-08-21 21:52:02 -04003482 }
3483 } else if (group.type == VK_RAY_TRACING_SHADER_GROUP_TYPE_TRIANGLES_HIT_GROUP_NV) {
3484 if (group.intersectionShader != VK_SHADER_UNUSED_NV) {
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003485 skip |= LogError(device,
3486 isKHR ? "VUID-VkRayTracingShaderGroupCreateInfoKHR-type-03477"
3487 : "VUID-VkRayTracingShaderGroupCreateInfoNV-type-02416",
3488 ": pGroups[%d]", group_index);
Jason Macnak15f95e82019-08-21 21:52:02 -04003489 }
3490 }
3491
3492 if (group.type == VK_RAY_TRACING_SHADER_GROUP_TYPE_PROCEDURAL_HIT_GROUP_NV ||
3493 group.type == VK_RAY_TRACING_SHADER_GROUP_TYPE_TRIANGLES_HIT_GROUP_NV) {
3494 if (group.anyHitShader != VK_SHADER_UNUSED_NV && (group.anyHitShader >= pipeline->raytracingPipelineCI.stageCount ||
3495 stages[group.anyHitShader].stage != VK_SHADER_STAGE_ANY_HIT_BIT_NV)) {
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003496 skip |= LogError(device,
3497 isKHR ? "VUID-VkRayTracingShaderGroupCreateInfoKHR-anyHitShader-03479"
3498 : "VUID-VkRayTracingShaderGroupCreateInfoNV-anyHitShader-02418",
3499 ": pGroups[%d]", group_index);
Jason Macnak15f95e82019-08-21 21:52:02 -04003500 }
3501 if (group.closestHitShader != VK_SHADER_UNUSED_NV &&
3502 (group.closestHitShader >= pipeline->raytracingPipelineCI.stageCount ||
3503 stages[group.closestHitShader].stage != VK_SHADER_STAGE_CLOSEST_HIT_BIT_NV)) {
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003504 skip |= LogError(device,
3505 isKHR ? "VUID-VkRayTracingShaderGroupCreateInfoKHR-closestHitShader-03478"
3506 : "VUID-VkRayTracingShaderGroupCreateInfoNV-closestHitShader-02417",
3507 ": pGroups[%d]", group_index);
Jason Macnak15f95e82019-08-21 21:52:02 -04003508 }
3509 }
John Zulaufe4474e72019-07-01 17:28:27 -06003510 }
3511 return skip;
Jeff Bolzfbe51582018-09-13 10:01:35 -05003512}
3513
Dave Houltona9df0ce2018-02-07 10:51:23 -07003514uint32_t ValidationCache::MakeShaderHash(VkShaderModuleCreateInfo const *smci) { return XXH32(smci->pCode, smci->codeSize, 0); }
Chris Forbes9a61e082017-07-24 15:35:29 -07003515
Dave Houltona9df0ce2018-02-07 10:51:23 -07003516static ValidationCache *GetValidationCacheInfo(VkShaderModuleCreateInfo const *pCreateInfo) {
John Zulauf25ea2432019-04-05 10:07:38 -06003517 const auto validation_cache_ci = lvl_find_in_chain<VkShaderModuleValidationCacheCreateInfoEXT>(pCreateInfo->pNext);
3518 if (validation_cache_ci) {
John Zulauf146ee802019-04-05 15:31:06 -06003519 return CastFromHandle<ValidationCache *>(validation_cache_ci->validationCache);
Chris Forbes9a61e082017-07-24 15:35:29 -07003520 }
Chris Forbes9a61e082017-07-24 15:35:29 -07003521 return nullptr;
3522}
3523
Mark Lobodzinskib56bbb92019-02-18 11:49:59 -07003524bool CoreChecks::PreCallValidateCreateShaderModule(VkDevice device, const VkShaderModuleCreateInfo *pCreateInfo,
Jeff Bolz5c801d12019-10-09 10:38:45 -05003525 const VkAllocationCallbacks *pAllocator, VkShaderModule *pShaderModule) const {
Chris Forbes4ae55b32017-06-09 14:42:56 -07003526 bool skip = false;
3527 spv_result_t spv_valid = SPV_SUCCESS;
Chris Forbes4ae55b32017-06-09 14:42:56 -07003528
Mark Lobodzinski90eea5b2020-05-15 12:54:00 -06003529 if (disabled[shader_validation]) {
Chris Forbes4ae55b32017-06-09 14:42:56 -07003530 return false;
3531 }
3532
Mark Lobodzinskif45e45f2019-04-19 14:15:39 -06003533 auto have_glsl_shader = device_extensions.vk_nv_glsl_shader;
Chris Forbes4ae55b32017-06-09 14:42:56 -07003534
3535 if (!have_glsl_shader && (pCreateInfo->codeSize % 4)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003536 skip |= LogError(device, "VUID-VkShaderModuleCreateInfo-pCode-01376",
3537 "SPIR-V module not valid: Codesize must be a multiple of 4 but is " PRINTF_SIZE_T_SPECIFIER ".",
3538 pCreateInfo->codeSize);
Chris Forbes4ae55b32017-06-09 14:42:56 -07003539 } else {
Chris Forbes9a61e082017-07-24 15:35:29 -07003540 auto cache = GetValidationCacheInfo(pCreateInfo);
3541 uint32_t hash = 0;
3542 if (cache) {
3543 hash = ValidationCache::MakeShaderHash(pCreateInfo);
Dave Houltona9df0ce2018-02-07 10:51:23 -07003544 if (cache->Contains(hash)) return false;
Chris Forbes9a61e082017-07-24 15:35:29 -07003545 }
3546
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003547 // Use SPIRV-Tools validator to try and catch any issues with the module itself. If specialization constants are present,
3548 // the default values will be used during validation.
Tony-LunarG8a51b7d2020-07-01 15:57:23 -06003549 spv_target_env spirv_environment = PickSpirvEnv(api_version, (device_extensions.vk_khr_spirv_1_4 != kNotEnabled));
Dave Houlton0ea2d012018-06-21 14:00:26 -06003550 spv_context ctx = spvContextCreate(spirv_environment);
Dave Houltona9df0ce2018-02-07 10:51:23 -07003551 spv_const_binary_t binary{pCreateInfo->pCode, pCreateInfo->codeSize / sizeof(uint32_t)};
Chris Forbes4ae55b32017-06-09 14:42:56 -07003552 spv_diagnostic diag = nullptr;
Tony-LunarG9fe69a42020-07-23 15:09:37 -06003553 spvtools::ValidatorOptions options;
3554 AdjustValidatorOptions(device_extensions, enabled_features, options);
Karl Schultzfda1b382018-08-08 18:56:11 -06003555 spv_valid = spvValidateWithOptions(ctx, options, &binary, &diag);
Chris Forbes4ae55b32017-06-09 14:42:56 -07003556 if (spv_valid != SPV_SUCCESS) {
3557 if (!have_glsl_shader || (pCreateInfo->pCode[0] == spv::MagicNumber)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003558 if (spv_valid == SPV_WARNING) {
3559 skip |= LogWarning(device, kVUID_Core_Shader_InconsistentSpirv, "SPIR-V module not valid: %s",
3560 diag && diag->error ? diag->error : "(no error text)");
3561 } else {
3562 skip |= LogError(device, kVUID_Core_Shader_InconsistentSpirv, "SPIR-V module not valid: %s",
3563 diag && diag->error ? diag->error : "(no error text)");
3564 }
Chris Forbes4ae55b32017-06-09 14:42:56 -07003565 }
Chris Forbes9a61e082017-07-24 15:35:29 -07003566 } else {
3567 if (cache) {
3568 cache->Insert(hash);
3569 }
Chris Forbes4ae55b32017-06-09 14:42:56 -07003570 }
3571
3572 spvDiagnosticDestroy(diag);
3573 spvContextDestroy(ctx);
3574 }
3575
Chris Forbes4ae55b32017-06-09 14:42:56 -07003576 return skip;
Mark Lobodzinski01734072019-02-13 17:39:15 -07003577}
3578
John Zulaufac4c6e12019-07-01 16:05:58 -06003579bool CoreChecks::ValidateComputeWorkGroupSizes(const SHADER_MODULE_STATE *shader) const {
Lockeaa8fdc02019-04-02 11:59:20 -06003580 bool skip = false;
3581 uint32_t local_size_x = 0;
3582 uint32_t local_size_y = 0;
3583 uint32_t local_size_z = 0;
3584 if (FindLocalSize(shader, local_size_x, local_size_y, local_size_z)) {
3585 if (local_size_x > phys_dev_props.limits.maxComputeWorkGroupSize[0]) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003586 skip |= LogError(shader->vk_shader_module, "UNASSIGNED-features-limits-maxComputeWorkGroupSize",
3587 "%s local_size_x (%" PRIu32 ") exceeds device limit maxComputeWorkGroupSize[0] (%" PRIu32 ").",
3588 report_data->FormatHandle(shader->vk_shader_module).c_str(), local_size_x,
3589 phys_dev_props.limits.maxComputeWorkGroupSize[0]);
Lockeaa8fdc02019-04-02 11:59:20 -06003590 }
3591 if (local_size_y > phys_dev_props.limits.maxComputeWorkGroupSize[1]) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003592 skip |= LogError(shader->vk_shader_module, "UNASSIGNED-features-limits-maxComputeWorkGroupSize",
3593 "%s local_size_y (%" PRIu32 ") exceeds device limit maxComputeWorkGroupSize[1] (%" PRIu32 ").",
3594 report_data->FormatHandle(shader->vk_shader_module).c_str(), local_size_x,
3595 phys_dev_props.limits.maxComputeWorkGroupSize[1]);
Lockeaa8fdc02019-04-02 11:59:20 -06003596 }
3597 if (local_size_z > phys_dev_props.limits.maxComputeWorkGroupSize[2]) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003598 skip |= LogError(shader->vk_shader_module, "UNASSIGNED-features-limits-maxComputeWorkGroupSize",
3599 "%s local_size_z (%" PRIu32 ") exceeds device limit maxComputeWorkGroupSize[2] (%" PRIu32 ").",
3600 report_data->FormatHandle(shader->vk_shader_module).c_str(), local_size_x,
3601 phys_dev_props.limits.maxComputeWorkGroupSize[2]);
Lockeaa8fdc02019-04-02 11:59:20 -06003602 }
3603
3604 uint32_t limit = phys_dev_props.limits.maxComputeWorkGroupInvocations;
3605 uint64_t invocations = local_size_x * local_size_y;
3606 // Prevent overflow.
3607 bool fail = false;
3608 if (invocations > UINT32_MAX || invocations > limit) {
3609 fail = true;
3610 }
3611 if (!fail) {
3612 invocations *= local_size_z;
3613 if (invocations > UINT32_MAX || invocations > limit) {
3614 fail = true;
3615 }
3616 }
3617 if (fail) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003618 skip |= LogError(shader->vk_shader_module, "UNASSIGNED-features-limits-maxComputeWorkGroupInvocations",
3619 "%s local_size (%" PRIu32 ", %" PRIu32 ", %" PRIu32
3620 ") exceeds device limit maxComputeWorkGroupInvocations (%" PRIu32 ").",
3621 report_data->FormatHandle(shader->vk_shader_module).c_str(), local_size_x, local_size_y, local_size_z,
3622 limit);
Lockeaa8fdc02019-04-02 11:59:20 -06003623 }
3624 }
3625 return skip;
3626}
Tony-LunarG8a51b7d2020-07-01 15:57:23 -06003627
3628spv_target_env PickSpirvEnv(uint32_t api_version, bool spirv_1_4) {
3629 if (api_version >= VK_API_VERSION_1_2) {
3630 return SPV_ENV_VULKAN_1_2;
3631 } else if (api_version >= VK_API_VERSION_1_1) {
3632 if (spirv_1_4) {
3633 return SPV_ENV_VULKAN_1_1_SPIRV_1_4;
3634 } else {
3635 return SPV_ENV_VULKAN_1_1;
3636 }
3637 }
3638 return SPV_ENV_VULKAN_1_0;
3639}
Tony-LunarG9fe69a42020-07-23 15:09:37 -06003640
3641void AdjustValidatorOptions(const DeviceExtensions device_extensions, const DeviceFeatures enabled_features,
3642 spvtools::ValidatorOptions &options) {
3643 if (device_extensions.vk_khr_relaxed_block_layout) {
3644 options.SetRelaxBlockLayout(true);
3645 }
3646 if (device_extensions.vk_khr_uniform_buffer_standard_layout && enabled_features.core12.uniformBufferStandardLayout == VK_TRUE) {
3647 options.SetUniformBufferStandardLayout(true);
3648 }
3649 if (device_extensions.vk_ext_scalar_block_layout && enabled_features.core12.scalarBlockLayout == VK_TRUE) {
3650 options.SetScalarBlockLayout(true);
3651 }
3652}