blob: c342da31d491fe1390faa9c2eabb55c759b6810d [file] [log] [blame]
/* Copyright (c) 2015-2020 The Khronos Group Inc.
 * Copyright (c) 2015-2020 Valve Corporation
 * Copyright (c) 2015-2020 LunarG, Inc.
 * Copyright (C) 2015-2020 Google Inc.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 * Author: Chris Forbes <chrisf@ijw.co.nz>
 * Author: Dave Houlton <daveh@lunarg.com>
 */
21
Petr Kraus25810d02019-08-27 17:41:15 +020022#include "shader_validation.h"
23
Chris Forbes47567b72017-06-09 12:09:45 -070024#include <cassert>
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +020025#include <chrono>
Petr Kraus25810d02019-08-27 17:41:15 +020026#include <cinttypes>
Jeff Bolzf234bf82019-11-04 14:07:15 -060027#include <cmath>
Petr Kraus25810d02019-08-27 17:41:15 +020028#include <map>
Chris Forbes47567b72017-06-09 12:09:45 -070029#include <sstream>
Petr Kraus25810d02019-08-27 17:41:15 +020030#include <string>
31#include <unordered_map>
32#include <vector>
33
Mark Lobodzinski102687e2020-04-28 11:03:28 -060034#include <spirv/unified1/spirv.hpp>
Chris Forbes47567b72017-06-09 12:09:45 -070035#include "vk_loader_platform.h"
36#include "vk_enum_string_helper.h"
Chris Forbes47567b72017-06-09 12:09:45 -070037#include "vk_layer_data.h"
38#include "vk_layer_extension_utils.h"
39#include "vk_layer_utils.h"
Mark Lobodzinskib56bbb92019-02-18 11:49:59 -070040#include "chassis.h"
Chris Forbes47567b72017-06-09 12:09:45 -070041#include "core_validation.h"
Petr Kraus25810d02019-08-27 17:41:15 +020042
Chris Forbes4ae55b32017-06-09 14:42:56 -070043#include "spirv-tools/libspirv.h"
Chris Forbes9a61e082017-07-24 15:35:29 -070044#include "xxhash.h"
Chris Forbes47567b72017-06-09 12:09:45 -070045
Chris Forbes8a6d8cb2019-02-14 14:33:08 -080046void decoration_set::add(uint32_t decoration, uint32_t value) {
47 switch (decoration) {
48 case spv::DecorationLocation:
49 flags |= location_bit;
50 location = value;
51 break;
52 case spv::DecorationPatch:
53 flags |= patch_bit;
54 break;
55 case spv::DecorationRelaxedPrecision:
56 flags |= relaxed_precision_bit;
57 break;
58 case spv::DecorationBlock:
59 flags |= block_bit;
60 break;
61 case spv::DecorationBufferBlock:
62 flags |= buffer_block_bit;
63 break;
64 case spv::DecorationComponent:
65 flags |= component_bit;
66 component = value;
67 break;
68 case spv::DecorationInputAttachmentIndex:
69 flags |= input_attachment_index_bit;
70 input_attachment_index = value;
71 break;
72 case spv::DecorationDescriptorSet:
73 flags |= descriptor_set_bit;
74 descriptor_set = value;
75 break;
76 case spv::DecorationBinding:
77 flags |= binding_bit;
78 binding = value;
79 break;
80 case spv::DecorationNonWritable:
81 flags |= nonwritable_bit;
82 break;
83 case spv::DecorationBuiltIn:
84 flags |= builtin_bit;
85 builtin = value;
86 break;
87 }
88}
89
// Coarse numeric class of a format or shader type. The enumerators are distinct bits so that a format
// with more than one class can be described by OR-ing them together.
enum FORMAT_TYPE {
    FORMAT_TYPE_FLOAT = 1 << 0,  // UNORM, SNORM, FLOAT, USCALED, SSCALED, SRGB -- anything we consider float in the shader
    FORMAT_TYPE_SINT = 1 << 1,
    FORMAT_TYPE_UINT = 1 << 2,
};

// Key type of the interface maps built in this file: a (location, component) pair.
using location_t = std::pair<unsigned, unsigned>;
97
Chris Forbes47567b72017-06-09 12:09:45 -070098static shader_stage_attributes shader_stage_attribs[] = {
Ari Suonpaa696b3432019-03-11 14:02:57 +020099 {"vertex shader", false, false, VK_SHADER_STAGE_VERTEX_BIT},
100 {"tessellation control shader", true, true, VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT},
101 {"tessellation evaluation shader", true, false, VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT},
102 {"geometry shader", true, false, VK_SHADER_STAGE_GEOMETRY_BIT},
103 {"fragment shader", false, false, VK_SHADER_STAGE_FRAGMENT_BIT},
Chris Forbes47567b72017-06-09 12:09:45 -0700104};
105
John Zulauf14c355b2019-06-27 16:09:37 -0600106unsigned ExecutionModelToShaderStageFlagBits(unsigned mode);
107
Chris Forbes47567b72017-06-09 12:09:45 -0700108// SPIRV utility functions
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600109void SHADER_MODULE_STATE::BuildDefIndex() {
Chris Forbes47567b72017-06-09 12:09:45 -0700110 for (auto insn : *this) {
111 switch (insn.opcode()) {
112 // Types
113 case spv::OpTypeVoid:
114 case spv::OpTypeBool:
115 case spv::OpTypeInt:
116 case spv::OpTypeFloat:
117 case spv::OpTypeVector:
118 case spv::OpTypeMatrix:
119 case spv::OpTypeImage:
120 case spv::OpTypeSampler:
121 case spv::OpTypeSampledImage:
122 case spv::OpTypeArray:
123 case spv::OpTypeRuntimeArray:
124 case spv::OpTypeStruct:
125 case spv::OpTypeOpaque:
126 case spv::OpTypePointer:
127 case spv::OpTypeFunction:
128 case spv::OpTypeEvent:
129 case spv::OpTypeDeviceEvent:
130 case spv::OpTypeReserveId:
131 case spv::OpTypeQueue:
132 case spv::OpTypePipe:
Shannon McPherson0fa28232018-11-01 11:59:02 -0600133 case spv::OpTypeAccelerationStructureNV:
Jeff Bolze4356752019-03-07 11:23:46 -0600134 case spv::OpTypeCooperativeMatrixNV:
Chris Forbes47567b72017-06-09 12:09:45 -0700135 def_index[insn.word(1)] = insn.offset();
136 break;
137
138 // Fixed constants
139 case spv::OpConstantTrue:
140 case spv::OpConstantFalse:
141 case spv::OpConstant:
142 case spv::OpConstantComposite:
143 case spv::OpConstantSampler:
144 case spv::OpConstantNull:
145 def_index[insn.word(2)] = insn.offset();
146 break;
147
148 // Specialization constants
149 case spv::OpSpecConstantTrue:
150 case spv::OpSpecConstantFalse:
151 case spv::OpSpecConstant:
152 case spv::OpSpecConstantComposite:
153 case spv::OpSpecConstantOp:
154 def_index[insn.word(2)] = insn.offset();
155 break;
156
157 // Variables
158 case spv::OpVariable:
159 def_index[insn.word(2)] = insn.offset();
160 break;
161
162 // Functions
163 case spv::OpFunction:
164 def_index[insn.word(2)] = insn.offset();
165 break;
166
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800167 // Decorations
168 case spv::OpDecorate: {
169 auto targetId = insn.word(1);
170 decorations[targetId].add(insn.word(2), insn.len() > 3u ? insn.word(3) : 0u);
171 } break;
172 case spv::OpGroupDecorate: {
173 auto const &src = decorations[insn.word(1)];
174 for (auto i = 2u; i < insn.len(); i++) decorations[insn.word(i)].merge(src);
175 } break;
176
John Zulauf14c355b2019-06-27 16:09:37 -0600177 // Entry points ... add to the entrypoint table
178 case spv::OpEntryPoint: {
179 // Entry points do not have an id (the id is the function id) and thus need their own table
180 auto entrypoint_name = (char const *)&insn.word(3);
181 auto execution_model = insn.word(1);
182 auto entrypoint_stage = ExecutionModelToShaderStageFlagBits(execution_model);
183 entry_points.emplace(entrypoint_name, EntryPoint{insn.offset(), entrypoint_stage});
184 break;
185 }
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800186
Chris Forbes47567b72017-06-09 12:09:45 -0700187 default:
188 // We don't care about any other defs for now.
189 break;
190 }
191 }
192}
193
Jeff Bolz105d6492018-09-29 15:46:44 -0500194unsigned ExecutionModelToShaderStageFlagBits(unsigned mode) {
195 switch (mode) {
196 case spv::ExecutionModelVertex:
197 return VK_SHADER_STAGE_VERTEX_BIT;
198 case spv::ExecutionModelTessellationControl:
199 return VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT;
200 case spv::ExecutionModelTessellationEvaluation:
201 return VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT;
202 case spv::ExecutionModelGeometry:
203 return VK_SHADER_STAGE_GEOMETRY_BIT;
204 case spv::ExecutionModelFragment:
205 return VK_SHADER_STAGE_FRAGMENT_BIT;
206 case spv::ExecutionModelGLCompute:
207 return VK_SHADER_STAGE_COMPUTE_BIT;
Shannon McPherson0fa28232018-11-01 11:59:02 -0600208 case spv::ExecutionModelRayGenerationNV:
Eric Werness30127fd2018-10-31 21:01:03 -0700209 return VK_SHADER_STAGE_RAYGEN_BIT_NV;
Shannon McPherson0fa28232018-11-01 11:59:02 -0600210 case spv::ExecutionModelAnyHitNV:
Eric Werness30127fd2018-10-31 21:01:03 -0700211 return VK_SHADER_STAGE_ANY_HIT_BIT_NV;
Shannon McPherson0fa28232018-11-01 11:59:02 -0600212 case spv::ExecutionModelClosestHitNV:
Eric Werness30127fd2018-10-31 21:01:03 -0700213 return VK_SHADER_STAGE_CLOSEST_HIT_BIT_NV;
Shannon McPherson0fa28232018-11-01 11:59:02 -0600214 case spv::ExecutionModelMissNV:
Eric Werness30127fd2018-10-31 21:01:03 -0700215 return VK_SHADER_STAGE_MISS_BIT_NV;
Shannon McPherson0fa28232018-11-01 11:59:02 -0600216 case spv::ExecutionModelIntersectionNV:
Eric Werness30127fd2018-10-31 21:01:03 -0700217 return VK_SHADER_STAGE_INTERSECTION_BIT_NV;
Shannon McPherson0fa28232018-11-01 11:59:02 -0600218 case spv::ExecutionModelCallableNV:
Eric Werness30127fd2018-10-31 21:01:03 -0700219 return VK_SHADER_STAGE_CALLABLE_BIT_NV;
Jeff Bolz105d6492018-09-29 15:46:44 -0500220 case spv::ExecutionModelTaskNV:
221 return VK_SHADER_STAGE_TASK_BIT_NV;
222 case spv::ExecutionModelMeshNV:
223 return VK_SHADER_STAGE_MESH_BIT_NV;
224 default:
225 return 0;
226 }
227}
228
locke-lunargd9a069d2019-09-17 01:50:19 -0600229spirv_inst_iter FindEntrypoint(SHADER_MODULE_STATE const *src, char const *name, VkShaderStageFlagBits stageBits) {
John Zulauf14c355b2019-06-27 16:09:37 -0600230 auto range = src->entry_points.equal_range(name);
231 for (auto it = range.first; it != range.second; ++it) {
232 if (it->second.stage == stageBits) {
233 return src->at(it->second.offset);
Chris Forbes47567b72017-06-09 12:09:45 -0700234 }
235 }
Chris Forbes47567b72017-06-09 12:09:45 -0700236 return src->end();
237}
238
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600239static char const *StorageClassName(unsigned sc) {
Chris Forbes47567b72017-06-09 12:09:45 -0700240 switch (sc) {
241 case spv::StorageClassInput:
242 return "input";
243 case spv::StorageClassOutput:
244 return "output";
245 case spv::StorageClassUniformConstant:
246 return "const uniform";
247 case spv::StorageClassUniform:
248 return "uniform";
249 case spv::StorageClassWorkgroup:
250 return "workgroup local";
251 case spv::StorageClassCrossWorkgroup:
252 return "workgroup global";
253 case spv::StorageClassPrivate:
254 return "private global";
255 case spv::StorageClassFunction:
256 return "function";
257 case spv::StorageClassGeneric:
258 return "generic";
259 case spv::StorageClassAtomicCounter:
260 return "atomic counter";
261 case spv::StorageClassImage:
262 return "image";
263 case spv::StorageClassPushConstant:
264 return "push constant";
Chris Forbes9f89d752018-03-07 12:57:48 -0800265 case spv::StorageClassStorageBuffer:
266 return "storage buffer";
Chris Forbes47567b72017-06-09 12:09:45 -0700267 default:
268 return "unknown";
269 }
270}
271
272// Get the value of an integral constant
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600273unsigned GetConstantValue(SHADER_MODULE_STATE const *src, unsigned id) {
Chris Forbes47567b72017-06-09 12:09:45 -0700274 auto value = src->get_def(id);
275 assert(value != src->end());
276
277 if (value.opcode() != spv::OpConstant) {
278 // TODO: Either ensure that the specialization transform is already performed on a module we're
279 // considering here, OR -- specialize on the fly now.
280 return 1;
281 }
282
283 return value.word(3);
284}
285
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600286static void DescribeTypeInner(std::ostringstream &ss, SHADER_MODULE_STATE const *src, unsigned type) {
Chris Forbes47567b72017-06-09 12:09:45 -0700287 auto insn = src->get_def(type);
288 assert(insn != src->end());
289
290 switch (insn.opcode()) {
291 case spv::OpTypeBool:
292 ss << "bool";
293 break;
294 case spv::OpTypeInt:
295 ss << (insn.word(3) ? 's' : 'u') << "int" << insn.word(2);
296 break;
297 case spv::OpTypeFloat:
298 ss << "float" << insn.word(2);
299 break;
300 case spv::OpTypeVector:
301 ss << "vec" << insn.word(3) << " of ";
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600302 DescribeTypeInner(ss, src, insn.word(2));
Chris Forbes47567b72017-06-09 12:09:45 -0700303 break;
304 case spv::OpTypeMatrix:
305 ss << "mat" << insn.word(3) << " of ";
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600306 DescribeTypeInner(ss, src, insn.word(2));
Chris Forbes47567b72017-06-09 12:09:45 -0700307 break;
308 case spv::OpTypeArray:
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600309 ss << "arr[" << GetConstantValue(src, insn.word(3)) << "] of ";
310 DescribeTypeInner(ss, src, insn.word(2));
Chris Forbes47567b72017-06-09 12:09:45 -0700311 break;
Chris Forbes062f1222018-08-21 15:34:15 -0700312 case spv::OpTypeRuntimeArray:
313 ss << "runtime arr[] of ";
314 DescribeTypeInner(ss, src, insn.word(2));
315 break;
Chris Forbes47567b72017-06-09 12:09:45 -0700316 case spv::OpTypePointer:
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600317 ss << "ptr to " << StorageClassName(insn.word(2)) << " ";
318 DescribeTypeInner(ss, src, insn.word(3));
Chris Forbes47567b72017-06-09 12:09:45 -0700319 break;
320 case spv::OpTypeStruct: {
321 ss << "struct of (";
322 for (unsigned i = 2; i < insn.len(); i++) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600323 DescribeTypeInner(ss, src, insn.word(i));
Chris Forbes47567b72017-06-09 12:09:45 -0700324 if (i == insn.len() - 1) {
325 ss << ")";
326 } else {
327 ss << ", ";
328 }
329 }
330 break;
331 }
332 case spv::OpTypeSampler:
333 ss << "sampler";
334 break;
335 case spv::OpTypeSampledImage:
336 ss << "sampler+";
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600337 DescribeTypeInner(ss, src, insn.word(2));
Chris Forbes47567b72017-06-09 12:09:45 -0700338 break;
339 case spv::OpTypeImage:
340 ss << "image(dim=" << insn.word(3) << ", sampled=" << insn.word(7) << ")";
341 break;
Shannon McPherson0fa28232018-11-01 11:59:02 -0600342 case spv::OpTypeAccelerationStructureNV:
Jeff Bolz105d6492018-09-29 15:46:44 -0500343 ss << "accelerationStruture";
344 break;
Chris Forbes47567b72017-06-09 12:09:45 -0700345 default:
346 ss << "oddtype";
347 break;
348 }
349}
350
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600351static std::string DescribeType(SHADER_MODULE_STATE const *src, unsigned type) {
Chris Forbes47567b72017-06-09 12:09:45 -0700352 std::ostringstream ss;
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600353 DescribeTypeInner(ss, src, type);
Chris Forbes47567b72017-06-09 12:09:45 -0700354 return ss.str();
355}
356
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600357static bool IsNarrowNumericType(spirv_inst_iter type) {
Chris Forbes47567b72017-06-09 12:09:45 -0700358 if (type.opcode() != spv::OpTypeInt && type.opcode() != spv::OpTypeFloat) return false;
359 return type.word(2) < 64;
360}
361
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600362static bool TypesMatch(SHADER_MODULE_STATE const *a, SHADER_MODULE_STATE const *b, unsigned a_type, unsigned b_type, bool a_arrayed,
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600363 bool b_arrayed, bool relaxed) {
Chris Forbes47567b72017-06-09 12:09:45 -0700364 // Walk two type trees together, and complain about differences
365 auto a_insn = a->get_def(a_type);
366 auto b_insn = b->get_def(b_type);
367 assert(a_insn != a->end());
368 assert(b_insn != b->end());
369
Chris Forbes062f1222018-08-21 15:34:15 -0700370 // Ignore runtime-sized arrays-- they cannot appear in these interfaces.
371
Chris Forbes47567b72017-06-09 12:09:45 -0700372 if (a_arrayed && a_insn.opcode() == spv::OpTypeArray) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600373 return TypesMatch(a, b, a_insn.word(2), b_type, false, b_arrayed, relaxed);
Chris Forbes47567b72017-06-09 12:09:45 -0700374 }
375
376 if (b_arrayed && b_insn.opcode() == spv::OpTypeArray) {
377 // We probably just found the extra level of arrayness in b_type: compare the type inside it to a_type
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600378 return TypesMatch(a, b, a_type, b_insn.word(2), a_arrayed, false, relaxed);
Chris Forbes47567b72017-06-09 12:09:45 -0700379 }
380
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600381 if (a_insn.opcode() == spv::OpTypeVector && relaxed && IsNarrowNumericType(b_insn)) {
382 return TypesMatch(a, b, a_insn.word(2), b_type, a_arrayed, b_arrayed, false);
Chris Forbes47567b72017-06-09 12:09:45 -0700383 }
384
385 if (a_insn.opcode() != b_insn.opcode()) {
386 return false;
387 }
388
389 if (a_insn.opcode() == spv::OpTypePointer) {
390 // Match on pointee type. storage class is expected to differ
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600391 return TypesMatch(a, b, a_insn.word(3), b_insn.word(3), a_arrayed, b_arrayed, relaxed);
Chris Forbes47567b72017-06-09 12:09:45 -0700392 }
393
394 if (a_arrayed || b_arrayed) {
395 // If we havent resolved array-of-verts by here, we're not going to.
396 return false;
397 }
398
399 switch (a_insn.opcode()) {
400 case spv::OpTypeBool:
401 return true;
402 case spv::OpTypeInt:
403 // Match on width, signedness
404 return a_insn.word(2) == b_insn.word(2) && a_insn.word(3) == b_insn.word(3);
405 case spv::OpTypeFloat:
406 // Match on width
407 return a_insn.word(2) == b_insn.word(2);
408 case spv::OpTypeVector:
409 // Match on element type, count.
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600410 if (!TypesMatch(a, b, a_insn.word(2), b_insn.word(2), a_arrayed, b_arrayed, false)) return false;
411 if (relaxed && IsNarrowNumericType(a->get_def(a_insn.word(2)))) {
Chris Forbes47567b72017-06-09 12:09:45 -0700412 return a_insn.word(3) >= b_insn.word(3);
413 } else {
414 return a_insn.word(3) == b_insn.word(3);
415 }
416 case spv::OpTypeMatrix:
417 // Match on element type, count.
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600418 return TypesMatch(a, b, a_insn.word(2), b_insn.word(2), a_arrayed, b_arrayed, false) &&
Dave Houltona9df0ce2018-02-07 10:51:23 -0700419 a_insn.word(3) == b_insn.word(3);
Chris Forbes47567b72017-06-09 12:09:45 -0700420 case spv::OpTypeArray:
421 // Match on element type, count. these all have the same layout. we don't get here if b_arrayed. This differs from
422 // vector & matrix types in that the array size is the id of a constant instruction, * not a literal within OpTypeArray
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600423 return TypesMatch(a, b, a_insn.word(2), b_insn.word(2), a_arrayed, b_arrayed, false) &&
424 GetConstantValue(a, a_insn.word(3)) == GetConstantValue(b, b_insn.word(3));
Chris Forbes47567b72017-06-09 12:09:45 -0700425 case spv::OpTypeStruct:
426 // Match on all element types
Dave Houltona9df0ce2018-02-07 10:51:23 -0700427 {
428 if (a_insn.len() != b_insn.len()) {
429 return false; // Structs cannot match if member counts differ
Chris Forbes47567b72017-06-09 12:09:45 -0700430 }
Chris Forbes47567b72017-06-09 12:09:45 -0700431
Dave Houltona9df0ce2018-02-07 10:51:23 -0700432 for (unsigned i = 2; i < a_insn.len(); i++) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600433 if (!TypesMatch(a, b, a_insn.word(i), b_insn.word(i), a_arrayed, b_arrayed, false)) {
Dave Houltona9df0ce2018-02-07 10:51:23 -0700434 return false;
435 }
436 }
437
438 return true;
439 }
Chris Forbes47567b72017-06-09 12:09:45 -0700440 default:
441 // Remaining types are CLisms, or may not appear in the interfaces we are interested in. Just claim no match.
442 return false;
443 }
444}
445
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600446static unsigned GetLocationsConsumedByType(SHADER_MODULE_STATE const *src, unsigned type, bool strip_array_level) {
Chris Forbes47567b72017-06-09 12:09:45 -0700447 auto insn = src->get_def(type);
448 assert(insn != src->end());
449
450 switch (insn.opcode()) {
451 case spv::OpTypePointer:
452 // See through the ptr -- this is only ever at the toplevel for graphics shaders we're never actually passing
453 // pointers around.
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600454 return GetLocationsConsumedByType(src, insn.word(3), strip_array_level);
Chris Forbes47567b72017-06-09 12:09:45 -0700455 case spv::OpTypeArray:
456 if (strip_array_level) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600457 return GetLocationsConsumedByType(src, insn.word(2), false);
Chris Forbes47567b72017-06-09 12:09:45 -0700458 } else {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600459 return GetConstantValue(src, insn.word(3)) * GetLocationsConsumedByType(src, insn.word(2), false);
Chris Forbes47567b72017-06-09 12:09:45 -0700460 }
461 case spv::OpTypeMatrix:
462 // Num locations is the dimension * element size
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600463 return insn.word(3) * GetLocationsConsumedByType(src, insn.word(2), false);
Chris Forbes47567b72017-06-09 12:09:45 -0700464 case spv::OpTypeVector: {
465 auto scalar_type = src->get_def(insn.word(2));
466 auto bit_width =
467 (scalar_type.opcode() == spv::OpTypeInt || scalar_type.opcode() == spv::OpTypeFloat) ? scalar_type.word(2) : 32;
468
469 // Locations are 128-bit wide; 3- and 4-component vectors of 64 bit types require two.
470 return (bit_width * insn.word(3) + 127) / 128;
471 }
472 default:
473 // Everything else is just 1.
474 return 1;
475
476 // TODO: extend to handle 64bit scalar types, whose vectors may need multiple locations.
477 }
478}
479
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600480static unsigned GetComponentsConsumedByType(SHADER_MODULE_STATE const *src, unsigned type, bool strip_array_level) {
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +0200481 auto insn = src->get_def(type);
482 assert(insn != src->end());
483
484 switch (insn.opcode()) {
485 case spv::OpTypePointer:
486 // See through the ptr -- this is only ever at the toplevel for graphics shaders we're never actually passing
487 // pointers around.
488 return GetComponentsConsumedByType(src, insn.word(3), strip_array_level);
489 case spv::OpTypeStruct: {
490 uint32_t sum = 0;
491 for (uint32_t i = 2; i < insn.len(); i++) { // i=2 to skip word(0) and word(1)=ID of struct
492 sum += GetComponentsConsumedByType(src, insn.word(i), false);
493 }
494 return sum;
495 }
Jeff Bolze9ee3d82019-05-29 13:45:13 -0500496 case spv::OpTypeArray:
497 if (strip_array_level) {
498 return GetComponentsConsumedByType(src, insn.word(2), false);
499 } else {
500 return GetConstantValue(src, insn.word(3)) * GetComponentsConsumedByType(src, insn.word(2), false);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +0200501 }
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +0200502 case spv::OpTypeMatrix:
503 // Num locations is the dimension * element size
504 return insn.word(3) * GetComponentsConsumedByType(src, insn.word(2), false);
505 case spv::OpTypeVector: {
506 auto scalar_type = src->get_def(insn.word(2));
507 auto bit_width =
508 (scalar_type.opcode() == spv::OpTypeInt || scalar_type.opcode() == spv::OpTypeFloat) ? scalar_type.word(2) : 32;
509 // One component is 32-bit
510 return (bit_width * insn.word(3) + 31) / 32;
511 }
512 case spv::OpTypeFloat: {
513 auto bit_width = insn.word(2);
514 return (bit_width + 31) / 32;
515 }
516 case spv::OpTypeInt: {
517 auto bit_width = insn.word(2);
518 return (bit_width + 31) / 32;
519 }
520 case spv::OpConstant:
521 return GetComponentsConsumedByType(src, insn.word(1), false);
522 default:
523 return 0;
524 }
525}
526
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600527static unsigned GetLocationsConsumedByFormat(VkFormat format) {
Chris Forbes47567b72017-06-09 12:09:45 -0700528 switch (format) {
529 case VK_FORMAT_R64G64B64A64_SFLOAT:
530 case VK_FORMAT_R64G64B64A64_SINT:
531 case VK_FORMAT_R64G64B64A64_UINT:
532 case VK_FORMAT_R64G64B64_SFLOAT:
533 case VK_FORMAT_R64G64B64_SINT:
534 case VK_FORMAT_R64G64B64_UINT:
535 return 2;
536 default:
537 return 1;
538 }
539}
540
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600541static unsigned GetFormatType(VkFormat fmt) {
Dave Houltona9df0ce2018-02-07 10:51:23 -0700542 if (FormatIsSInt(fmt)) return FORMAT_TYPE_SINT;
543 if (FormatIsUInt(fmt)) return FORMAT_TYPE_UINT;
544 if (FormatIsDepthAndStencil(fmt)) return FORMAT_TYPE_FLOAT | FORMAT_TYPE_UINT;
545 if (fmt == VK_FORMAT_UNDEFINED) return 0;
Chris Forbes47567b72017-06-09 12:09:45 -0700546 // everything else -- UNORM/SNORM/FLOAT/USCALED/SSCALED is all float in the shader.
547 return FORMAT_TYPE_FLOAT;
548}
549
550// characterizes a SPIR-V type appearing in an interface to a FF stage, for comparison to a VkFormat's characterization above.
Chris Forbes062f1222018-08-21 15:34:15 -0700551// also used for input attachments, as we statically know their format.
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600552static unsigned GetFundamentalType(SHADER_MODULE_STATE const *src, unsigned type) {
Chris Forbes47567b72017-06-09 12:09:45 -0700553 auto insn = src->get_def(type);
554 assert(insn != src->end());
555
556 switch (insn.opcode()) {
557 case spv::OpTypeInt:
558 return insn.word(3) ? FORMAT_TYPE_SINT : FORMAT_TYPE_UINT;
559 case spv::OpTypeFloat:
560 return FORMAT_TYPE_FLOAT;
561 case spv::OpTypeVector:
Chris Forbes47567b72017-06-09 12:09:45 -0700562 case spv::OpTypeMatrix:
Chris Forbes47567b72017-06-09 12:09:45 -0700563 case spv::OpTypeArray:
Chris Forbes062f1222018-08-21 15:34:15 -0700564 case spv::OpTypeRuntimeArray:
565 case spv::OpTypeImage:
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600566 return GetFundamentalType(src, insn.word(2));
Chris Forbes47567b72017-06-09 12:09:45 -0700567 case spv::OpTypePointer:
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600568 return GetFundamentalType(src, insn.word(3));
Chris Forbes47567b72017-06-09 12:09:45 -0700569
570 default:
571 return 0;
572 }
573}
574
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600575static uint32_t GetShaderStageId(VkShaderStageFlagBits stage) {
Chris Forbes47567b72017-06-09 12:09:45 -0700576 uint32_t bit_pos = uint32_t(u_ffs(stage));
577 return bit_pos - 1;
578}
579
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600580static spirv_inst_iter GetStructType(SHADER_MODULE_STATE const *src, spirv_inst_iter def, bool is_array_of_verts) {
Chris Forbes47567b72017-06-09 12:09:45 -0700581 while (true) {
582 if (def.opcode() == spv::OpTypePointer) {
583 def = src->get_def(def.word(3));
584 } else if (def.opcode() == spv::OpTypeArray && is_array_of_verts) {
585 def = src->get_def(def.word(2));
586 is_array_of_verts = false;
587 } else if (def.opcode() == spv::OpTypeStruct) {
588 return def;
589 } else {
590 return src->end();
591 }
592 }
593}
594
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600595static bool CollectInterfaceBlockMembers(SHADER_MODULE_STATE const *src, std::map<location_t, interface_var> *out,
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800596 bool is_array_of_verts, uint32_t id, uint32_t type_id, bool is_patch,
597 int /*first_location*/) {
Chris Forbes47567b72017-06-09 12:09:45 -0700598 // Walk down the type_id presented, trying to determine whether it's actually an interface block.
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600599 auto type = GetStructType(src, src->get_def(type_id), is_array_of_verts && !is_patch);
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800600 if (type == src->end() || !(src->get_decorations(type.word(1)).flags & decoration_set::block_bit)) {
Chris Forbes47567b72017-06-09 12:09:45 -0700601 // This isn't an interface block.
Chris Forbesa313d772017-06-13 13:59:41 -0700602 return false;
Chris Forbes47567b72017-06-09 12:09:45 -0700603 }
604
605 std::unordered_map<unsigned, unsigned> member_components;
606 std::unordered_map<unsigned, unsigned> member_relaxed_precision;
Chris Forbesa313d772017-06-13 13:59:41 -0700607 std::unordered_map<unsigned, unsigned> member_patch;
Chris Forbes47567b72017-06-09 12:09:45 -0700608
609 // Walk all the OpMemberDecorate for type's result id -- first pass, collect components.
610 for (auto insn : *src) {
611 if (insn.opcode() == spv::OpMemberDecorate && insn.word(1) == type.word(1)) {
612 unsigned member_index = insn.word(2);
613
614 if (insn.word(3) == spv::DecorationComponent) {
615 unsigned component = insn.word(4);
616 member_components[member_index] = component;
617 }
618
619 if (insn.word(3) == spv::DecorationRelaxedPrecision) {
620 member_relaxed_precision[member_index] = 1;
621 }
Chris Forbesa313d772017-06-13 13:59:41 -0700622
623 if (insn.word(3) == spv::DecorationPatch) {
624 member_patch[member_index] = 1;
625 }
Chris Forbes47567b72017-06-09 12:09:45 -0700626 }
627 }
628
Chris Forbesa313d772017-06-13 13:59:41 -0700629 // TODO: correctly handle location assignment from outside
630
Chris Forbes47567b72017-06-09 12:09:45 -0700631 // Second pass -- produce the output, from Location decorations
632 for (auto insn : *src) {
633 if (insn.opcode() == spv::OpMemberDecorate && insn.word(1) == type.word(1)) {
634 unsigned member_index = insn.word(2);
635 unsigned member_type_id = type.word(2 + member_index);
636
637 if (insn.word(3) == spv::DecorationLocation) {
638 unsigned location = insn.word(4);
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600639 unsigned num_locations = GetLocationsConsumedByType(src, member_type_id, false);
Chris Forbes47567b72017-06-09 12:09:45 -0700640 auto component_it = member_components.find(member_index);
641 unsigned component = component_it == member_components.end() ? 0 : component_it->second;
642 bool is_relaxed_precision = member_relaxed_precision.find(member_index) != member_relaxed_precision.end();
Dave Houltona9df0ce2018-02-07 10:51:23 -0700643 bool member_is_patch = is_patch || member_patch.count(member_index) > 0;
Chris Forbes47567b72017-06-09 12:09:45 -0700644
645 for (unsigned int offset = 0; offset < num_locations; offset++) {
646 interface_var v = {};
647 v.id = id;
648 // TODO: member index in interface_var too?
649 v.type_id = member_type_id;
650 v.offset = offset;
Chris Forbesa313d772017-06-13 13:59:41 -0700651 v.is_patch = member_is_patch;
Chris Forbes47567b72017-06-09 12:09:45 -0700652 v.is_block_member = true;
653 v.is_relaxed_precision = is_relaxed_precision;
654 (*out)[std::make_pair(location + offset, component)] = v;
655 }
656 }
657 }
658 }
Chris Forbesa313d772017-06-13 13:59:41 -0700659
660 return true;
Chris Forbes47567b72017-06-09 12:09:45 -0700661}
662
Ari Suonpaa696b3432019-03-11 14:02:57 +0200663static std::vector<uint32_t> FindEntrypointInterfaces(spirv_inst_iter entrypoint) {
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800664 assert(entrypoint.opcode() == spv::OpEntryPoint);
665
Ari Suonpaa696b3432019-03-11 14:02:57 +0200666 std::vector<uint32_t> interfaces;
667 // Find the end of the entrypoint's name string. additional zero bytes follow the actual null terminator, to fill out the
668 // rest of the word - so we only need to look at the last byte in the word to determine which word contains the terminator.
669 uint32_t word = 3;
670 while (entrypoint.word(word) & 0xff000000u) {
671 ++word;
672 }
673 ++word;
674
675 for (; word < entrypoint.len(); word++) interfaces.push_back(entrypoint.word(word));
676
677 return interfaces;
678}
679
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600680static std::map<location_t, interface_var> CollectInterfaceByLocation(SHADER_MODULE_STATE const *src, spirv_inst_iter entrypoint,
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600681 spv::StorageClass sinterface, bool is_array_of_verts) {
Chris Forbes47567b72017-06-09 12:09:45 -0700682 // TODO: handle index=1 dual source outputs from FS -- two vars will have the same location, and we DON'T want to clobber.
683
Chris Forbes47567b72017-06-09 12:09:45 -0700684 std::map<location_t, interface_var> out;
685
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800686 for (uint32_t iid : FindEntrypointInterfaces(entrypoint)) {
687 auto insn = src->get_def(iid);
Chris Forbes47567b72017-06-09 12:09:45 -0700688 assert(insn != src->end());
689 assert(insn.opcode() == spv::OpVariable);
690
691 if (insn.word(3) == static_cast<uint32_t>(sinterface)) {
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800692 auto d = src->get_decorations(iid);
Chris Forbes47567b72017-06-09 12:09:45 -0700693 unsigned id = insn.word(2);
694 unsigned type = insn.word(1);
695
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800696 int location = d.location;
697 int builtin = d.builtin;
698 unsigned component = d.component;
699 bool is_patch = (d.flags & decoration_set::patch_bit) != 0;
700 bool is_relaxed_precision = (d.flags & decoration_set::relaxed_precision_bit) != 0;
Chris Forbes47567b72017-06-09 12:09:45 -0700701
Dave Houltona9df0ce2018-02-07 10:51:23 -0700702 if (builtin != -1)
703 continue;
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800704 else if (!CollectInterfaceBlockMembers(src, &out, is_array_of_verts, id, type, is_patch, location)) {
Chris Forbes47567b72017-06-09 12:09:45 -0700705 // A user-defined interface variable, with a location. Where a variable occupied multiple locations, emit
706 // one result for each.
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600707 unsigned num_locations = GetLocationsConsumedByType(src, type, is_array_of_verts && !is_patch);
Chris Forbes47567b72017-06-09 12:09:45 -0700708 for (unsigned int offset = 0; offset < num_locations; offset++) {
709 interface_var v = {};
710 v.id = id;
711 v.type_id = type;
712 v.offset = offset;
713 v.is_patch = is_patch;
714 v.is_relaxed_precision = is_relaxed_precision;
715 out[std::make_pair(location + offset, component)] = v;
716 }
Chris Forbes47567b72017-06-09 12:09:45 -0700717 }
718 }
719 }
720
721 return out;
722}
723
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600724static std::vector<uint32_t> CollectBuiltinBlockMembers(SHADER_MODULE_STATE const *src, spirv_inst_iter entrypoint,
Ari Suonpaa696b3432019-03-11 14:02:57 +0200725 uint32_t storageClass) {
726 std::vector<uint32_t> variables;
727 std::vector<uint32_t> builtinStructMembers;
728 std::vector<uint32_t> builtinDecorations;
729
730 for (auto insn : *src) {
731 switch (insn.opcode()) {
732 // Find all built-in member decorations
733 case spv::OpMemberDecorate:
734 if (insn.word(3) == spv::DecorationBuiltIn) {
735 builtinStructMembers.push_back(insn.word(1));
736 }
737 break;
738 // Find all built-in decorations
739 case spv::OpDecorate:
740 switch (insn.word(2)) {
741 case spv::DecorationBlock: {
742 uint32_t blockID = insn.word(1);
743 for (auto builtInBlockID : builtinStructMembers) {
744 // Check if one of the members of the block are built-in -> the block is built-in
745 if (blockID == builtInBlockID) {
746 builtinDecorations.push_back(blockID);
747 break;
748 }
749 }
750 break;
751 }
752 case spv::DecorationBuiltIn:
753 builtinDecorations.push_back(insn.word(1));
754 break;
755 default:
756 break;
757 }
758 break;
759 default:
760 break;
761 }
762 }
763
764 // Find all interface variables belonging to the entrypoint and matching the storage class
765 for (uint32_t id : FindEntrypointInterfaces(entrypoint)) {
766 auto def = src->get_def(id);
767 assert(def != src->end());
768 assert(def.opcode() == spv::OpVariable);
769
770 if (def.word(3) == storageClass) variables.push_back(def.word(1));
771 }
772
773 // Find all members belonging to the builtin block selected
774 std::vector<uint32_t> builtinBlockMembers;
775 for (auto &var : variables) {
776 auto def = src->get_def(src->get_def(var).word(3));
777
778 // It could be an array of IO blocks. The element type should be the struct defining the block contents
779 if (def.opcode() == spv::OpTypeArray) def = src->get_def(def.word(2));
780
781 // Now find all members belonging to the struct defining the IO block
782 if (def.opcode() == spv::OpTypeStruct) {
783 for (auto builtInID : builtinDecorations) {
784 if (builtInID == def.word(1)) {
785 for (int i = 2; i < (int)def.len(); i++)
786 builtinBlockMembers.push_back(spv::BuiltInMax); // Start with undefined builtin for each struct member.
787 // These shouldn't be left after replacing.
788 for (auto insn : *src) {
789 if (insn.opcode() == spv::OpMemberDecorate && insn.word(1) == builtInID &&
790 insn.word(3) == spv::DecorationBuiltIn) {
791 auto structIndex = insn.word(2);
792 assert(structIndex < builtinBlockMembers.size());
793 builtinBlockMembers[structIndex] = insn.word(4);
794 }
795 }
796 }
797 }
798 }
799 }
800
801 return builtinBlockMembers;
802}
803
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600804static std::vector<std::pair<uint32_t, interface_var>> CollectInterfaceByInputAttachmentIndex(
Mark Lobodzinski3c59d972019-04-25 11:28:14 -0600805 SHADER_MODULE_STATE const *src, std::unordered_set<uint32_t> const &accessible_ids) {
Chris Forbes47567b72017-06-09 12:09:45 -0700806 std::vector<std::pair<uint32_t, interface_var>> out;
807
808 for (auto insn : *src) {
809 if (insn.opcode() == spv::OpDecorate) {
810 if (insn.word(2) == spv::DecorationInputAttachmentIndex) {
811 auto attachment_index = insn.word(3);
812 auto id = insn.word(1);
813
814 if (accessible_ids.count(id)) {
815 auto def = src->get_def(id);
816 assert(def != src->end());
817
818 if (def.opcode() == spv::OpVariable && insn.word(3) == spv::StorageClassUniformConstant) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -0600819 auto num_locations = GetLocationsConsumedByType(src, def.word(1), false);
Chris Forbes47567b72017-06-09 12:09:45 -0700820 for (unsigned int offset = 0; offset < num_locations; offset++) {
821 interface_var v = {};
822 v.id = id;
823 v.type_id = def.word(1);
824 v.offset = offset;
825 out.emplace_back(attachment_index + offset, v);
826 }
827 }
828 }
829 }
830 }
831 }
832
833 return out;
834}
835
locke-lunarg6f760f12020-06-05 16:19:37 -0600836static bool IsWritableDescriptorType(SHADER_MODULE_STATE const *module, const spirv_inst_iter &id_it, bool is_storage_buffer) {
837 uint32_t type_id = id_it.word(1);
Chris Forbes8af24522018-03-07 11:37:45 -0800838 auto type = module->get_def(type_id);
839
840 // Strip off any array or ptrs. Where we remove array levels, adjust the descriptor count for each dimension.
Chris Forbes062f1222018-08-21 15:34:15 -0700841 while (type.opcode() == spv::OpTypeArray || type.opcode() == spv::OpTypePointer || type.opcode() == spv::OpTypeRuntimeArray) {
842 if (type.opcode() == spv::OpTypeArray || type.opcode() == spv::OpTypeRuntimeArray) {
Chris Forbes8d31e5d2018-10-08 17:19:15 -0700843 type = module->get_def(type.word(2)); // Element type
Chris Forbes8af24522018-03-07 11:37:45 -0800844 } else {
Chris Forbes8d31e5d2018-10-08 17:19:15 -0700845 type = module->get_def(type.word(3)); // Pointee type
Chris Forbes8af24522018-03-07 11:37:45 -0800846 }
847 }
Chris Forbes8af24522018-03-07 11:37:45 -0800848 switch (type.opcode()) {
849 case spv::OpTypeImage: {
850 auto dim = type.word(3);
851 auto sampled = type.word(7);
locke-lunarg6f760f12020-06-05 16:19:37 -0600852 if (sampled == 2 && dim != spv::DimSubpassData) {
853 std::vector<unsigned> imagwrite_members;
854 std::unordered_map<unsigned, unsigned> load_members;
855 std::unordered_map<unsigned, unsigned> accesschain_members;
856 unsigned int id = id_it.word(2);
857
858 for (auto insn : *module) {
859 switch (insn.opcode()) {
860 case spv::OpImageWrite: {
861 imagwrite_members.emplace_back(insn.word(1)); // Load id
862 break;
863 }
864 case spv::OpLoad: {
865 // 2: Load id, 3: object id or AccessChain id
866 load_members.insert(std::make_pair(insn.word(2), insn.word(3)));
867 break;
868 }
869 case spv::OpAccessChain: {
870 // 2: AccessChain id, 3: object id
871 if (insn.word(3) == id) {
872 accesschain_members.insert(std::make_pair(insn.word(2), insn.word(3)));
873 }
874 break;
875 }
876 default:
877 break;
878 }
879 }
880 if (imagwrite_members.empty() || load_members.empty()) {
881 return false;
882 }
883 for (auto load_id : imagwrite_members) {
884 auto load_it = load_members.find(load_id);
885 if (load_it == load_members.end()) {
886 continue;
887 }
888 if (load_it->second == id) {
889 return true;
890 }
891 auto accesschain_it = accesschain_members.find(load_it->second);
892 if (accesschain_it == accesschain_members.end()) {
893 continue;
894 }
895 return true;
896 }
897 }
898 return false;
Chris Forbes8af24522018-03-07 11:37:45 -0800899 }
900
Chris Forbes8d31e5d2018-10-08 17:19:15 -0700901 case spv::OpTypeStruct: {
902 std::unordered_set<unsigned> nonwritable_members;
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800903 if (module->get_decorations(type.word(1)).flags & decoration_set::buffer_block_bit) is_storage_buffer = true;
Chris Forbes8af24522018-03-07 11:37:45 -0800904 for (auto insn : *module) {
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800905 if (insn.opcode() == spv::OpMemberDecorate && insn.word(1) == type.word(1) &&
906 insn.word(3) == spv::DecorationNonWritable) {
Chris Forbes8d31e5d2018-10-08 17:19:15 -0700907 nonwritable_members.insert(insn.word(2));
Chris Forbes8af24522018-03-07 11:37:45 -0800908 }
909 }
Chris Forbes8d31e5d2018-10-08 17:19:15 -0700910
911 // A buffer is writable if it's either flavor of storage buffer, and has any member not decorated
912 // as nonwritable.
locke-lunarg6f760f12020-06-05 16:19:37 -0600913 if (is_storage_buffer && nonwritable_members.size() != type.len() - 2) {
914 std::vector<unsigned> store_members;
915 std::unordered_map<unsigned, unsigned> accesschain_members;
916 unsigned int id = id_it.word(2);
917
918 for (auto insn : *module) {
919 switch (insn.opcode()) {
920 case spv::OpStore:
921 case spv::OpAtomicStore: {
922 if (insn.word(1) == id) {
923 return true;
924 }
925 store_members.emplace_back(insn.word(1)); // object id or AccessChain id
926 break;
927 }
928 case spv::OpAccessChain: {
929 // 2: AccessChain id, 3: object id
930 if (insn.word(3) == id) {
931 accesschain_members.insert(std::make_pair(insn.word(2), insn.word(3)));
932 }
933 break;
934 }
935 default:
936 break;
937 }
938 }
939 if (store_members.empty() || accesschain_members.empty()) {
940 return false;
941 }
942 for (auto oid : store_members) {
943 auto accesschain_it = accesschain_members.find(oid);
944 if (accesschain_it == accesschain_members.end()) {
945 continue;
946 }
947 return true;
948 }
949 }
950 return false;
Chris Forbes8d31e5d2018-10-08 17:19:15 -0700951 }
Chris Forbes8af24522018-03-07 11:37:45 -0800952 }
953
954 return false;
955}
956
locke-lunargd9a069d2019-09-17 01:50:19 -0600957std::vector<std::pair<descriptor_slot_t, interface_var>> CollectInterfaceByDescriptorSlot(
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -0700958 SHADER_MODULE_STATE const *src, std::unordered_set<uint32_t> const &accessible_ids, bool *has_writable_descriptor) {
Chris Forbes47567b72017-06-09 12:09:45 -0700959 std::vector<std::pair<descriptor_slot_t, interface_var>> out;
960
961 for (auto id : accessible_ids) {
962 auto insn = src->get_def(id);
963 assert(insn != src->end());
964
965 if (insn.opcode() == spv::OpVariable &&
Chris Forbes9f89d752018-03-07 12:57:48 -0800966 (insn.word(3) == spv::StorageClassUniform || insn.word(3) == spv::StorageClassUniformConstant ||
967 insn.word(3) == spv::StorageClassStorageBuffer)) {
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800968 auto d = src->get_decorations(insn.word(2));
969 unsigned set = d.descriptor_set;
970 unsigned binding = d.binding;
Chris Forbes47567b72017-06-09 12:09:45 -0700971
972 interface_var v = {};
973 v.id = insn.word(2);
974 v.type_id = insn.word(1);
locke-lunarg654e3692020-06-04 17:19:15 -0600975 v.is_writable = false;
Chris Forbes8af24522018-03-07 11:37:45 -0800976
Chris Forbes8a6d8cb2019-02-14 14:33:08 -0800977 if (!(d.flags & decoration_set::nonwritable_bit) &&
locke-lunarg6f760f12020-06-05 16:19:37 -0600978 IsWritableDescriptorType(src, insn, insn.word(3) == spv::StorageClassStorageBuffer)) {
Chris Forbes8af24522018-03-07 11:37:45 -0800979 *has_writable_descriptor = true;
locke-lunarg654e3692020-06-04 17:19:15 -0600980 v.is_writable = true;
Chris Forbes8af24522018-03-07 11:37:45 -0800981 }
locke-lunarg654e3692020-06-04 17:19:15 -0600982 out.emplace_back(std::make_pair(set, binding), v);
Chris Forbes47567b72017-06-09 12:09:45 -0700983 }
984 }
985
986 return out;
987}
988
locke-lunarg96dc9632020-06-10 17:22:18 -0600989std::unordered_set<uint32_t> CollectWritableOutputLocationinFS(const SHADER_MODULE_STATE &module,
990 const VkPipelineShaderStageCreateInfo &stage_info) {
991 std::unordered_set<uint32_t> location_list;
992 if (stage_info.stage != VK_SHADER_STAGE_FRAGMENT_BIT) return location_list;
993 const auto entrypoint = FindEntrypoint(&module, stage_info.pName, stage_info.stage);
994 const auto outputs = CollectInterfaceByLocation(&module, entrypoint, spv::StorageClassOutput, false);
995 std::unordered_set<unsigned> store_members;
996 std::unordered_map<unsigned, unsigned> accesschain_members;
997
998 for (auto insn : module) {
999 switch (insn.opcode()) {
1000 case spv::OpStore:
1001 case spv::OpAtomicStore: {
1002 store_members.insert(insn.word(1)); // object id or AccessChain id
1003 break;
1004 }
1005 case spv::OpAccessChain: {
1006 // 2: AccessChain id, 3: object id
1007 if (insn.word(3)) accesschain_members.insert(std::make_pair(insn.word(2), insn.word(3)));
1008 break;
1009 }
1010 default:
1011 break;
1012 }
1013 }
1014 if (store_members.empty()) {
1015 return location_list;
1016 }
1017 for (auto output : outputs) {
1018 auto store_it = store_members.find(output.second.id);
1019 if (store_it != store_members.end()) {
1020 location_list.insert(output.first.first);
1021 store_members.erase(store_it);
1022 continue;
1023 }
1024 store_it = store_members.begin();
1025 while (store_it != store_members.end()) {
1026 auto accesschain_it = accesschain_members.find(*store_it);
1027 if (accesschain_it == accesschain_members.end()) {
1028 ++store_it;
1029 continue;
1030 }
1031 if (accesschain_it->second == output.second.id) {
1032 location_list.insert(output.first.first);
1033 store_members.erase(store_it);
1034 accesschain_members.erase(accesschain_it);
1035 break;
1036 }
1037 ++store_it;
1038 }
1039 }
1040 return location_list;
1041}
1042
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001043bool CoreChecks::ValidateViConsistency(VkPipelineVertexInputStateCreateInfo const *vi) const {
Chris Forbes47567b72017-06-09 12:09:45 -07001044 // Walk the binding descriptions, which describe the step rate and stride of each vertex buffer. Each binding should
1045 // be specified only once.
1046 std::unordered_map<uint32_t, VkVertexInputBindingDescription const *> bindings;
1047 bool skip = false;
1048
1049 for (unsigned i = 0; i < vi->vertexBindingDescriptionCount; i++) {
1050 auto desc = &vi->pVertexBindingDescriptions[i];
1051 auto &binding = bindings[desc->binding];
1052 if (binding) {
Dave Houlton78d09922018-05-17 15:48:45 -06001053 // TODO: "VUID-VkGraphicsPipelineCreateInfo-pStages-00742" perhaps?
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001054 skip |= LogError(device, kVUID_Core_Shader_InconsistentVi, "Duplicate vertex input binding descriptions for binding %d",
1055 desc->binding);
Chris Forbes47567b72017-06-09 12:09:45 -07001056 } else {
1057 binding = desc;
1058 }
1059 }
1060
1061 return skip;
1062}
1063
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001064bool CoreChecks::ValidateViAgainstVsInputs(VkPipelineVertexInputStateCreateInfo const *vi, SHADER_MODULE_STATE const *vs,
1065 spirv_inst_iter entrypoint) const {
Chris Forbes47567b72017-06-09 12:09:45 -07001066 bool skip = false;
1067
Petr Kraus25810d02019-08-27 17:41:15 +02001068 const auto inputs = CollectInterfaceByLocation(vs, entrypoint, spv::StorageClassInput, false);
Chris Forbes47567b72017-06-09 12:09:45 -07001069
1070 // Build index by location
Petr Kraus25810d02019-08-27 17:41:15 +02001071 std::map<uint32_t, const VkVertexInputAttributeDescription *> attribs;
Chris Forbes47567b72017-06-09 12:09:45 -07001072 if (vi) {
Petr Kraus25810d02019-08-27 17:41:15 +02001073 for (uint32_t i = 0; i < vi->vertexAttributeDescriptionCount; ++i) {
1074 const auto num_locations = GetLocationsConsumedByFormat(vi->pVertexAttributeDescriptions[i].format);
1075 for (uint32_t j = 0; j < num_locations; ++j) {
Chris Forbes47567b72017-06-09 12:09:45 -07001076 attribs[vi->pVertexAttributeDescriptions[i].location + j] = &vi->pVertexAttributeDescriptions[i];
1077 }
1078 }
1079 }
1080
Petr Kraus25810d02019-08-27 17:41:15 +02001081 struct AttribInputPair {
1082 const VkVertexInputAttributeDescription *attrib = nullptr;
1083 const interface_var *input = nullptr;
1084 };
1085 std::map<uint32_t, AttribInputPair> location_map;
1086 for (const auto &attrib_it : attribs) location_map[attrib_it.first].attrib = attrib_it.second;
1087 for (const auto &input_it : inputs) location_map[input_it.first.first].input = &input_it.second;
Chris Forbes47567b72017-06-09 12:09:45 -07001088
Jamie Madillc1f7ca82020-03-16 17:08:26 -04001089 for (const auto &location_it : location_map) {
Petr Kraus25810d02019-08-27 17:41:15 +02001090 const auto location = location_it.first;
1091 const auto attrib = location_it.second.attrib;
1092 const auto input = location_it.second.input;
Mark Lobodzinski7caa39c2018-07-25 15:48:34 -06001093
Petr Kraus25810d02019-08-27 17:41:15 +02001094 if (attrib && !input) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001095 skip |= LogPerformanceWarning(vs->vk_shader_module, kVUID_Core_Shader_OutputNotConsumed,
1096 "Vertex attribute at location %" PRIu32 " not consumed by vertex shader", location);
Petr Kraus25810d02019-08-27 17:41:15 +02001097 } else if (!attrib && input) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001098 skip |= LogError(vs->vk_shader_module, kVUID_Core_Shader_InputNotProduced,
1099 "Vertex shader consumes input at location %" PRIu32 " but not provided", location);
Petr Kraus25810d02019-08-27 17:41:15 +02001100 } else if (attrib && input) {
1101 const auto attrib_type = GetFormatType(attrib->format);
1102 const auto input_type = GetFundamentalType(vs, input->type_id);
Chris Forbes47567b72017-06-09 12:09:45 -07001103
1104 // Type checking
1105 if (!(attrib_type & input_type)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001106 skip |= LogError(vs->vk_shader_module, kVUID_Core_Shader_InterfaceTypeMismatch,
1107 "Attribute type of `%s` at location %" PRIu32 " does not match vertex shader input type of `%s`",
1108 string_VkFormat(attrib->format), location, DescribeType(vs, input->type_id).c_str());
Chris Forbes47567b72017-06-09 12:09:45 -07001109 }
Petr Kraus25810d02019-08-27 17:41:15 +02001110 } else { // !attrib && !input
1111 assert(false); // at least one exists in the map
Chris Forbes47567b72017-06-09 12:09:45 -07001112 }
1113 }
1114
1115 return skip;
1116}
1117
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001118bool CoreChecks::ValidateFsOutputsAgainstRenderPass(SHADER_MODULE_STATE const *fs, spirv_inst_iter entrypoint,
1119 PIPELINE_STATE const *pipeline, uint32_t subpass_index) const {
Petr Kraus25810d02019-08-27 17:41:15 +02001120 bool skip = false;
Chris Forbes8bca1652017-07-20 11:10:09 -07001121
Petr Kraus25810d02019-08-27 17:41:15 +02001122 const auto rpci = pipeline->rp_state->createInfo.ptr();
1123
Jeremy Hayes3699c7c2019-10-09 12:24:55 -06001124 struct Attachment {
1125 const VkAttachmentReference2KHR *reference = nullptr;
1126 const VkAttachmentDescription2KHR *attachment = nullptr;
1127 const interface_var *output = nullptr;
1128 };
1129 std::map<uint32_t, Attachment> location_map;
1130
Petr Kraus25810d02019-08-27 17:41:15 +02001131 const auto subpass = rpci->pSubpasses[subpass_index];
1132 for (uint32_t i = 0; i < subpass.colorAttachmentCount; ++i) {
Jeremy Hayes3699c7c2019-10-09 12:24:55 -06001133 auto const &reference = subpass.pColorAttachments[i];
1134 location_map[i].reference = &reference;
1135 if (reference.attachment != VK_ATTACHMENT_UNUSED &&
1136 rpci->pAttachments[reference.attachment].format != VK_FORMAT_UNDEFINED) {
1137 location_map[i].attachment = &rpci->pAttachments[reference.attachment];
Chris Forbes47567b72017-06-09 12:09:45 -07001138 }
1139 }
1140
Chris Forbes47567b72017-06-09 12:09:45 -07001141 // TODO: dual source blend index (spv::DecIndex, zero if not provided)
1142
Petr Kraus25810d02019-08-27 17:41:15 +02001143 const auto outputs = CollectInterfaceByLocation(fs, entrypoint, spv::StorageClassOutput, false);
Jeremy Hayes3699c7c2019-10-09 12:24:55 -06001144 for (const auto &output_it : outputs) {
1145 auto const location = output_it.first.first;
1146 location_map[location].output = &output_it.second;
1147 }
Chris Forbes47567b72017-06-09 12:09:45 -07001148
Petr Kraus25810d02019-08-27 17:41:15 +02001149 const bool alphaToCoverageEnabled = pipeline->graphicsPipelineCI.pMultisampleState != NULL &&
1150 pipeline->graphicsPipelineCI.pMultisampleState->alphaToCoverageEnable == VK_TRUE;
Chris Forbes47567b72017-06-09 12:09:45 -07001151
Jamie Madillc1f7ca82020-03-16 17:08:26 -04001152 for (const auto &location_it : location_map) {
Jeremy Hayes3699c7c2019-10-09 12:24:55 -06001153 const auto reference = location_it.second.reference;
1154 if (reference != nullptr && reference->attachment == VK_ATTACHMENT_UNUSED) {
1155 continue;
1156 }
1157
Petr Kraus25810d02019-08-27 17:41:15 +02001158 const auto location = location_it.first;
1159 const auto attachment = location_it.second.attachment;
1160 const auto output = location_it.second.output;
Petr Kraus25810d02019-08-27 17:41:15 +02001161 if (attachment && !output) {
1162 if (pipeline->attachments[location].colorWriteMask != 0) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001163 skip |= LogWarning(fs->vk_shader_module, kVUID_Core_Shader_InputNotProduced,
1164 "Attachment %" PRIu32
1165 " not written by fragment shader; undefined values will be written to attachment",
1166 location);
Petr Kraus25810d02019-08-27 17:41:15 +02001167 }
1168 } else if (!attachment && output) {
1169 if (!(alphaToCoverageEnabled && location == 0)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001170 skip |= LogWarning(fs->vk_shader_module, kVUID_Core_Shader_OutputNotConsumed,
1171 "fragment shader writes to output location %" PRIu32 " with no matching attachment", location);
Ari Suonpaa412b23b2019-02-26 07:56:58 +02001172 }
Petr Kraus25810d02019-08-27 17:41:15 +02001173 } else if (attachment && output) {
1174 const auto attachment_type = GetFormatType(attachment->format);
1175 const auto output_type = GetFundamentalType(fs, output->type_id);
Chris Forbes47567b72017-06-09 12:09:45 -07001176
1177 // Type checking
Petr Kraus25810d02019-08-27 17:41:15 +02001178 if (!(output_type & attachment_type)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001179 skip |=
1180 LogWarning(fs->vk_shader_module, kVUID_Core_Shader_InterfaceTypeMismatch,
1181 "Attachment %" PRIu32
1182 " of type `%s` does not match fragment shader output type of `%s`; resulting values are undefined",
1183 location, string_VkFormat(attachment->format), DescribeType(fs, output->type_id).c_str());
Chris Forbes47567b72017-06-09 12:09:45 -07001184 }
Petr Kraus25810d02019-08-27 17:41:15 +02001185 } else { // !attachment && !output
1186 assert(false); // at least one exists in the map
Chris Forbes47567b72017-06-09 12:09:45 -07001187 }
1188 }
1189
Petr Kraus25810d02019-08-27 17:41:15 +02001190 const auto output_zero = location_map.count(0) ? location_map[0].output : nullptr;
1191 bool locationZeroHasAlpha = output_zero && fs->get_def(output_zero->type_id) != fs->end() &&
1192 GetComponentsConsumedByType(fs, output_zero->type_id, false) == 4;
Ari Suonpaa412b23b2019-02-26 07:56:58 +02001193 if (alphaToCoverageEnabled && !locationZeroHasAlpha) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001194 skip |= LogError(fs->vk_shader_module, kVUID_Core_Shader_NoAlphaAtLocation0WithAlphaToCoverage,
1195 "fragment shader doesn't declare alpha output at location 0 even though alpha to coverage is enabled.");
Ari Suonpaa412b23b2019-02-26 07:56:58 +02001196 }
1197
Chris Forbes47567b72017-06-09 12:09:45 -07001198 return skip;
1199}
1200
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06001201// For PointSize analysis we need to know if the variable decorated with the PointSize built-in was actually written to.
1202// This function examines instructions in the static call tree for a write to this variable.
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06001203static bool IsPointSizeWritten(SHADER_MODULE_STATE const *src, spirv_inst_iter builtin_instr, spirv_inst_iter entrypoint) {
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06001204 auto type = builtin_instr.opcode();
1205 uint32_t target_id = builtin_instr.word(1);
1206 bool init_complete = false;
1207
1208 if (type == spv::OpMemberDecorate) {
1209 // Built-in is part of a structure -- examine instructions up to first function body to get initial IDs
1210 auto insn = entrypoint;
1211 while (!init_complete && (insn.opcode() != spv::OpFunction)) {
1212 switch (insn.opcode()) {
1213 case spv::OpTypePointer:
1214 if ((insn.word(3) == target_id) && (insn.word(2) == spv::StorageClassOutput)) {
1215 target_id = insn.word(1);
1216 }
1217 break;
1218 case spv::OpVariable:
1219 if (insn.word(1) == target_id) {
1220 target_id = insn.word(2);
1221 init_complete = true;
1222 }
1223 break;
1224 }
1225 insn++;
1226 }
1227 }
1228
Mark Lobodzinskif84b0b42018-09-11 14:54:32 -06001229 if (!init_complete && (type == spv::OpMemberDecorate)) return false;
1230
1231 bool found_write = false;
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06001232 std::unordered_set<uint32_t> worklist;
1233 worklist.insert(entrypoint.word(2));
1234
1235 // Follow instructions in call graph looking for writes to target
1236 while (!worklist.empty() && !found_write) {
1237 auto id_iter = worklist.begin();
1238 auto id = *id_iter;
1239 worklist.erase(id_iter);
1240
1241 auto insn = src->get_def(id);
1242 if (insn == src->end()) {
1243 continue;
1244 }
1245
1246 if (insn.opcode() == spv::OpFunction) {
1247 // Scan body of function looking for other function calls or items in our ID chain
1248 while (++insn, insn.opcode() != spv::OpFunctionEnd) {
1249 switch (insn.opcode()) {
1250 case spv::OpAccessChain:
1251 if (insn.word(3) == target_id) {
1252 if (type == spv::OpMemberDecorate) {
1253 auto value = GetConstantValue(src, insn.word(4));
1254 if (value == builtin_instr.word(2)) {
1255 target_id = insn.word(2);
1256 }
1257 } else {
1258 target_id = insn.word(2);
1259 }
1260 }
1261 break;
1262 case spv::OpStore:
1263 if (insn.word(1) == target_id) {
1264 found_write = true;
1265 }
1266 break;
1267 case spv::OpFunctionCall:
1268 worklist.insert(insn.word(3));
1269 break;
1270 }
1271 }
1272 }
1273 }
1274 return found_write;
1275}
1276
Chris Forbes47567b72017-06-09 12:09:45 -07001277// For some analyses, we need to know about all ids referenced by the static call tree of a particular entrypoint. This is
1278// important for identifying the set of shader resources actually used by an entrypoint, for example.
1279// Note: we only explore parts of the image which might actually contain ids we care about for the above analyses.
1280// - NOT the shader input/output interfaces.
1281//
1282// TODO: The set of interesting opcodes here was determined by eyeballing the SPIRV spec. It might be worth
1283// converting parts of this to be generated from the machine-readable spec instead.
locke-lunargd9a069d2019-09-17 01:50:19 -06001284std::unordered_set<uint32_t> MarkAccessibleIds(SHADER_MODULE_STATE const *src, spirv_inst_iter entrypoint) {
Chris Forbes47567b72017-06-09 12:09:45 -07001285 std::unordered_set<uint32_t> ids;
1286 std::unordered_set<uint32_t> worklist;
1287 worklist.insert(entrypoint.word(2));
1288
1289 while (!worklist.empty()) {
1290 auto id_iter = worklist.begin();
1291 auto id = *id_iter;
1292 worklist.erase(id_iter);
1293
1294 auto insn = src->get_def(id);
1295 if (insn == src->end()) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06001296 // ID is something we didn't collect in BuildDefIndex. that's OK -- we'll stumble across all kinds of things here
Chris Forbes47567b72017-06-09 12:09:45 -07001297 // that we may not care about.
1298 continue;
1299 }
1300
1301 // Try to add to the output set
1302 if (!ids.insert(id).second) {
1303 continue; // If we already saw this id, we don't want to walk it again.
1304 }
1305
1306 switch (insn.opcode()) {
1307 case spv::OpFunction:
1308 // Scan whole body of the function, enlisting anything interesting
1309 while (++insn, insn.opcode() != spv::OpFunctionEnd) {
1310 switch (insn.opcode()) {
1311 case spv::OpLoad:
1312 case spv::OpAtomicLoad:
1313 case spv::OpAtomicExchange:
1314 case spv::OpAtomicCompareExchange:
1315 case spv::OpAtomicCompareExchangeWeak:
1316 case spv::OpAtomicIIncrement:
1317 case spv::OpAtomicIDecrement:
1318 case spv::OpAtomicIAdd:
1319 case spv::OpAtomicISub:
1320 case spv::OpAtomicSMin:
1321 case spv::OpAtomicUMin:
1322 case spv::OpAtomicSMax:
1323 case spv::OpAtomicUMax:
1324 case spv::OpAtomicAnd:
1325 case spv::OpAtomicOr:
1326 case spv::OpAtomicXor:
1327 worklist.insert(insn.word(3)); // ptr
1328 break;
1329 case spv::OpStore:
1330 case spv::OpAtomicStore:
1331 worklist.insert(insn.word(1)); // ptr
1332 break;
1333 case spv::OpAccessChain:
1334 case spv::OpInBoundsAccessChain:
1335 worklist.insert(insn.word(3)); // base ptr
1336 break;
1337 case spv::OpSampledImage:
1338 case spv::OpImageSampleImplicitLod:
1339 case spv::OpImageSampleExplicitLod:
1340 case spv::OpImageSampleDrefImplicitLod:
1341 case spv::OpImageSampleDrefExplicitLod:
1342 case spv::OpImageSampleProjImplicitLod:
1343 case spv::OpImageSampleProjExplicitLod:
1344 case spv::OpImageSampleProjDrefImplicitLod:
1345 case spv::OpImageSampleProjDrefExplicitLod:
1346 case spv::OpImageFetch:
1347 case spv::OpImageGather:
1348 case spv::OpImageDrefGather:
1349 case spv::OpImageRead:
1350 case spv::OpImage:
1351 case spv::OpImageQueryFormat:
1352 case spv::OpImageQueryOrder:
1353 case spv::OpImageQuerySizeLod:
1354 case spv::OpImageQuerySize:
1355 case spv::OpImageQueryLod:
1356 case spv::OpImageQueryLevels:
1357 case spv::OpImageQuerySamples:
1358 case spv::OpImageSparseSampleImplicitLod:
1359 case spv::OpImageSparseSampleExplicitLod:
1360 case spv::OpImageSparseSampleDrefImplicitLod:
1361 case spv::OpImageSparseSampleDrefExplicitLod:
1362 case spv::OpImageSparseSampleProjImplicitLod:
1363 case spv::OpImageSparseSampleProjExplicitLod:
1364 case spv::OpImageSparseSampleProjDrefImplicitLod:
1365 case spv::OpImageSparseSampleProjDrefExplicitLod:
1366 case spv::OpImageSparseFetch:
1367 case spv::OpImageSparseGather:
1368 case spv::OpImageSparseDrefGather:
1369 case spv::OpImageTexelPointer:
1370 worklist.insert(insn.word(3)); // Image or sampled image
1371 break;
1372 case spv::OpImageWrite:
1373 worklist.insert(insn.word(1)); // Image -- different operand order to above
1374 break;
1375 case spv::OpFunctionCall:
1376 for (uint32_t i = 3; i < insn.len(); i++) {
1377 worklist.insert(insn.word(i)); // fn itself, and all args
1378 }
1379 break;
1380
1381 case spv::OpExtInst:
1382 for (uint32_t i = 5; i < insn.len(); i++) {
1383 worklist.insert(insn.word(i)); // Operands to ext inst
1384 }
1385 break;
1386 }
1387 }
1388 break;
1389 }
1390 }
1391
1392 return ids;
1393}
1394
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001395bool CoreChecks::ValidatePushConstantBlockAgainstPipeline(std::vector<VkPushConstantRange> const *push_constant_ranges,
1396 SHADER_MODULE_STATE const *src, spirv_inst_iter type,
1397 VkShaderStageFlagBits stage) const {
Chris Forbes47567b72017-06-09 12:09:45 -07001398 bool skip = false;
1399
1400 // Strip off ptrs etc
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06001401 type = GetStructType(src, type, false);
Chris Forbes47567b72017-06-09 12:09:45 -07001402 assert(type != src->end());
1403
1404 // Validate directly off the offsets. this isn't quite correct for arrays and matrices, but is a good first step.
1405 // TODO: arrays, matrices, weird sizes
1406 for (auto insn : *src) {
1407 if (insn.opcode() == spv::OpMemberDecorate && insn.word(1) == type.word(1)) {
1408 if (insn.word(3) == spv::DecorationOffset) {
Jeremy Hayesadf93862020-07-22 14:29:30 -06001409 auto const member = insn.word(2);
1410 auto const offset = insn.word(4);
1411 auto const size = 4; // Bytes; TODO: calculate this based on the type
Chris Forbes47567b72017-06-09 12:09:45 -07001412
1413 bool found_range = false;
1414 for (auto const &range : *push_constant_ranges) {
Jeremy Hayese883b362019-12-10 15:12:26 -07001415 if ((range.offset <= offset) && ((range.offset + range.size) >= (offset + size)) &&
1416 (range.stageFlags & stage)) {
Chris Forbes47567b72017-06-09 12:09:45 -07001417 found_range = true;
1418
Chris Forbes47567b72017-06-09 12:09:45 -07001419 break;
1420 }
1421 }
1422
1423 if (!found_range) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001424 skip |= LogError(device, kVUID_Core_Shader_PushConstantOutOfRange,
Jeremy Hayesadf93862020-07-22 14:29:30 -06001425 "Shader push-constant buffer member %u at offset %u is not declared in pipeline layout",
1426 member, offset);
Chris Forbes47567b72017-06-09 12:09:45 -07001427 }
1428 }
1429 }
1430 }
1431
1432 return skip;
1433}
1434
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001435bool CoreChecks::ValidatePushConstantUsage(std::vector<VkPushConstantRange> const *push_constant_ranges,
1436 SHADER_MODULE_STATE const *src, std::unordered_set<uint32_t> accessible_ids,
1437 VkShaderStageFlagBits stage) const {
Chris Forbes47567b72017-06-09 12:09:45 -07001438 bool skip = false;
1439
1440 for (auto id : accessible_ids) {
1441 auto def_insn = src->get_def(id);
1442 if (def_insn.opcode() == spv::OpVariable && def_insn.word(3) == spv::StorageClassPushConstant) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001443 skip |= ValidatePushConstantBlockAgainstPipeline(push_constant_ranges, src, src->get_def(def_insn.word(1)), stage);
Chris Forbes47567b72017-06-09 12:09:45 -07001444 }
1445 }
1446
1447 return skip;
1448}
1449
1450// Validate that data for each specialization entry is fully contained within the buffer.
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001451bool CoreChecks::ValidateSpecializationOffsets(VkPipelineShaderStageCreateInfo const *info) const {
Chris Forbes47567b72017-06-09 12:09:45 -07001452 bool skip = false;
1453
1454 VkSpecializationInfo const *spec = info->pSpecializationInfo;
1455
1456 if (spec) {
1457 for (auto i = 0u; i < spec->mapEntryCount; i++) {
Jeremy Hayes6c555c32019-09-09 17:14:09 -06001458 if (spec->pMapEntries[i].offset >= spec->dataSize) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001459 skip |= LogError(device, "VUID-VkSpecializationInfo-offset-00773",
1460 "Specialization entry %u (for constant id %u) references memory outside provided specialization "
1461 "data (bytes %u.." PRINTF_SIZE_T_SPECIFIER "; " PRINTF_SIZE_T_SPECIFIER " bytes provided)..",
1462 i, spec->pMapEntries[i].constantID, spec->pMapEntries[i].offset,
1463 spec->pMapEntries[i].offset + spec->dataSize - 1, spec->dataSize);
Jeremy Hayes6c555c32019-09-09 17:14:09 -06001464
1465 continue;
1466 }
Chris Forbes47567b72017-06-09 12:09:45 -07001467 if (spec->pMapEntries[i].offset + spec->pMapEntries[i].size > spec->dataSize) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001468 skip |= LogError(device, "VUID-VkSpecializationInfo-pMapEntries-00774",
1469 "Specialization entry %u (for constant id %u) references memory outside provided specialization "
1470 "data (bytes %u.." PRINTF_SIZE_T_SPECIFIER "; " PRINTF_SIZE_T_SPECIFIER " bytes provided)..",
1471 i, spec->pMapEntries[i].constantID, spec->pMapEntries[i].offset,
1472 spec->pMapEntries[i].offset + spec->pMapEntries[i].size - 1, spec->dataSize);
Chris Forbes47567b72017-06-09 12:09:45 -07001473 }
1474 }
1475 }
1476
1477 return skip;
1478}
1479
Jeff Bolz38b3ce72018-09-19 12:53:38 -05001480// TODO (jbolz): Can this return a const reference?
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06001481static std::set<uint32_t> TypeToDescriptorTypeSet(SHADER_MODULE_STATE const *module, uint32_t type_id, unsigned &descriptor_count) {
Chris Forbes47567b72017-06-09 12:09:45 -07001482 auto type = module->get_def(type_id);
Chris Forbes9f89d752018-03-07 12:57:48 -08001483 bool is_storage_buffer = false;
Chris Forbes47567b72017-06-09 12:09:45 -07001484 descriptor_count = 1;
Jeff Bolze54ae892018-09-08 12:16:29 -05001485 std::set<uint32_t> ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001486
1487 // Strip off any array or ptrs. Where we remove array levels, adjust the descriptor count for each dimension.
Jeff Bolzfdf96072018-04-10 14:32:18 -05001488 while (type.opcode() == spv::OpTypeArray || type.opcode() == spv::OpTypePointer || type.opcode() == spv::OpTypeRuntimeArray) {
1489 if (type.opcode() == spv::OpTypeRuntimeArray) {
1490 descriptor_count = 0;
1491 type = module->get_def(type.word(2));
1492 } else if (type.opcode() == spv::OpTypeArray) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06001493 descriptor_count *= GetConstantValue(module, type.word(3));
Chris Forbes47567b72017-06-09 12:09:45 -07001494 type = module->get_def(type.word(2));
1495 } else {
Chris Forbes9f89d752018-03-07 12:57:48 -08001496 if (type.word(2) == spv::StorageClassStorageBuffer) {
1497 is_storage_buffer = true;
1498 }
Chris Forbes47567b72017-06-09 12:09:45 -07001499 type = module->get_def(type.word(3));
1500 }
1501 }
1502
1503 switch (type.opcode()) {
1504 case spv::OpTypeStruct: {
1505 for (auto insn : *module) {
1506 if (insn.opcode() == spv::OpDecorate && insn.word(1) == type.word(1)) {
1507 if (insn.word(2) == spv::DecorationBlock) {
Chris Forbes9f89d752018-03-07 12:57:48 -08001508 if (is_storage_buffer) {
Jeff Bolze54ae892018-09-08 12:16:29 -05001509 ret.insert(VK_DESCRIPTOR_TYPE_STORAGE_BUFFER);
1510 ret.insert(VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC);
1511 return ret;
Chris Forbes9f89d752018-03-07 12:57:48 -08001512 } else {
Jeff Bolze54ae892018-09-08 12:16:29 -05001513 ret.insert(VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER);
1514 ret.insert(VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC);
1515 ret.insert(VK_DESCRIPTOR_TYPE_INLINE_UNIFORM_BLOCK_EXT);
1516 return ret;
Chris Forbes9f89d752018-03-07 12:57:48 -08001517 }
Chris Forbes47567b72017-06-09 12:09:45 -07001518 } else if (insn.word(2) == spv::DecorationBufferBlock) {
Jeff Bolze54ae892018-09-08 12:16:29 -05001519 ret.insert(VK_DESCRIPTOR_TYPE_STORAGE_BUFFER);
1520 ret.insert(VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC);
1521 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001522 }
1523 }
1524 }
1525
1526 // Invalid
Jeff Bolze54ae892018-09-08 12:16:29 -05001527 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001528 }
1529
1530 case spv::OpTypeSampler:
Jeff Bolze54ae892018-09-08 12:16:29 -05001531 ret.insert(VK_DESCRIPTOR_TYPE_SAMPLER);
1532 ret.insert(VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER);
1533 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001534
Chris Forbes73c00bf2018-06-22 16:28:06 -07001535 case spv::OpTypeSampledImage: {
1536 // Slight relaxation for some GLSL historical madness: samplerBuffer doesn't really have a sampler, and a texel
1537 // buffer descriptor doesn't really provide one. Allow this slight mismatch.
1538 auto image_type = module->get_def(type.word(2));
1539 auto dim = image_type.word(3);
1540 auto sampled = image_type.word(7);
1541 if (dim == spv::DimBuffer && sampled == 1) {
Jeff Bolze54ae892018-09-08 12:16:29 -05001542 ret.insert(VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER);
1543 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001544 }
Chris Forbes73c00bf2018-06-22 16:28:06 -07001545 }
Jeff Bolze54ae892018-09-08 12:16:29 -05001546 ret.insert(VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER);
1547 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001548
1549 case spv::OpTypeImage: {
1550 // Many descriptor types backing image types-- depends on dimension and whether the image will be used with a sampler.
1551 // SPIRV for Vulkan requires that sampled be 1 or 2 -- leaving the decision to runtime is unacceptable.
1552 auto dim = type.word(3);
1553 auto sampled = type.word(7);
1554
1555 if (dim == spv::DimSubpassData) {
Jeff Bolze54ae892018-09-08 12:16:29 -05001556 ret.insert(VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT);
1557 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001558 } else if (dim == spv::DimBuffer) {
1559 if (sampled == 1) {
Jeff Bolze54ae892018-09-08 12:16:29 -05001560 ret.insert(VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER);
1561 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001562 } else {
Jeff Bolze54ae892018-09-08 12:16:29 -05001563 ret.insert(VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER);
1564 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001565 }
1566 } else if (sampled == 1) {
Jeff Bolze54ae892018-09-08 12:16:29 -05001567 ret.insert(VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE);
1568 ret.insert(VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER);
1569 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001570 } else {
Jeff Bolze54ae892018-09-08 12:16:29 -05001571 ret.insert(VK_DESCRIPTOR_TYPE_STORAGE_IMAGE);
1572 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001573 }
1574 }
Shannon McPherson0fa28232018-11-01 11:59:02 -06001575 case spv::OpTypeAccelerationStructureNV:
Eric Werness30127fd2018-10-31 21:01:03 -07001576 ret.insert(VK_DESCRIPTOR_TYPE_ACCELERATION_STRUCTURE_NV);
Jeff Bolz105d6492018-09-29 15:46:44 -05001577 return ret;
Chris Forbes47567b72017-06-09 12:09:45 -07001578
1579 // We shouldn't really see any other junk types -- but if we do, they're a mismatch.
1580 default:
Jeff Bolze54ae892018-09-08 12:16:29 -05001581 return ret; // Matches nothing
Chris Forbes47567b72017-06-09 12:09:45 -07001582 }
1583}
1584
Jeff Bolze54ae892018-09-08 12:16:29 -05001585static std::string string_descriptorTypes(const std::set<uint32_t> &descriptor_types) {
Chris Forbes73c00bf2018-06-22 16:28:06 -07001586 std::stringstream ss;
Jeff Bolze54ae892018-09-08 12:16:29 -05001587 for (auto it = descriptor_types.begin(); it != descriptor_types.end(); ++it) {
1588 if (ss.tellp()) ss << ", ";
1589 ss << string_VkDescriptorType(VkDescriptorType(*it));
Chris Forbes73c00bf2018-06-22 16:28:06 -07001590 }
1591 return ss.str();
1592}
1593
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001594bool CoreChecks::RequirePropertyFlag(VkBool32 check, char const *flag, char const *structure) const {
Jeff Bolzee743412019-06-20 22:24:32 -05001595 if (!check) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001596 if (LogError(device, kVUID_Core_Shader_ExceedDeviceLimit,
1597 "Shader requires flag %s set in %s but it is not set on the device", flag, structure)) {
Jeff Bolzee743412019-06-20 22:24:32 -05001598 return true;
1599 }
1600 }
1601
1602 return false;
1603}
1604
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001605bool CoreChecks::RequireFeature(VkBool32 feature, char const *feature_name) const {
Chris Forbes47567b72017-06-09 12:09:45 -07001606 if (!feature) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001607 if (LogError(device, kVUID_Core_Shader_FeatureNotEnabled, "Shader requires %s but is not enabled on the device",
1608 feature_name)) {
Chris Forbes47567b72017-06-09 12:09:45 -07001609 return true;
1610 }
1611 }
1612
1613 return false;
1614}
1615
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001616bool CoreChecks::RequireExtension(bool extension, char const *extension_name) const {
Chris Forbes47567b72017-06-09 12:09:45 -07001617 if (!extension) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07001618 if (LogError(device, kVUID_Core_Shader_FeatureNotEnabled, "Shader requires extension %s but is not enabled on the device",
1619 extension_name)) {
Chris Forbes47567b72017-06-09 12:09:45 -07001620 return true;
1621 }
1622 }
1623
1624 return false;
1625}
1626
John Zulaufac4c6e12019-07-01 16:05:58 -06001627bool CoreChecks::ValidateShaderCapabilities(SHADER_MODULE_STATE const *src, VkShaderStageFlagBits stage) const {
Chris Forbes47567b72017-06-09 12:09:45 -07001628 bool skip = false;
1629
Mike Schuchardt8ed5ea02018-07-20 18:24:17 -06001630 struct FeaturePointer {
1631 // Callable object to test if this feature is enabled in the given aggregate feature struct
1632 const std::function<VkBool32(const DeviceFeatures &)> IsEnabled;
1633
1634 // Test if feature pointer is populated
1635 explicit operator bool() const { return static_cast<bool>(IsEnabled); }
1636
1637 // Default and nullptr constructor to create an empty FeaturePointer
1638 FeaturePointer() : IsEnabled(nullptr) {}
1639 FeaturePointer(std::nullptr_t ptr) : IsEnabled(nullptr) {}
1640
1641 // Constructors to populate FeaturePointer based on given pointer to member
1642 FeaturePointer(VkBool32 VkPhysicalDeviceFeatures::*ptr)
1643 : IsEnabled([=](const DeviceFeatures &features) { return features.core.*ptr; }) {}
Piers Daniell41b8c5d2020-01-10 15:42:00 -07001644 FeaturePointer(VkBool32 VkPhysicalDeviceVulkan11Features::*ptr)
1645 : IsEnabled([=](const DeviceFeatures &features) { return features.core11.*ptr; }) {}
1646 FeaturePointer(VkBool32 VkPhysicalDeviceVulkan12Features::*ptr)
1647 : IsEnabled([=](const DeviceFeatures &features) { return features.core12.*ptr; }) {}
Brett Lawsonbebfb6f2018-10-23 16:58:50 -07001648 FeaturePointer(VkBool32 VkPhysicalDeviceTransformFeedbackFeaturesEXT::*ptr)
1649 : IsEnabled([=](const DeviceFeatures &features) { return features.transform_feedback_features.*ptr; }) {}
Jeff Bolze4356752019-03-07 11:23:46 -06001650 FeaturePointer(VkBool32 VkPhysicalDeviceCooperativeMatrixFeaturesNV::*ptr)
1651 : IsEnabled([=](const DeviceFeatures &features) { return features.cooperative_matrix_features.*ptr; }) {}
Jason Macnakc5a621d2019-06-10 12:42:50 -07001652 FeaturePointer(VkBool32 VkPhysicalDeviceComputeShaderDerivativesFeaturesNV::*ptr)
1653 : IsEnabled([=](const DeviceFeatures &features) { return features.compute_shader_derivatives_features.*ptr; }) {}
Jason Macnak325e8b52019-06-10 13:33:10 -07001654 FeaturePointer(VkBool32 VkPhysicalDeviceFragmentShaderBarycentricFeaturesNV::*ptr)
1655 : IsEnabled([=](const DeviceFeatures &features) { return features.fragment_shader_barycentric_features.*ptr; }) {}
Jason Macnakd7fddf82019-06-13 09:52:49 -07001656 FeaturePointer(VkBool32 VkPhysicalDeviceShaderImageFootprintFeaturesNV::*ptr)
1657 : IsEnabled([=](const DeviceFeatures &features) { return features.shader_image_footprint_features.*ptr; }) {}
Jeff Bolz38f6cb52019-06-30 16:26:44 -05001658 FeaturePointer(VkBool32 VkPhysicalDeviceFragmentShaderInterlockFeaturesEXT::*ptr)
1659 : IsEnabled([=](const DeviceFeatures &features) { return features.fragment_shader_interlock_features.*ptr; }) {}
Jeff Bolza38fd3b2019-07-21 11:42:11 -05001660 FeaturePointer(VkBool32 VkPhysicalDeviceShaderDemoteToHelperInvocationFeaturesEXT::*ptr)
1661 : IsEnabled([=](const DeviceFeatures &features) { return features.demote_to_helper_invocation_features.*ptr; }) {}
Jeff Bolz443c2ca2020-03-19 12:11:51 -05001662 FeaturePointer(VkBool32 VkPhysicalDeviceRayTracingFeaturesKHR::*ptr)
1663 : IsEnabled([=](const DeviceFeatures &features) { return features.ray_tracing_features.*ptr; }) {}
Mike Schuchardt8ed5ea02018-07-20 18:24:17 -06001664 };
1665
Chris Forbes47567b72017-06-09 12:09:45 -07001666 struct CapabilityInfo {
1667 char const *name;
Mike Schuchardt8ed5ea02018-07-20 18:24:17 -06001668 FeaturePointer feature;
Tony-LunarG2ec96bb2019-11-26 13:43:02 -07001669 ExtEnabled DeviceExtensions::*extension;
Chris Forbes47567b72017-06-09 12:09:45 -07001670 };
1671
Chris Forbes47567b72017-06-09 12:09:45 -07001672 // clang-format off
Dave Houltoneb10ea82017-12-22 12:21:50 -07001673 static const std::unordered_multimap<uint32_t, CapabilityInfo> capabilities = {
Chris Forbes47567b72017-06-09 12:09:45 -07001674 // Capabilities always supported by a Vulkan 1.0 implementation -- no
1675 // feature bits.
1676 {spv::CapabilityMatrix, {nullptr}},
1677 {spv::CapabilityShader, {nullptr}},
1678 {spv::CapabilityInputAttachment, {nullptr}},
1679 {spv::CapabilitySampled1D, {nullptr}},
1680 {spv::CapabilityImage1D, {nullptr}},
1681 {spv::CapabilitySampledBuffer, {nullptr}},
Toni Merilehtib13a4a22019-05-21 12:58:44 +03001682 {spv::CapabilityStorageImageExtendedFormats, {nullptr}},
Chris Forbes47567b72017-06-09 12:09:45 -07001683 {spv::CapabilityImageQuery, {nullptr}},
1684 {spv::CapabilityDerivativeControl, {nullptr}},
1685
1686 // Capabilities that are optionally supported, but require a feature to
1687 // be enabled on the device
Mike Schuchardt8ed5ea02018-07-20 18:24:17 -06001688 {spv::CapabilityGeometry, {"VkPhysicalDeviceFeatures::geometryShader", &VkPhysicalDeviceFeatures::geometryShader}},
1689 {spv::CapabilityTessellation, {"VkPhysicalDeviceFeatures::tessellationShader", &VkPhysicalDeviceFeatures::tessellationShader}},
1690 {spv::CapabilityFloat64, {"VkPhysicalDeviceFeatures::shaderFloat64", &VkPhysicalDeviceFeatures::shaderFloat64}},
1691 {spv::CapabilityInt64, {"VkPhysicalDeviceFeatures::shaderInt64", &VkPhysicalDeviceFeatures::shaderInt64}},
1692 {spv::CapabilityTessellationPointSize, {"VkPhysicalDeviceFeatures::shaderTessellationAndGeometryPointSize", &VkPhysicalDeviceFeatures::shaderTessellationAndGeometryPointSize}},
1693 {spv::CapabilityGeometryPointSize, {"VkPhysicalDeviceFeatures::shaderTessellationAndGeometryPointSize", &VkPhysicalDeviceFeatures::shaderTessellationAndGeometryPointSize}},
1694 {spv::CapabilityImageGatherExtended, {"VkPhysicalDeviceFeatures::shaderImageGatherExtended", &VkPhysicalDeviceFeatures::shaderImageGatherExtended}},
1695 {spv::CapabilityStorageImageMultisample, {"VkPhysicalDeviceFeatures::shaderStorageImageMultisample", &VkPhysicalDeviceFeatures::shaderStorageImageMultisample}},
1696 {spv::CapabilityUniformBufferArrayDynamicIndexing, {"VkPhysicalDeviceFeatures::shaderUniformBufferArrayDynamicIndexing", &VkPhysicalDeviceFeatures::shaderUniformBufferArrayDynamicIndexing}},
1697 {spv::CapabilitySampledImageArrayDynamicIndexing, {"VkPhysicalDeviceFeatures::shaderSampledImageArrayDynamicIndexing", &VkPhysicalDeviceFeatures::shaderSampledImageArrayDynamicIndexing}},
1698 {spv::CapabilityStorageBufferArrayDynamicIndexing, {"VkPhysicalDeviceFeatures::shaderStorageBufferArrayDynamicIndexing", &VkPhysicalDeviceFeatures::shaderStorageBufferArrayDynamicIndexing}},
1699 {spv::CapabilityStorageImageArrayDynamicIndexing, {"VkPhysicalDeviceFeatures::shaderStorageImageArrayDynamicIndexing", &VkPhysicalDeviceFeatures::shaderStorageBufferArrayDynamicIndexing}},
1700 {spv::CapabilityClipDistance, {"VkPhysicalDeviceFeatures::shaderClipDistance", &VkPhysicalDeviceFeatures::shaderClipDistance}},
1701 {spv::CapabilityCullDistance, {"VkPhysicalDeviceFeatures::shaderCullDistance", &VkPhysicalDeviceFeatures::shaderCullDistance}},
1702 {spv::CapabilityImageCubeArray, {"VkPhysicalDeviceFeatures::imageCubeArray", &VkPhysicalDeviceFeatures::imageCubeArray}},
1703 {spv::CapabilitySampleRateShading, {"VkPhysicalDeviceFeatures::sampleRateShading", &VkPhysicalDeviceFeatures::sampleRateShading}},
1704 {spv::CapabilitySparseResidency, {"VkPhysicalDeviceFeatures::shaderResourceResidency", &VkPhysicalDeviceFeatures::shaderResourceResidency}},
1705 {spv::CapabilityMinLod, {"VkPhysicalDeviceFeatures::shaderResourceMinLod", &VkPhysicalDeviceFeatures::shaderResourceMinLod}},
1706 {spv::CapabilitySampledCubeArray, {"VkPhysicalDeviceFeatures::imageCubeArray", &VkPhysicalDeviceFeatures::imageCubeArray}},
1707 {spv::CapabilityImageMSArray, {"VkPhysicalDeviceFeatures::shaderStorageImageMultisample", &VkPhysicalDeviceFeatures::shaderStorageImageMultisample}},
Mike Schuchardt8ed5ea02018-07-20 18:24:17 -06001708 {spv::CapabilityInterpolationFunction, {"VkPhysicalDeviceFeatures::sampleRateShading", &VkPhysicalDeviceFeatures::sampleRateShading}},
1709 {spv::CapabilityStorageImageReadWithoutFormat, {"VkPhysicalDeviceFeatures::shaderStorageImageReadWithoutFormat", &VkPhysicalDeviceFeatures::shaderStorageImageReadWithoutFormat}},
1710 {spv::CapabilityStorageImageWriteWithoutFormat, {"VkPhysicalDeviceFeatures::shaderStorageImageWriteWithoutFormat", &VkPhysicalDeviceFeatures::shaderStorageImageWriteWithoutFormat}},
1711 {spv::CapabilityMultiViewport, {"VkPhysicalDeviceFeatures::multiViewport", &VkPhysicalDeviceFeatures::multiViewport}},
Jeff Bolzfdf96072018-04-10 14:32:18 -05001712
Mike Schuchardt8ed5ea02018-07-20 18:24:17 -06001713 {spv::CapabilityShaderNonUniformEXT, {VK_EXT_DESCRIPTOR_INDEXING_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_ext_descriptor_indexing}},
Piers Daniell41b8c5d2020-01-10 15:42:00 -07001714 {spv::CapabilityRuntimeDescriptorArrayEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::runtimeDescriptorArray", &VkPhysicalDeviceVulkan12Features::runtimeDescriptorArray}},
1715 {spv::CapabilityInputAttachmentArrayDynamicIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderInputAttachmentArrayDynamicIndexing", &VkPhysicalDeviceVulkan12Features::shaderInputAttachmentArrayDynamicIndexing}},
1716 {spv::CapabilityUniformTexelBufferArrayDynamicIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderUniformTexelBufferArrayDynamicIndexing", &VkPhysicalDeviceVulkan12Features::shaderUniformTexelBufferArrayDynamicIndexing}},
1717 {spv::CapabilityStorageTexelBufferArrayDynamicIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderStorageTexelBufferArrayDynamicIndexing", &VkPhysicalDeviceVulkan12Features::shaderStorageTexelBufferArrayDynamicIndexing}},
1718 {spv::CapabilityUniformBufferArrayNonUniformIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderUniformBufferArrayNonUniformIndexing", &VkPhysicalDeviceVulkan12Features::shaderUniformBufferArrayNonUniformIndexing}},
1719 {spv::CapabilitySampledImageArrayNonUniformIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderSampledImageArrayNonUniformIndexing", &VkPhysicalDeviceVulkan12Features::shaderSampledImageArrayNonUniformIndexing}},
1720 {spv::CapabilityStorageBufferArrayNonUniformIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderStorageBufferArrayNonUniformIndexing", &VkPhysicalDeviceVulkan12Features::shaderStorageBufferArrayNonUniformIndexing}},
1721 {spv::CapabilityStorageImageArrayNonUniformIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderStorageImageArrayNonUniformIndexing", &VkPhysicalDeviceVulkan12Features::shaderStorageImageArrayNonUniformIndexing}},
1722 {spv::CapabilityInputAttachmentArrayNonUniformIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderInputAttachmentArrayNonUniformIndexing", &VkPhysicalDeviceVulkan12Features::shaderInputAttachmentArrayNonUniformIndexing}},
1723 {spv::CapabilityUniformTexelBufferArrayNonUniformIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderUniformTexelBufferArrayNonUniformIndexing", &VkPhysicalDeviceVulkan12Features::shaderUniformTexelBufferArrayNonUniformIndexing}},
1724 {spv::CapabilityStorageTexelBufferArrayNonUniformIndexingEXT, {"VkPhysicalDeviceDescriptorIndexingFeatures::shaderStorageTexelBufferArrayNonUniformIndexing", &VkPhysicalDeviceVulkan12Features::shaderStorageTexelBufferArrayNonUniformIndexing}},
Chris Forbes47567b72017-06-09 12:09:45 -07001725
1726 // Capabilities that require an extension
Mike Schuchardt8ed5ea02018-07-20 18:24:17 -06001727 {spv::CapabilityDrawParameters, {VK_KHR_SHADER_DRAW_PARAMETERS_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_khr_shader_draw_parameters}},
1728 {spv::CapabilityGeometryShaderPassthroughNV, {VK_NV_GEOMETRY_SHADER_PASSTHROUGH_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_nv_geometry_shader_passthrough}},
1729 {spv::CapabilitySampleMaskOverrideCoverageNV, {VK_NV_SAMPLE_MASK_OVERRIDE_COVERAGE_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_nv_sample_mask_override_coverage}},
1730 {spv::CapabilityShaderViewportIndexLayerEXT, {VK_EXT_SHADER_VIEWPORT_INDEX_LAYER_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_ext_shader_viewport_index_layer}},
1731 {spv::CapabilityShaderViewportIndexLayerNV, {VK_NV_VIEWPORT_ARRAY2_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_nv_viewport_array2}},
1732 {spv::CapabilityShaderViewportMaskNV, {VK_NV_VIEWPORT_ARRAY2_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_nv_viewport_array2}},
1733 {spv::CapabilitySubgroupBallotKHR, {VK_EXT_SHADER_SUBGROUP_BALLOT_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_ext_shader_subgroup_ballot }},
1734 {spv::CapabilitySubgroupVoteKHR, {VK_EXT_SHADER_SUBGROUP_VOTE_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_ext_shader_subgroup_vote }},
Jason Macnakb7d091c2019-06-10 11:13:11 -07001735 {spv::CapabilityGroupNonUniformPartitionedNV, {VK_NV_SHADER_SUBGROUP_PARTITIONED_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_nv_shader_subgroup_partitioned}},
aqnuep7033c702018-09-11 18:03:29 +02001736 {spv::CapabilityInt64Atomics, {VK_KHR_SHADER_ATOMIC_INT64_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_khr_shader_atomic_int64 }},
amhaganfa0b34d2019-10-15 16:03:53 -04001737 {spv::CapabilityShaderClockKHR, {VK_KHR_SHADER_CLOCK_EXTENSION_NAME, nullptr, &DeviceExtensions::vk_khr_shader_clock }},
Alexander Galazin3bd8e342018-06-14 15:49:07 +02001738
Jason Macnakc5a621d2019-06-10 12:42:50 -07001739 {spv::CapabilityComputeDerivativeGroupQuadsNV, {"VkPhysicalDeviceComputeShaderDerivativesFeaturesNV::computeDerivativeGroupQuads", &VkPhysicalDeviceComputeShaderDerivativesFeaturesNV::computeDerivativeGroupQuads, &DeviceExtensions::vk_nv_compute_shader_derivatives}},
1740 {spv::CapabilityComputeDerivativeGroupLinearNV, {"VkPhysicalDeviceComputeShaderDerivativesFeaturesNV::computeDerivativeGroupLinear", &VkPhysicalDeviceComputeShaderDerivativesFeaturesNV::computeDerivativeGroupLinear, &DeviceExtensions::vk_nv_compute_shader_derivatives}},
Jason Macnakf7019582019-06-13 10:07:26 -07001741 {spv::CapabilityFragmentBarycentricNV, {"VkPhysicalDeviceFragmentShaderBarycentricFeaturesNV::fragmentShaderBarycentric", &VkPhysicalDeviceFragmentShaderBarycentricFeaturesNV::fragmentShaderBarycentric, &DeviceExtensions::vk_nv_fragment_shader_barycentric}},
Jason Macnakc5a621d2019-06-10 12:42:50 -07001742
Piers Daniell41b8c5d2020-01-10 15:42:00 -07001743 {spv::CapabilityStorageBuffer8BitAccess, {"VkPhysicalDevice8BitStorageFeaturesKHR::storageBuffer8BitAccess", &VkPhysicalDeviceVulkan12Features::storageBuffer8BitAccess, &DeviceExtensions::vk_khr_8bit_storage}},
1744 {spv::CapabilityUniformAndStorageBuffer8BitAccess, {"VkPhysicalDevice8BitStorageFeaturesKHR::uniformAndStorageBuffer8BitAccess", &VkPhysicalDeviceVulkan12Features::uniformAndStorageBuffer8BitAccess, &DeviceExtensions::vk_khr_8bit_storage}},
1745 {spv::CapabilityStoragePushConstant8, {"VkPhysicalDevice8BitStorageFeaturesKHR::storagePushConstant8", &VkPhysicalDeviceVulkan12Features::storagePushConstant8, &DeviceExtensions::vk_khr_8bit_storage}},
Brett Lawsonbebfb6f2018-10-23 16:58:50 -07001746
Jason Macnakf7019582019-06-13 10:07:26 -07001747 {spv::CapabilityTransformFeedback, { "VkPhysicalDeviceTransformFeedbackFeaturesEXT::transformFeedback", &VkPhysicalDeviceTransformFeedbackFeaturesEXT::transformFeedback, &DeviceExtensions::vk_ext_transform_feedback}},
1748 {spv::CapabilityGeometryStreams, { "VkPhysicalDeviceTransformFeedbackFeaturesEXT::geometryStreams", &VkPhysicalDeviceTransformFeedbackFeaturesEXT::geometryStreams, &DeviceExtensions::vk_ext_transform_feedback}},
Jose-Emilio Munoz-Lopez1109b452018-08-21 09:44:07 +01001749
Piers Daniell41b8c5d2020-01-10 15:42:00 -07001750 {spv::CapabilityFloat16, {"VkPhysicalDeviceFloat16Int8FeaturesKHR::shaderFloat16", &VkPhysicalDeviceVulkan12Features::shaderFloat16, &DeviceExtensions::vk_khr_shader_float16_int8}},
1751 {spv::CapabilityInt8, {"VkPhysicalDeviceFloat16Int8FeaturesKHR::shaderInt8", &VkPhysicalDeviceVulkan12Features::shaderInt8, &DeviceExtensions::vk_khr_shader_float16_int8}},
Jeff Bolze4356752019-03-07 11:23:46 -06001752
Jason Macnakd7fddf82019-06-13 09:52:49 -07001753 {spv::CapabilityImageFootprintNV, {"VkPhysicalDeviceShaderImageFootprintFeaturesNV::imageFootprint", &VkPhysicalDeviceShaderImageFootprintFeaturesNV::imageFootprint, &DeviceExtensions::vk_nv_shader_image_footprint}},
1754
Jeff Bolze4356752019-03-07 11:23:46 -06001755 {spv::CapabilityCooperativeMatrixNV, {"VkPhysicalDeviceCooperativeMatrixFeaturesNV::cooperativeMatrix", &VkPhysicalDeviceCooperativeMatrixFeaturesNV::cooperativeMatrix, &DeviceExtensions::vk_nv_cooperative_matrix}},
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00001756
Graeme Leese41e6b842019-08-02 10:49:14 +01001757 {spv::CapabilitySignedZeroInfNanPreserve, {"VkPhysicalDeviceFloatControlsPropertiesKHR::shaderSignedZeroInfNanPreserve", nullptr, &DeviceExtensions::vk_khr_shader_float_controls}},
1758 {spv::CapabilityDenormPreserve, {"VkPhysicalDeviceFloatControlsPropertiesKHR::shaderDenormPreserve", nullptr, &DeviceExtensions::vk_khr_shader_float_controls}},
1759 {spv::CapabilityDenormFlushToZero, {"VkPhysicalDeviceFloatControlsPropertiesKHR::shaderDenormFlushToZero", nullptr, &DeviceExtensions::vk_khr_shader_float_controls}},
1760 {spv::CapabilityRoundingModeRTE, {"VkPhysicalDeviceFloatControlsPropertiesKHR::shaderRoundingModeRTE", nullptr, &DeviceExtensions::vk_khr_shader_float_controls}},
1761 {spv::CapabilityRoundingModeRTZ, {"VkPhysicalDeviceFloatControlsPropertiesKHR::shaderRoundingModeRTZ", nullptr, &DeviceExtensions::vk_khr_shader_float_controls}},
Jeff Bolz38f6cb52019-06-30 16:26:44 -05001762
1763 {spv::CapabilityFragmentShaderSampleInterlockEXT, {"VkPhysicalDeviceFragmentShaderInterlockFeaturesEXT::fragmentShaderSampleInterlock", &VkPhysicalDeviceFragmentShaderInterlockFeaturesEXT::fragmentShaderSampleInterlock, &DeviceExtensions::vk_ext_fragment_shader_interlock}},
1764 {spv::CapabilityFragmentShaderPixelInterlockEXT, {"VkPhysicalDeviceFragmentShaderInterlockFeaturesEXT::fragmentShaderPixelInterlock", &VkPhysicalDeviceFragmentShaderInterlockFeaturesEXT::fragmentShaderPixelInterlock, &DeviceExtensions::vk_ext_fragment_shader_interlock}},
1765 {spv::CapabilityFragmentShaderShadingRateInterlockEXT, {"VkPhysicalDeviceFragmentShaderInterlockFeaturesEXT::fragmentShaderShadingRateInterlock", &VkPhysicalDeviceFragmentShaderInterlockFeaturesEXT::fragmentShaderShadingRateInterlock, &DeviceExtensions::vk_ext_fragment_shader_interlock}},
Jeff Bolza38fd3b2019-07-21 11:42:11 -05001766 {spv::CapabilityDemoteToHelperInvocationEXT, {"VkPhysicalDeviceShaderDemoteToHelperInvocationFeaturesEXT::shaderDemoteToHelperInvocation", &VkPhysicalDeviceShaderDemoteToHelperInvocationFeaturesEXT::shaderDemoteToHelperInvocation, &DeviceExtensions::vk_ext_shader_demote_to_helper_invocation}},
Jeff Bolz4563f2a2019-12-10 13:30:30 -06001767
Piers Daniell41b8c5d2020-01-10 15:42:00 -07001768 {spv::CapabilityPhysicalStorageBufferAddresses, {"VkPhysicalDeviceBufferDeviceAddressFeatures::bufferDeviceAddress", &VkPhysicalDeviceVulkan12Features::bufferDeviceAddress, &DeviceExtensions::vk_ext_buffer_device_address}},
Jeff Bolz4563f2a2019-12-10 13:30:30 -06001769 // Should be non-EXT token, but Android SPIRV-Headers are out of date, and the token value is the same anyway
Piers Daniell41b8c5d2020-01-10 15:42:00 -07001770 {spv::CapabilityPhysicalStorageBufferAddressesEXT, {"VkPhysicalDeviceBufferDeviceAddressFeaturesEXT::bufferDeviceAddress", &VkPhysicalDeviceVulkan12Features::bufferDeviceAddress, &DeviceExtensions::vk_khr_buffer_device_address}},
Jeff Bolz443c2ca2020-03-19 12:11:51 -05001771
1772 {spv::CapabilityRayTracingProvisionalKHR, {"VkPhysicalDeviceRayTracingFeaturesKHR::rayTracing", &VkPhysicalDeviceRayTracingFeaturesKHR::rayTracing, &DeviceExtensions::vk_khr_ray_tracing}},
1773 {spv::CapabilityRayQueryProvisionalKHR, {"VkPhysicalDeviceRayTracingFeaturesKHR::rayQuery", &VkPhysicalDeviceRayTracingFeaturesKHR::rayQuery, &DeviceExtensions::vk_khr_ray_tracing}},
1774 {spv::CapabilityRayTraversalPrimitiveCullingProvisionalKHR, {"VkPhysicalDeviceRayTracingFeaturesKHR::rayTracingPrimitiveCulling", &VkPhysicalDeviceRayTracingFeaturesKHR::rayTracingPrimitiveCulling, &DeviceExtensions::vk_khr_ray_tracing}},
Chris Forbes47567b72017-06-09 12:09:45 -07001775 };
1776 // clang-format on
1777
1778 for (auto insn : *src) {
1779 if (insn.opcode() == spv::OpCapability) {
Dave Houltoneb10ea82017-12-22 12:21:50 -07001780 size_t n = capabilities.count(insn.word(1));
1781 if (1 == n) { // key occurs exactly once
1782 auto it = capabilities.find(insn.word(1));
1783 if (it != capabilities.end()) {
1784 if (it->second.feature) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001785 skip |= RequireFeature(it->second.feature.IsEnabled(enabled_features), it->second.name);
Dave Houltoneb10ea82017-12-22 12:21:50 -07001786 }
1787 if (it->second.extension) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001788 skip |= RequireExtension(IsExtEnabled((device_extensions.*(it->second.extension))), it->second.name);
Dave Houltoneb10ea82017-12-22 12:21:50 -07001789 }
Chris Forbes47567b72017-06-09 12:09:45 -07001790 }
Dave Houltoneb10ea82017-12-22 12:21:50 -07001791 } else if (1 < n) { // key occurs multiple times, at least one must be enabled
1792 bool needs_feature = false, has_feature = false;
1793 bool needs_ext = false, has_ext = false;
1794 std::string feature_names = "(one of) [ ";
1795 std::string extension_names = feature_names;
1796 auto caps = capabilities.equal_range(insn.word(1));
1797 for (auto it = caps.first; it != caps.second; ++it) {
1798 if (it->second.feature) {
1799 needs_feature = true;
Mark Lobodzinskid7b03cc2019-04-19 14:23:10 -06001800 has_feature = has_feature || it->second.feature.IsEnabled(enabled_features);
Dave Houltoneb10ea82017-12-22 12:21:50 -07001801 feature_names += it->second.name;
1802 feature_names += " ";
1803 }
1804 if (it->second.extension) {
1805 needs_ext = true;
Mark Lobodzinskif45e45f2019-04-19 14:15:39 -06001806 has_ext = has_ext || device_extensions.*(it->second.extension);
Dave Houltoneb10ea82017-12-22 12:21:50 -07001807 extension_names += it->second.name;
1808 extension_names += " ";
1809 }
1810 }
1811 if (needs_feature) {
1812 feature_names += "]";
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001813 skip |= RequireFeature(has_feature, feature_names.c_str());
Dave Houltoneb10ea82017-12-22 12:21:50 -07001814 }
1815 if (needs_ext) {
1816 extension_names += "]";
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001817 skip |= RequireExtension(has_ext, extension_names.c_str());
Chris Forbes47567b72017-06-09 12:09:45 -07001818 }
Graeme Leesec82dbe02019-08-02 10:44:21 +01001819 }
1820
1821 { // Do group non-uniform checks
Piers Daniell41b8c5d2020-01-10 15:42:00 -07001822 const VkSubgroupFeatureFlags supportedOperations = phys_dev_props_core11.subgroupSupportedOperations;
1823 const VkSubgroupFeatureFlags supportedStages = phys_dev_props_core11.subgroupSupportedStages;
Jeff Bolzee743412019-06-20 22:24:32 -05001824
1825 switch (insn.word(1)) {
1826 default:
1827 break;
1828 case spv::CapabilityGroupNonUniform:
1829 case spv::CapabilityGroupNonUniformVote:
1830 case spv::CapabilityGroupNonUniformArithmetic:
1831 case spv::CapabilityGroupNonUniformBallot:
1832 case spv::CapabilityGroupNonUniformShuffle:
1833 case spv::CapabilityGroupNonUniformShuffleRelative:
1834 case spv::CapabilityGroupNonUniformClustered:
1835 case spv::CapabilityGroupNonUniformQuad:
1836 case spv::CapabilityGroupNonUniformPartitionedNV:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001837 RequirePropertyFlag(supportedStages & stage, string_VkShaderStageFlagBits(stage),
Jeff Bolzee743412019-06-20 22:24:32 -05001838 "VkPhysicalDeviceSubgroupProperties::supportedStages");
1839 break;
1840 }
1841
1842 switch (insn.word(1)) {
1843 default:
1844 break;
1845 case spv::CapabilityGroupNonUniform:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001846 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_BASIC_BIT, "VK_SUBGROUP_FEATURE_BASIC_BIT",
Jeff Bolzee743412019-06-20 22:24:32 -05001847 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
1848 break;
1849 case spv::CapabilityGroupNonUniformVote:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001850 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_VOTE_BIT, "VK_SUBGROUP_FEATURE_VOTE_BIT",
Jeff Bolzee743412019-06-20 22:24:32 -05001851 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
1852 break;
1853 case spv::CapabilityGroupNonUniformArithmetic:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001854 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_ARITHMETIC_BIT,
Jeff Bolzee743412019-06-20 22:24:32 -05001855 "VK_SUBGROUP_FEATURE_ARITHMETIC_BIT",
1856 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
1857 break;
1858 case spv::CapabilityGroupNonUniformBallot:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001859 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_BALLOT_BIT, "VK_SUBGROUP_FEATURE_BALLOT_BIT",
Jeff Bolzee743412019-06-20 22:24:32 -05001860 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
1861 break;
1862 case spv::CapabilityGroupNonUniformShuffle:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001863 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_SHUFFLE_BIT,
Jeff Bolzee743412019-06-20 22:24:32 -05001864 "VK_SUBGROUP_FEATURE_SHUFFLE_BIT",
1865 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
1866 break;
1867 case spv::CapabilityGroupNonUniformShuffleRelative:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001868 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_SHUFFLE_RELATIVE_BIT,
Jeff Bolzee743412019-06-20 22:24:32 -05001869 "VK_SUBGROUP_FEATURE_SHUFFLE_RELATIVE_BIT",
1870 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
1871 break;
1872 case spv::CapabilityGroupNonUniformClustered:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001873 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_CLUSTERED_BIT,
Jeff Bolzee743412019-06-20 22:24:32 -05001874 "VK_SUBGROUP_FEATURE_CLUSTERED_BIT",
1875 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
1876 break;
1877 case spv::CapabilityGroupNonUniformQuad:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001878 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_QUAD_BIT, "VK_SUBGROUP_FEATURE_QUAD_BIT",
Jeff Bolzee743412019-06-20 22:24:32 -05001879 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
1880 break;
1881 case spv::CapabilityGroupNonUniformPartitionedNV:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001882 RequirePropertyFlag(supportedOperations & VK_SUBGROUP_FEATURE_PARTITIONED_BIT_NV,
Jeff Bolzee743412019-06-20 22:24:32 -05001883 "VK_SUBGROUP_FEATURE_PARTITIONED_BIT_NV",
1884 "VkPhysicalDeviceSubgroupProperties::supportedOperations");
1885 break;
1886 }
Chris Forbes47567b72017-06-09 12:09:45 -07001887 }
baldurk4095f932020-02-16 13:24:42 +00001888 } else if (insn.opcode() == spv::OpExtension) {
1889 std::string extension_name = (char const *)&insn.word(1);
1890
1891 if (extension_name == "SPV_KHR_non_semantic_info") {
1892 skip |= RequireExtension(IsExtEnabled(device_extensions.vk_khr_shader_non_semantic_info),
1893 VK_KHR_SHADER_NON_SEMANTIC_INFO_EXTENSION_NAME);
1894 }
Chris Forbes47567b72017-06-09 12:09:45 -07001895 }
1896 }
1897
Jeff Bolzee743412019-06-20 22:24:32 -05001898 return skip;
1899}
1900
John Zulaufac4c6e12019-07-01 16:05:58 -06001901bool CoreChecks::ValidateShaderStageWritableDescriptor(VkShaderStageFlagBits stage, bool has_writable_descriptor) const {
Jeff Bolzee743412019-06-20 22:24:32 -05001902 bool skip = false;
1903
Chris Forbes349b3132018-03-07 11:38:08 -08001904 if (has_writable_descriptor) {
1905 switch (stage) {
1906 case VK_SHADER_STAGE_COMPUTE_BIT:
Jeff Bolz148d94e2018-12-13 21:25:56 -06001907 case VK_SHADER_STAGE_RAYGEN_BIT_NV:
1908 case VK_SHADER_STAGE_ANY_HIT_BIT_NV:
1909 case VK_SHADER_STAGE_CLOSEST_HIT_BIT_NV:
1910 case VK_SHADER_STAGE_MISS_BIT_NV:
1911 case VK_SHADER_STAGE_INTERSECTION_BIT_NV:
1912 case VK_SHADER_STAGE_CALLABLE_BIT_NV:
1913 case VK_SHADER_STAGE_TASK_BIT_NV:
1914 case VK_SHADER_STAGE_MESH_BIT_NV:
Chris Forbes349b3132018-03-07 11:38:08 -08001915 /* No feature requirements for writes and atomics from compute
Jeff Bolz148d94e2018-12-13 21:25:56 -06001916 * raytracing, or mesh stages */
Chris Forbes349b3132018-03-07 11:38:08 -08001917 break;
1918 case VK_SHADER_STAGE_FRAGMENT_BIT:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001919 skip |= RequireFeature(enabled_features.core.fragmentStoresAndAtomics, "fragmentStoresAndAtomics");
Chris Forbes349b3132018-03-07 11:38:08 -08001920 break;
1921 default:
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001922 skip |= RequireFeature(enabled_features.core.vertexPipelineStoresAndAtomics, "vertexPipelineStoresAndAtomics");
Chris Forbes349b3132018-03-07 11:38:08 -08001923 break;
1924 }
1925 }
1926
Chris Forbes47567b72017-06-09 12:09:45 -07001927 return skip;
1928}
1929
Jeff Bolz526f2d52019-09-18 13:18:08 -05001930bool CoreChecks::ValidateShaderStageGroupNonUniform(SHADER_MODULE_STATE const *module, VkShaderStageFlagBits stage) const {
Jeff Bolzee743412019-06-20 22:24:32 -05001931 bool skip = false;
1932
Piers Daniell41b8c5d2020-01-10 15:42:00 -07001933 auto const subgroup_props = phys_dev_props_core11;
Jeff Bolzee743412019-06-20 22:24:32 -05001934
Jeff Bolz526f2d52019-09-18 13:18:08 -05001935 for (auto inst : *module) {
Jeff Bolzee743412019-06-20 22:24:32 -05001936 // Check the quad operations.
1937 switch (inst.opcode()) {
1938 default:
1939 break;
1940 case spv::OpGroupNonUniformQuadBroadcast:
1941 case spv::OpGroupNonUniformQuadSwap:
1942 if ((stage != VK_SHADER_STAGE_FRAGMENT_BIT) && (stage != VK_SHADER_STAGE_COMPUTE_BIT)) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001943 skip |= RequireFeature(subgroup_props.subgroupQuadOperationsInAllStages,
Jeff Bolzee743412019-06-20 22:24:32 -05001944 "VkPhysicalDeviceSubgroupProperties::quadOperationsInAllStages");
1945 }
1946 break;
1947 }
Jeff Bolz526f2d52019-09-18 13:18:08 -05001948
Piers Daniell41b8c5d2020-01-10 15:42:00 -07001949 if (!enabled_features.core12.shaderSubgroupExtendedTypes) {
Jeff Bolz526f2d52019-09-18 13:18:08 -05001950 switch (inst.opcode()) {
1951 default:
1952 break;
1953 case spv::OpGroupNonUniformAllEqual:
1954 case spv::OpGroupNonUniformBroadcast:
1955 case spv::OpGroupNonUniformBroadcastFirst:
1956 case spv::OpGroupNonUniformShuffle:
1957 case spv::OpGroupNonUniformShuffleXor:
1958 case spv::OpGroupNonUniformShuffleUp:
1959 case spv::OpGroupNonUniformShuffleDown:
1960 case spv::OpGroupNonUniformIAdd:
1961 case spv::OpGroupNonUniformFAdd:
1962 case spv::OpGroupNonUniformIMul:
1963 case spv::OpGroupNonUniformFMul:
1964 case spv::OpGroupNonUniformSMin:
1965 case spv::OpGroupNonUniformUMin:
1966 case spv::OpGroupNonUniformFMin:
1967 case spv::OpGroupNonUniformSMax:
1968 case spv::OpGroupNonUniformUMax:
1969 case spv::OpGroupNonUniformFMax:
1970 case spv::OpGroupNonUniformBitwiseAnd:
1971 case spv::OpGroupNonUniformBitwiseOr:
1972 case spv::OpGroupNonUniformBitwiseXor:
1973 case spv::OpGroupNonUniformLogicalAnd:
1974 case spv::OpGroupNonUniformLogicalOr:
1975 case spv::OpGroupNonUniformLogicalXor:
1976 case spv::OpGroupNonUniformQuadBroadcast:
1977 case spv::OpGroupNonUniformQuadSwap: {
1978 auto type = module->get_def(inst.word(1));
1979
1980 if (type.opcode() == spv::OpTypeVector) {
1981 // Get the element type
1982 type = module->get_def(type.word(2));
1983 }
1984
1985 if (type.opcode() == spv::OpTypeBool) {
1986 break;
1987 }
1988
1989 // Both OpTypeInt and OpTypeFloat the width is in the 2nd word.
1990 const uint32_t width = type.word(2);
1991
1992 if ((type.opcode() == spv::OpTypeFloat && width == 16) ||
1993 (type.opcode() == spv::OpTypeInt && (width == 8 || width == 16 || width == 64))) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07001994 skip |= RequireFeature(enabled_features.core12.shaderSubgroupExtendedTypes,
Tony-LunarGa74d3fe2019-11-22 15:43:20 -07001995 "VkPhysicalDeviceShaderSubgroupExtendedTypesFeatures::shaderSubgroupExtendedTypes");
Jeff Bolz526f2d52019-09-18 13:18:08 -05001996 }
1997 break;
1998 }
1999 }
2000 }
Jeff Bolzee743412019-06-20 22:24:32 -05002001 }
2002
2003 return skip;
2004}
2005
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06002006bool CoreChecks::ValidateShaderStageInputOutputLimits(SHADER_MODULE_STATE const *src, VkPipelineShaderStageCreateInfo const *pStage,
John Zulaufac4c6e12019-07-01 16:05:58 -06002007 const PIPELINE_STATE *pipeline, spirv_inst_iter entrypoint) const {
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002008 if (pStage->stage == VK_SHADER_STAGE_COMPUTE_BIT || pStage->stage == VK_SHADER_STAGE_ALL_GRAPHICS ||
2009 pStage->stage == VK_SHADER_STAGE_ALL) {
2010 return false;
2011 }
2012
2013 bool skip = false;
Mark Lobodzinski518eadc2019-03-09 12:07:30 -07002014 auto const &limits = phys_dev_props.limits;
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002015
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002016 std::set<uint32_t> patchIDs;
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002017 struct Variable {
2018 uint32_t baseTypePtrID;
2019 uint32_t ID;
2020 uint32_t storageClass;
2021 };
2022 std::vector<Variable> variables;
2023
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002024 uint32_t numVertices = 0;
2025
Jeff Bolzf234bf82019-11-04 14:07:15 -06002026 auto entrypointVariables = FindEntrypointInterfaces(entrypoint);
2027
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002028 for (auto insn : *src) {
2029 switch (insn.opcode()) {
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002030 // Find all Patch decorations
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002031 case spv::OpDecorate:
2032 switch (insn.word(2)) {
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002033 case spv::DecorationPatch: {
2034 patchIDs.insert(insn.word(1));
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002035 break;
2036 }
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002037 default:
2038 break;
2039 }
2040 break;
2041 // Find all input and output variables
2042 case spv::OpVariable: {
2043 Variable var = {};
2044 var.storageClass = insn.word(3);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002045 if ((var.storageClass == spv::StorageClassInput || var.storageClass == spv::StorageClassOutput) &&
2046 // Only include variables in the entrypoint's interface
2047 find(entrypointVariables.begin(), entrypointVariables.end(), insn.word(2)) != entrypointVariables.end()) {
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002048 var.baseTypePtrID = insn.word(1);
2049 var.ID = insn.word(2);
2050 variables.push_back(var);
2051 }
2052 break;
2053 }
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002054 case spv::OpExecutionMode:
2055 if (insn.word(1) == entrypoint.word(2)) {
2056 switch (insn.word(2)) {
2057 default:
2058 break;
2059 case spv::ExecutionModeOutputVertices:
2060 numVertices = insn.word(3);
2061 break;
2062 }
2063 }
2064 break;
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002065 default:
2066 break;
2067 }
2068 }
2069
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002070 bool strip_output_array_level =
2071 (pStage->stage == VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT || pStage->stage == VK_SHADER_STAGE_MESH_BIT_NV);
2072 bool strip_input_array_level =
2073 (pStage->stage == VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT ||
2074 pStage->stage == VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT || pStage->stage == VK_SHADER_STAGE_GEOMETRY_BIT);
2075
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002076 uint32_t numCompIn = 0, numCompOut = 0;
Jeff Bolzf234bf82019-11-04 14:07:15 -06002077 int maxCompIn = 0, maxCompOut = 0;
2078
2079 auto inputs = CollectInterfaceByLocation(src, entrypoint, spv::StorageClassInput, strip_input_array_level);
2080 auto outputs = CollectInterfaceByLocation(src, entrypoint, spv::StorageClassOutput, strip_output_array_level);
2081
2082 // Find max component location used for input variables.
2083 for (auto &var : inputs) {
2084 int location = var.first.first;
2085 int component = var.first.second;
2086 interface_var &iv = var.second;
2087
2088 // Only need to look at the first location, since we use the type's whole size
2089 if (iv.offset != 0) {
2090 continue;
2091 }
2092
2093 if (iv.is_patch) {
2094 continue;
2095 }
2096
2097 int numComponents = GetComponentsConsumedByType(src, iv.type_id, strip_input_array_level);
2098 maxCompIn = std::max(maxCompIn, location * 4 + component + numComponents);
2099 }
2100
2101 // Find max component location used for output variables.
2102 for (auto &var : outputs) {
2103 int location = var.first.first;
2104 int component = var.first.second;
2105 interface_var &iv = var.second;
2106
2107 // Only need to look at the first location, since we use the type's whole size
2108 if (iv.offset != 0) {
2109 continue;
2110 }
2111
2112 if (iv.is_patch) {
2113 continue;
2114 }
2115
2116 int numComponents = GetComponentsConsumedByType(src, iv.type_id, strip_output_array_level);
2117 maxCompOut = std::max(maxCompOut, location * 4 + component + numComponents);
2118 }
2119
2120 // XXX TODO: Would be nice to rewrite this to use CollectInterfaceByLocation (or something similar),
2121 // but that doesn't include builtins.
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002122 for (auto &var : variables) {
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002123 // Check if the variable is a patch. Patches can also be members of blocks,
2124 // but if they are then the top-level arrayness has already been stripped
2125 // by the time GetComponentsConsumedByType gets to it.
2126 bool isPatch = patchIDs.find(var.ID) != patchIDs.end();
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002127
2128 if (var.storageClass == spv::StorageClassInput) {
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002129 numCompIn += GetComponentsConsumedByType(src, var.baseTypePtrID, strip_input_array_level && !isPatch);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002130 } else { // var.storageClass == spv::StorageClassOutput
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002131 numCompOut += GetComponentsConsumedByType(src, var.baseTypePtrID, strip_output_array_level && !isPatch);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002132 }
2133 }
2134
2135 switch (pStage->stage) {
2136 case VK_SHADER_STAGE_VERTEX_BIT:
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002137 if (numCompOut > limits.maxVertexOutputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002138 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2139 "Invalid Pipeline CreateInfo State: Vertex shader exceeds "
2140 "VkPhysicalDeviceLimits::maxVertexOutputComponents of %u "
2141 "components by %u components",
2142 limits.maxVertexOutputComponents, numCompOut - limits.maxVertexOutputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002143 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002144 if (maxCompOut > (int)limits.maxVertexOutputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002145 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2146 "Invalid Pipeline CreateInfo State: Vertex shader output variable uses location that "
2147 "exceeds component limit VkPhysicalDeviceLimits::maxVertexOutputComponents (%u)",
2148 limits.maxVertexOutputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002149 }
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002150 break;
2151
2152 case VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT:
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002153 if (numCompIn > limits.maxTessellationControlPerVertexInputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002154 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2155 "Invalid Pipeline CreateInfo State: Tessellation control shader exceeds "
2156 "VkPhysicalDeviceLimits::maxTessellationControlPerVertexInputComponents of %u "
2157 "components by %u components",
2158 limits.maxTessellationControlPerVertexInputComponents,
2159 numCompIn - limits.maxTessellationControlPerVertexInputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002160 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002161 if (maxCompIn > (int)limits.maxTessellationControlPerVertexInputComponents) {
2162 skip |=
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002163 LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2164 "Invalid Pipeline CreateInfo State: Tessellation control shader input variable uses location that "
2165 "exceeds component limit VkPhysicalDeviceLimits::maxTessellationControlPerVertexInputComponents (%u)",
2166 limits.maxTessellationControlPerVertexInputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002167 }
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002168 if (numCompOut > limits.maxTessellationControlPerVertexOutputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002169 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2170 "Invalid Pipeline CreateInfo State: Tessellation control shader exceeds "
2171 "VkPhysicalDeviceLimits::maxTessellationControlPerVertexOutputComponents of %u "
2172 "components by %u components",
2173 limits.maxTessellationControlPerVertexOutputComponents,
2174 numCompOut - limits.maxTessellationControlPerVertexOutputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002175 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002176 if (maxCompOut > (int)limits.maxTessellationControlPerVertexOutputComponents) {
2177 skip |=
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002178 LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2179 "Invalid Pipeline CreateInfo State: Tessellation control shader output variable uses location that "
2180 "exceeds component limit VkPhysicalDeviceLimits::maxTessellationControlPerVertexOutputComponents (%u)",
2181 limits.maxTessellationControlPerVertexOutputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002182 }
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002183 break;
2184
2185 case VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT:
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002186 if (numCompIn > limits.maxTessellationEvaluationInputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002187 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2188 "Invalid Pipeline CreateInfo State: Tessellation evaluation shader exceeds "
2189 "VkPhysicalDeviceLimits::maxTessellationEvaluationInputComponents of %u "
2190 "components by %u components",
2191 limits.maxTessellationEvaluationInputComponents,
2192 numCompIn - limits.maxTessellationEvaluationInputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002193 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002194 if (maxCompIn > (int)limits.maxTessellationEvaluationInputComponents) {
2195 skip |=
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002196 LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2197 "Invalid Pipeline CreateInfo State: Tessellation evaluation shader input variable uses location that "
2198 "exceeds component limit VkPhysicalDeviceLimits::maxTessellationEvaluationInputComponents (%u)",
2199 limits.maxTessellationEvaluationInputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002200 }
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002201 if (numCompOut > limits.maxTessellationEvaluationOutputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002202 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2203 "Invalid Pipeline CreateInfo State: Tessellation evaluation shader exceeds "
2204 "VkPhysicalDeviceLimits::maxTessellationEvaluationOutputComponents of %u "
2205 "components by %u components",
2206 limits.maxTessellationEvaluationOutputComponents,
2207 numCompOut - limits.maxTessellationEvaluationOutputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002208 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002209 if (maxCompOut > (int)limits.maxTessellationEvaluationOutputComponents) {
2210 skip |=
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002211 LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2212 "Invalid Pipeline CreateInfo State: Tessellation evaluation shader output variable uses location that "
2213 "exceeds component limit VkPhysicalDeviceLimits::maxTessellationEvaluationOutputComponents (%u)",
2214 limits.maxTessellationEvaluationOutputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002215 }
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002216 break;
2217
2218 case VK_SHADER_STAGE_GEOMETRY_BIT:
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002219 if (numCompIn > limits.maxGeometryInputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002220 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2221 "Invalid Pipeline CreateInfo State: Geometry shader exceeds "
2222 "VkPhysicalDeviceLimits::maxGeometryInputComponents of %u "
2223 "components by %u components",
2224 limits.maxGeometryInputComponents, numCompIn - limits.maxGeometryInputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002225 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002226 if (maxCompIn > (int)limits.maxGeometryInputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002227 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2228 "Invalid Pipeline CreateInfo State: Geometry shader input variable uses location that "
2229 "exceeds component limit VkPhysicalDeviceLimits::maxGeometryInputComponents (%u)",
2230 limits.maxGeometryInputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002231 }
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002232 if (numCompOut > limits.maxGeometryOutputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002233 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2234 "Invalid Pipeline CreateInfo State: Geometry shader exceeds "
2235 "VkPhysicalDeviceLimits::maxGeometryOutputComponents of %u "
2236 "components by %u components",
2237 limits.maxGeometryOutputComponents, numCompOut - limits.maxGeometryOutputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002238 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002239 if (maxCompOut > (int)limits.maxGeometryOutputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002240 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2241 "Invalid Pipeline CreateInfo State: Geometry shader output variable uses location that "
2242 "exceeds component limit VkPhysicalDeviceLimits::maxGeometryOutputComponents (%u)",
2243 limits.maxGeometryOutputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002244 }
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002245 if (numCompOut * numVertices > limits.maxGeometryTotalOutputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002246 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2247 "Invalid Pipeline CreateInfo State: Geometry shader exceeds "
2248 "VkPhysicalDeviceLimits::maxGeometryTotalOutputComponents of %u "
2249 "components by %u components",
2250 limits.maxGeometryTotalOutputComponents,
2251 numCompOut * numVertices - limits.maxGeometryTotalOutputComponents);
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002252 }
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002253 break;
2254
2255 case VK_SHADER_STAGE_FRAGMENT_BIT:
Mark Lobodzinski57a44272019-02-27 12:40:50 -07002256 if (numCompIn > limits.maxFragmentInputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002257 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2258 "Invalid Pipeline CreateInfo State: Fragment shader exceeds "
2259 "VkPhysicalDeviceLimits::maxFragmentInputComponents of %u "
2260 "components by %u components",
2261 limits.maxFragmentInputComponents, numCompIn - limits.maxFragmentInputComponents);
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002262 }
Jeff Bolzf234bf82019-11-04 14:07:15 -06002263 if (maxCompIn > (int)limits.maxFragmentInputComponents) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002264 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_ExceedDeviceLimit,
2265 "Invalid Pipeline CreateInfo State: Fragment shader input variable uses location that "
2266 "exceeds component limit VkPhysicalDeviceLimits::maxFragmentInputComponents (%u)",
2267 limits.maxFragmentInputComponents);
Jeff Bolzf234bf82019-11-04 14:07:15 -06002268 }
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002269 break;
2270
Jeff Bolz148d94e2018-12-13 21:25:56 -06002271 case VK_SHADER_STAGE_RAYGEN_BIT_NV:
2272 case VK_SHADER_STAGE_ANY_HIT_BIT_NV:
2273 case VK_SHADER_STAGE_CLOSEST_HIT_BIT_NV:
2274 case VK_SHADER_STAGE_MISS_BIT_NV:
2275 case VK_SHADER_STAGE_INTERSECTION_BIT_NV:
2276 case VK_SHADER_STAGE_CALLABLE_BIT_NV:
2277 case VK_SHADER_STAGE_TASK_BIT_NV:
2278 case VK_SHADER_STAGE_MESH_BIT_NV:
2279 break;
2280
Daniel Fedai Larsenc939abc2018-08-07 10:01:58 +02002281 default:
2282 assert(false); // This should never happen
2283 }
2284 return skip;
2285}
2286
sfricke-samsungdc96f302020-03-18 20:42:10 -07002287bool CoreChecks::ValidateShaderStageMaxResources(VkShaderStageFlagBits stage, const PIPELINE_STATE *pipeline) const {
2288 bool skip = false;
2289 uint32_t total_resources = 0;
2290
2291 // Only currently testing for graphics and compute pipelines
2292 // TODO: Add check and support for Ray Tracing pipeline VUID 03428
2293 if ((stage & (VK_SHADER_STAGE_ALL_GRAPHICS | VK_SHADER_STAGE_COMPUTE_BIT)) == 0) {
2294 return false;
2295 }
2296
2297 if (stage == VK_SHADER_STAGE_FRAGMENT_BIT) {
2298 // "For the fragment shader stage the framebuffer color attachments also count against this limit"
2299 total_resources += pipeline->rp_state->createInfo.pSubpasses[pipeline->graphicsPipelineCI.subpass].colorAttachmentCount;
2300 }
2301
2302 // TODO: This reuses a lot of GetDescriptorCountMaxPerStage but currently would need to make it agnostic in a way to handle
2303 // input from CreatePipeline and CreatePipelineLayout level
2304 for (auto set_layout : pipeline->pipeline_layout->set_layouts) {
2305 if ((set_layout->GetCreateFlags() & VK_DESCRIPTOR_SET_LAYOUT_CREATE_UPDATE_AFTER_BIND_POOL_BIT) != 0) {
2306 continue;
2307 }
2308
2309 for (uint32_t binding_idx = 0; binding_idx < set_layout->GetBindingCount(); binding_idx++) {
2310 const VkDescriptorSetLayoutBinding *binding = set_layout->GetDescriptorSetLayoutBindingPtrFromIndex(binding_idx);
2311 // Bindings with a descriptorCount of 0 are "reserved" and should be skipped
2312 if (((stage & binding->stageFlags) != 0) && (binding->descriptorCount > 0)) {
2313 // Check only descriptor types listed in maxPerStageResources description in spec
2314 switch (binding->descriptorType) {
2315 case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
2316 case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
2317 case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
2318 case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
2319 case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER:
2320 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
2321 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER:
2322 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
2323 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC:
2324 case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
2325 total_resources += binding->descriptorCount;
2326 break;
2327 default:
2328 break;
2329 }
2330 }
2331 }
2332 }
2333
2334 if (total_resources > phys_dev_props.limits.maxPerStageResources) {
2335 const char *vuid = (stage == VK_SHADER_STAGE_COMPUTE_BIT) ? "VUID-VkComputePipelineCreateInfo-layout-01687"
2336 : "VUID-VkGraphicsPipelineCreateInfo-layout-01688";
2337 skip |= LogError(pipeline->pipeline, vuid,
2338 "Invalid Pipeline CreateInfo State: Shader Stage %s exceeds component limit "
2339 "VkPhysicalDeviceLimits::maxPerStageResources (%u)",
2340 string_VkShaderStageFlagBits(stage), phys_dev_props.limits.maxPerStageResources);
2341 }
2342
2343 return skip;
2344}
2345
Jeff Bolze4356752019-03-07 11:23:46 -06002346// copy the specialization constant value into buf, if it is present
2347void GetSpecConstantValue(VkPipelineShaderStageCreateInfo const *pStage, uint32_t spec_id, void *buf) {
2348 VkSpecializationInfo const *spec = pStage->pSpecializationInfo;
2349
2350 if (spec && spec_id < spec->mapEntryCount) {
2351 memcpy(buf, (uint8_t *)spec->pData + spec->pMapEntries[spec_id].offset, spec->pMapEntries[spec_id].size);
2352 }
2353}
2354
2355// Fill in value with the constant or specialization constant value, if available.
2356// Returns true if the value has been accurately filled out.
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06002357static bool GetIntConstantValue(spirv_inst_iter insn, SHADER_MODULE_STATE const *src, VkPipelineShaderStageCreateInfo const *pStage,
Jeff Bolze4356752019-03-07 11:23:46 -06002358 const std::unordered_map<uint32_t, uint32_t> &id_to_spec_id, uint32_t *value) {
2359 auto type_id = src->get_def(insn.word(1));
2360 if (type_id.opcode() != spv::OpTypeInt || type_id.word(2) != 32) {
2361 return false;
2362 }
2363 switch (insn.opcode()) {
2364 case spv::OpSpecConstant:
2365 *value = insn.word(3);
2366 GetSpecConstantValue(pStage, id_to_spec_id.at(insn.word(2)), value);
2367 return true;
2368 case spv::OpConstant:
2369 *value = insn.word(3);
2370 return true;
2371 default:
2372 return false;
2373 }
2374}
2375
2376// Map SPIR-V type to VK_COMPONENT_TYPE enum
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06002377VkComponentTypeNV GetComponentType(spirv_inst_iter insn, SHADER_MODULE_STATE const *src) {
Jeff Bolze4356752019-03-07 11:23:46 -06002378 switch (insn.opcode()) {
2379 case spv::OpTypeInt:
2380 switch (insn.word(2)) {
2381 case 8:
2382 return insn.word(3) != 0 ? VK_COMPONENT_TYPE_SINT8_NV : VK_COMPONENT_TYPE_UINT8_NV;
2383 case 16:
2384 return insn.word(3) != 0 ? VK_COMPONENT_TYPE_SINT16_NV : VK_COMPONENT_TYPE_UINT16_NV;
2385 case 32:
2386 return insn.word(3) != 0 ? VK_COMPONENT_TYPE_SINT32_NV : VK_COMPONENT_TYPE_UINT32_NV;
2387 case 64:
2388 return insn.word(3) != 0 ? VK_COMPONENT_TYPE_SINT64_NV : VK_COMPONENT_TYPE_UINT64_NV;
2389 default:
2390 return VK_COMPONENT_TYPE_MAX_ENUM_NV;
2391 }
2392 case spv::OpTypeFloat:
2393 switch (insn.word(2)) {
2394 case 16:
2395 return VK_COMPONENT_TYPE_FLOAT16_NV;
2396 case 32:
2397 return VK_COMPONENT_TYPE_FLOAT32_NV;
2398 case 64:
2399 return VK_COMPONENT_TYPE_FLOAT64_NV;
2400 default:
2401 return VK_COMPONENT_TYPE_MAX_ENUM_NV;
2402 }
2403 default:
2404 return VK_COMPONENT_TYPE_MAX_ENUM_NV;
2405 }
2406}
2407
2408// Validate SPV_NV_cooperative_matrix behavior that can't be statically validated
2409// in SPIRV-Tools (e.g. due to specialization constant usage).
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06002410bool CoreChecks::ValidateCooperativeMatrix(SHADER_MODULE_STATE const *src, VkPipelineShaderStageCreateInfo const *pStage,
John Zulaufac4c6e12019-07-01 16:05:58 -06002411 const PIPELINE_STATE *pipeline) const {
Jeff Bolze4356752019-03-07 11:23:46 -06002412 bool skip = false;
2413
2414 // Map SPIR-V result ID to specialization constant id (SpecId decoration value)
2415 std::unordered_map<uint32_t, uint32_t> id_to_spec_id;
2416 // Map SPIR-V result ID to the ID of its type.
2417 std::unordered_map<uint32_t, uint32_t> id_to_type_id;
2418
2419 struct CoopMatType {
2420 uint32_t scope, rows, cols;
2421 VkComponentTypeNV component_type;
2422 bool all_constant;
2423
2424 CoopMatType() : scope(0), rows(0), cols(0), component_type(VK_COMPONENT_TYPE_MAX_ENUM_NV), all_constant(false) {}
2425
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06002426 void Init(uint32_t id, SHADER_MODULE_STATE const *src, VkPipelineShaderStageCreateInfo const *pStage,
Jeff Bolze4356752019-03-07 11:23:46 -06002427 const std::unordered_map<uint32_t, uint32_t> &id_to_spec_id) {
2428 spirv_inst_iter insn = src->get_def(id);
2429 uint32_t component_type_id = insn.word(2);
2430 uint32_t scope_id = insn.word(3);
2431 uint32_t rows_id = insn.word(4);
2432 uint32_t cols_id = insn.word(5);
2433 auto component_type_iter = src->get_def(component_type_id);
2434 auto scope_iter = src->get_def(scope_id);
2435 auto rows_iter = src->get_def(rows_id);
2436 auto cols_iter = src->get_def(cols_id);
2437
2438 all_constant = true;
2439 if (!GetIntConstantValue(scope_iter, src, pStage, id_to_spec_id, &scope)) {
2440 all_constant = false;
2441 }
2442 if (!GetIntConstantValue(rows_iter, src, pStage, id_to_spec_id, &rows)) {
2443 all_constant = false;
2444 }
2445 if (!GetIntConstantValue(cols_iter, src, pStage, id_to_spec_id, &cols)) {
2446 all_constant = false;
2447 }
2448 component_type = GetComponentType(component_type_iter, src);
2449 }
2450 };
2451
2452 bool seen_coopmat_capability = false;
2453
2454 for (auto insn : *src) {
2455 // Whitelist instructions whose result can be a cooperative matrix type, and
2456 // keep track of their types. It would be nice if SPIRV-Headers generated code
2457 // to identify which instructions have a result type and result id. Lacking that,
2458 // this whitelist is based on the set of instructions that
2459 // SPV_NV_cooperative_matrix says can be used with cooperative matrix types.
2460 switch (insn.opcode()) {
2461 case spv::OpLoad:
2462 case spv::OpCooperativeMatrixLoadNV:
2463 case spv::OpCooperativeMatrixMulAddNV:
2464 case spv::OpSNegate:
2465 case spv::OpFNegate:
2466 case spv::OpIAdd:
2467 case spv::OpFAdd:
2468 case spv::OpISub:
2469 case spv::OpFSub:
2470 case spv::OpFDiv:
2471 case spv::OpSDiv:
2472 case spv::OpUDiv:
2473 case spv::OpMatrixTimesScalar:
2474 case spv::OpConstantComposite:
2475 case spv::OpCompositeConstruct:
2476 case spv::OpConvertFToU:
2477 case spv::OpConvertFToS:
2478 case spv::OpConvertSToF:
2479 case spv::OpConvertUToF:
2480 case spv::OpUConvert:
2481 case spv::OpSConvert:
2482 case spv::OpFConvert:
2483 id_to_type_id[insn.word(2)] = insn.word(1);
2484 break;
2485 default:
2486 break;
2487 }
2488
2489 switch (insn.opcode()) {
2490 case spv::OpDecorate:
2491 if (insn.word(2) == spv::DecorationSpecId) {
2492 id_to_spec_id[insn.word(1)] = insn.word(3);
2493 }
2494 break;
2495 case spv::OpCapability:
2496 if (insn.word(1) == spv::CapabilityCooperativeMatrixNV) {
2497 seen_coopmat_capability = true;
2498
2499 if (!(pStage->stage & phys_dev_ext_props.cooperative_matrix_props.cooperativeMatrixSupportedStages)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002500 skip |= LogError(
2501 pipeline->pipeline, kVUID_Core_Shader_CooperativeMatrixSupportedStages,
2502 "OpTypeCooperativeMatrixNV used in shader stage not in cooperativeMatrixSupportedStages (= %u)",
2503 phys_dev_ext_props.cooperative_matrix_props.cooperativeMatrixSupportedStages);
Jeff Bolze4356752019-03-07 11:23:46 -06002504 }
2505 }
2506 break;
2507 case spv::OpMemoryModel:
2508 // If the capability isn't enabled, don't bother with the rest of this function.
2509 // OpMemoryModel is the first required instruction after all OpCapability instructions.
2510 if (!seen_coopmat_capability) {
2511 return skip;
2512 }
2513 break;
2514 case spv::OpTypeCooperativeMatrixNV: {
2515 CoopMatType M;
2516 M.Init(insn.word(1), src, pStage, id_to_spec_id);
2517
2518 if (M.all_constant) {
2519 // Validate that the type parameters are all supported for one of the
2520 // operands of a cooperative matrix property.
2521 bool valid = false;
2522 for (unsigned i = 0; i < cooperative_matrix_properties.size(); ++i) {
2523 if (cooperative_matrix_properties[i].AType == M.component_type &&
2524 cooperative_matrix_properties[i].MSize == M.rows && cooperative_matrix_properties[i].KSize == M.cols &&
2525 cooperative_matrix_properties[i].scope == M.scope) {
2526 valid = true;
2527 break;
2528 }
2529 if (cooperative_matrix_properties[i].BType == M.component_type &&
2530 cooperative_matrix_properties[i].KSize == M.rows && cooperative_matrix_properties[i].NSize == M.cols &&
2531 cooperative_matrix_properties[i].scope == M.scope) {
2532 valid = true;
2533 break;
2534 }
2535 if (cooperative_matrix_properties[i].CType == M.component_type &&
2536 cooperative_matrix_properties[i].MSize == M.rows && cooperative_matrix_properties[i].NSize == M.cols &&
2537 cooperative_matrix_properties[i].scope == M.scope) {
2538 valid = true;
2539 break;
2540 }
2541 if (cooperative_matrix_properties[i].DType == M.component_type &&
2542 cooperative_matrix_properties[i].MSize == M.rows && cooperative_matrix_properties[i].NSize == M.cols &&
2543 cooperative_matrix_properties[i].scope == M.scope) {
2544 valid = true;
2545 break;
2546 }
2547 }
2548 if (!valid) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002549 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_CooperativeMatrixType,
2550 "OpTypeCooperativeMatrixNV (result id = %u) operands don't match a supported matrix type",
2551 insn.word(1));
Jeff Bolze4356752019-03-07 11:23:46 -06002552 }
2553 }
2554 break;
2555 }
2556 case spv::OpCooperativeMatrixMulAddNV: {
2557 CoopMatType A, B, C, D;
2558 if (id_to_type_id.find(insn.word(2)) == id_to_type_id.end() ||
2559 id_to_type_id.find(insn.word(3)) == id_to_type_id.end() ||
2560 id_to_type_id.find(insn.word(4)) == id_to_type_id.end() ||
2561 id_to_type_id.find(insn.word(5)) == id_to_type_id.end()) {
Mike Schuchardte48dc142019-04-18 09:12:03 -07002562 // Couldn't find type of matrix
2563 assert(false);
Jeff Bolze4356752019-03-07 11:23:46 -06002564 break;
2565 }
2566 D.Init(id_to_type_id[insn.word(2)], src, pStage, id_to_spec_id);
2567 A.Init(id_to_type_id[insn.word(3)], src, pStage, id_to_spec_id);
2568 B.Init(id_to_type_id[insn.word(4)], src, pStage, id_to_spec_id);
2569 C.Init(id_to_type_id[insn.word(5)], src, pStage, id_to_spec_id);
2570
2571 if (A.all_constant && B.all_constant && C.all_constant && D.all_constant) {
2572 // Validate that the type parameters are all supported for the same
2573 // cooperative matrix property.
2574 bool valid = false;
2575 for (unsigned i = 0; i < cooperative_matrix_properties.size(); ++i) {
2576 if (cooperative_matrix_properties[i].AType == A.component_type &&
2577 cooperative_matrix_properties[i].MSize == A.rows && cooperative_matrix_properties[i].KSize == A.cols &&
2578 cooperative_matrix_properties[i].scope == A.scope &&
2579
2580 cooperative_matrix_properties[i].BType == B.component_type &&
2581 cooperative_matrix_properties[i].KSize == B.rows && cooperative_matrix_properties[i].NSize == B.cols &&
2582 cooperative_matrix_properties[i].scope == B.scope &&
2583
2584 cooperative_matrix_properties[i].CType == C.component_type &&
2585 cooperative_matrix_properties[i].MSize == C.rows && cooperative_matrix_properties[i].NSize == C.cols &&
2586 cooperative_matrix_properties[i].scope == C.scope &&
2587
2588 cooperative_matrix_properties[i].DType == D.component_type &&
2589 cooperative_matrix_properties[i].MSize == D.rows && cooperative_matrix_properties[i].NSize == D.cols &&
2590 cooperative_matrix_properties[i].scope == D.scope) {
2591 valid = true;
2592 break;
2593 }
2594 }
2595 if (!valid) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002596 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_CooperativeMatrixMulAdd,
2597 "OpCooperativeMatrixMulAddNV (result id = %u) operands don't match a supported matrix "
2598 "VkCooperativeMatrixPropertiesNV",
2599 insn.word(2));
Jeff Bolze4356752019-03-07 11:23:46 -06002600 }
2601 }
2602 break;
2603 }
2604 default:
2605 break;
2606 }
2607 }
2608
2609 return skip;
2610}
2611
John Zulaufac4c6e12019-07-01 16:05:58 -06002612bool CoreChecks::ValidateExecutionModes(SHADER_MODULE_STATE const *src, spirv_inst_iter entrypoint) const {
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002613 auto entrypoint_id = entrypoint.word(2);
2614
Attilio Provenzanof6c0e852019-04-09 11:01:18 +01002615 // The first denorm execution mode encountered, along with its bit width.
2616 // Used to check if SeparateDenormSettings is respected.
2617 std::pair<spv::ExecutionMode, uint32_t> first_denorm_execution_mode = std::make_pair(spv::ExecutionModeMax, 0);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002618
Attilio Provenzanof6c0e852019-04-09 11:01:18 +01002619 // The first rounding mode encountered, along with its bit width.
2620 // Used to check if SeparateRoundingModeSettings is respected.
2621 std::pair<spv::ExecutionMode, uint32_t> first_rounding_mode = std::make_pair(spv::ExecutionModeMax, 0);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002622
2623 bool skip = false;
2624
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002625 uint32_t verticesOut = 0;
2626 uint32_t invocations = 0;
2627
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002628 for (auto insn : *src) {
2629 if (insn.opcode() == spv::OpExecutionMode && insn.word(1) == entrypoint_id) {
2630 auto mode = insn.word(2);
2631 switch (mode) {
2632 case spv::ExecutionModeSignedZeroInfNanPreserve: {
2633 auto bit_width = insn.word(3);
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002634 if ((bit_width == 16 && !phys_dev_props_core12.shaderSignedZeroInfNanPreserveFloat16) ||
2635 (bit_width == 32 && !phys_dev_props_core12.shaderSignedZeroInfNanPreserveFloat32) ||
2636 (bit_width == 64 && !phys_dev_props_core12.shaderSignedZeroInfNanPreserveFloat64)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002637 skip |= LogError(
2638 device, kVUID_Core_Shader_FeatureNotEnabled,
2639 "Shader requires SignedZeroInfNanPreserve for bit width %d but it is not enabled on the device",
2640 bit_width);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002641 }
2642 break;
2643 }
2644
2645 case spv::ExecutionModeDenormPreserve: {
2646 auto bit_width = insn.word(3);
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002647 if ((bit_width == 16 && !phys_dev_props_core12.shaderDenormPreserveFloat16) ||
2648 (bit_width == 32 && !phys_dev_props_core12.shaderDenormPreserveFloat32) ||
2649 (bit_width == 64 && !phys_dev_props_core12.shaderDenormPreserveFloat64)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002650 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2651 "Shader requires DenormPreserve for bit width %d but it is not enabled on the device",
2652 bit_width);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002653 }
2654
Attilio Provenzanof6c0e852019-04-09 11:01:18 +01002655 if (first_denorm_execution_mode.first == spv::ExecutionModeMax) {
2656 // Register the first denorm execution mode found
2657 first_denorm_execution_mode = std::make_pair(static_cast<spv::ExecutionMode>(mode), bit_width);
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002658 } else if (first_denorm_execution_mode.first != mode && first_denorm_execution_mode.second != bit_width) {
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002659 switch (phys_dev_props_core12.denormBehaviorIndependence) {
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002660 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR:
2661 if (first_rounding_mode.second != 32 && bit_width != 32) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002662 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2663 "Shader uses different denorm execution modes for 16 and 64-bit but "
2664 "denormBehaviorIndependence is "
2665 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002666 }
2667 break;
2668
2669 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_ALL_KHR:
2670 break;
2671
2672 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR:
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002673 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2674 "Shader uses different denorm execution modes for different bit widths but "
2675 "denormBehaviorIndependence is "
2676 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002677 break;
2678
2679 default:
2680 break;
2681 }
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002682 }
2683 break;
2684 }
2685
2686 case spv::ExecutionModeDenormFlushToZero: {
2687 auto bit_width = insn.word(3);
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002688 if ((bit_width == 16 && !phys_dev_props_core12.shaderDenormFlushToZeroFloat16) ||
2689 (bit_width == 32 && !phys_dev_props_core12.shaderDenormFlushToZeroFloat32) ||
2690 (bit_width == 64 && !phys_dev_props_core12.shaderDenormFlushToZeroFloat64)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002691 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2692 "Shader requires DenormFlushToZero for bit width %d but it is not enabled on the device",
2693 bit_width);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002694 }
2695
Attilio Provenzanof6c0e852019-04-09 11:01:18 +01002696 if (first_denorm_execution_mode.first == spv::ExecutionModeMax) {
2697 // Register the first denorm execution mode found
2698 first_denorm_execution_mode = std::make_pair(static_cast<spv::ExecutionMode>(mode), bit_width);
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002699 } else if (first_denorm_execution_mode.first != mode && first_denorm_execution_mode.second != bit_width) {
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002700 switch (phys_dev_props_core12.denormBehaviorIndependence) {
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002701 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR:
2702 if (first_rounding_mode.second != 32 && bit_width != 32) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002703 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2704 "Shader uses different denorm execution modes for 16 and 64-bit but "
2705 "denormBehaviorIndependence is "
2706 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002707 }
2708 break;
2709
2710 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_ALL_KHR:
2711 break;
2712
2713 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR:
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002714 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2715 "Shader uses different denorm execution modes for different bit widths but "
2716 "denormBehaviorIndependence is "
2717 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002718 break;
2719
2720 default:
2721 break;
2722 }
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002723 }
2724 break;
2725 }
2726
2727 case spv::ExecutionModeRoundingModeRTE: {
2728 auto bit_width = insn.word(3);
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002729 if ((bit_width == 16 && !phys_dev_props_core12.shaderRoundingModeRTEFloat16) ||
2730 (bit_width == 32 && !phys_dev_props_core12.shaderRoundingModeRTEFloat32) ||
2731 (bit_width == 64 && !phys_dev_props_core12.shaderRoundingModeRTEFloat64)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002732 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2733 "Shader requires RoundingModeRTE for bit width %d but it is not enabled on the device",
2734 bit_width);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002735 }
2736
Attilio Provenzanof6c0e852019-04-09 11:01:18 +01002737 if (first_rounding_mode.first == spv::ExecutionModeMax) {
2738 // Register the first rounding mode found
2739 first_rounding_mode = std::make_pair(static_cast<spv::ExecutionMode>(mode), bit_width);
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002740 } else if (first_rounding_mode.first != mode && first_rounding_mode.second != bit_width) {
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002741 switch (phys_dev_props_core12.roundingModeIndependence) {
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002742 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR:
2743 if (first_rounding_mode.second != 32 && bit_width != 32) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002744 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2745 "Shader uses different rounding modes for 16 and 64-bit but "
2746 "roundingModeIndependence is "
2747 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002748 }
2749 break;
2750
2751 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_ALL_KHR:
2752 break;
2753
2754 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR:
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002755 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2756 "Shader uses different rounding modes for different bit widths but "
2757 "roundingModeIndependence is "
2758 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002759 break;
2760
2761 default:
2762 break;
2763 }
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002764 }
2765 break;
2766 }
2767
2768 case spv::ExecutionModeRoundingModeRTZ: {
2769 auto bit_width = insn.word(3);
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002770 if ((bit_width == 16 && !phys_dev_props_core12.shaderRoundingModeRTZFloat16) ||
2771 (bit_width == 32 && !phys_dev_props_core12.shaderRoundingModeRTZFloat32) ||
2772 (bit_width == 64 && !phys_dev_props_core12.shaderRoundingModeRTZFloat64)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002773 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2774 "Shader requires RoundingModeRTZ for bit width %d but it is not enabled on the device",
2775 bit_width);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002776 }
2777
Attilio Provenzanof6c0e852019-04-09 11:01:18 +01002778 if (first_rounding_mode.first == spv::ExecutionModeMax) {
2779 // Register the first rounding mode found
2780 first_rounding_mode = std::make_pair(static_cast<spv::ExecutionMode>(mode), bit_width);
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002781 } else if (first_rounding_mode.first != mode && first_rounding_mode.second != bit_width) {
Piers Daniell41b8c5d2020-01-10 15:42:00 -07002782 switch (phys_dev_props_core12.roundingModeIndependence) {
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002783 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR:
2784 if (first_rounding_mode.second != 32 && bit_width != 32) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002785 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2786 "Shader uses different rounding modes for 16 and 64-bit but "
2787 "roundingModeIndependence is "
2788 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_32_BIT_ONLY_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002789 }
2790 break;
2791
2792 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_ALL_KHR:
2793 break;
2794
2795 case VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR:
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002796 skip |= LogError(device, kVUID_Core_Shader_FeatureNotEnabled,
2797 "Shader uses different rounding modes for different bit widths but "
2798 "roundingModeIndependence is "
2799 "VK_SHADER_FLOAT_CONTROLS_INDEPENDENCE_NONE_KHR on the device");
Jason Ekstrande1e06de2019-08-05 11:43:43 -05002800 break;
2801
2802 default:
2803 break;
2804 }
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002805 }
2806 break;
2807 }
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002808
2809 case spv::ExecutionModeOutputVertices: {
2810 verticesOut = insn.word(3);
2811 break;
2812 }
2813
2814 case spv::ExecutionModeInvocations: {
2815 invocations = insn.word(3);
2816 break;
2817 }
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002818 }
2819 }
2820 }
2821
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002822 if (entrypoint.word(1) == spv::ExecutionModelGeometry) {
2823 if (verticesOut == 0 || verticesOut > phys_dev_props.limits.maxGeometryOutputVertices) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002824 skip |= LogError(device, "VUID-VkPipelineShaderStageCreateInfo-stage-00714",
2825 "Geometry shader entry point must have an OpExecutionMode instruction that "
2826 "specifies a maximum output vertex count that is greater than 0 and less "
2827 "than or equal to maxGeometryOutputVertices. "
2828 "OutputVertices=%d, maxGeometryOutputVertices=%d",
2829 verticesOut, phys_dev_props.limits.maxGeometryOutputVertices);
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002830 }
2831
2832 if (invocations == 0 || invocations > phys_dev_props.limits.maxGeometryShaderInvocations) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07002833 skip |= LogError(device, "VUID-VkPipelineShaderStageCreateInfo-stage-00715",
2834 "Geometry shader entry point must have an OpExecutionMode instruction that "
2835 "specifies an invocation count that is greater than 0 and less "
2836 "than or equal to maxGeometryShaderInvocations. "
2837 "Invocations=%d, maxGeometryShaderInvocations=%d",
2838 invocations, phys_dev_props.limits.maxGeometryShaderInvocations);
Jeff Bolze9ee3d82019-05-29 13:45:13 -05002839 }
2840 }
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00002841 return skip;
2842}
2843
locke-lunargd9a069d2019-09-17 01:50:19 -06002844uint32_t DescriptorTypeToReqs(SHADER_MODULE_STATE const *module, uint32_t type_id) {
Chris Forbes47567b72017-06-09 12:09:45 -07002845 auto type = module->get_def(type_id);
2846
2847 while (true) {
2848 switch (type.opcode()) {
2849 case spv::OpTypeArray:
Chris Forbes062f1222018-08-21 15:34:15 -07002850 case spv::OpTypeRuntimeArray:
Chris Forbes47567b72017-06-09 12:09:45 -07002851 case spv::OpTypeSampledImage:
2852 type = module->get_def(type.word(2));
2853 break;
2854 case spv::OpTypePointer:
2855 type = module->get_def(type.word(3));
2856 break;
2857 case spv::OpTypeImage: {
2858 auto dim = type.word(3);
2859 auto arrayed = type.word(5);
2860 auto msaa = type.word(6);
2861
Chris Forbes74ba2232018-08-27 15:19:27 -07002862 uint32_t bits = 0;
2863 switch (GetFundamentalType(module, type.word(2))) {
2864 case FORMAT_TYPE_FLOAT:
2865 bits = DESCRIPTOR_REQ_COMPONENT_TYPE_FLOAT;
2866 break;
2867 case FORMAT_TYPE_UINT:
2868 bits = DESCRIPTOR_REQ_COMPONENT_TYPE_UINT;
2869 break;
2870 case FORMAT_TYPE_SINT:
2871 bits = DESCRIPTOR_REQ_COMPONENT_TYPE_SINT;
2872 break;
2873 default:
2874 break;
2875 }
2876
Chris Forbes47567b72017-06-09 12:09:45 -07002877 switch (dim) {
2878 case spv::Dim1D:
Chris Forbes74ba2232018-08-27 15:19:27 -07002879 bits |= arrayed ? DESCRIPTOR_REQ_VIEW_TYPE_1D_ARRAY : DESCRIPTOR_REQ_VIEW_TYPE_1D;
2880 return bits;
Chris Forbes47567b72017-06-09 12:09:45 -07002881 case spv::Dim2D:
Chris Forbes74ba2232018-08-27 15:19:27 -07002882 bits |= msaa ? DESCRIPTOR_REQ_MULTI_SAMPLE : DESCRIPTOR_REQ_SINGLE_SAMPLE;
2883 bits |= arrayed ? DESCRIPTOR_REQ_VIEW_TYPE_2D_ARRAY : DESCRIPTOR_REQ_VIEW_TYPE_2D;
2884 return bits;
Chris Forbes47567b72017-06-09 12:09:45 -07002885 case spv::Dim3D:
Chris Forbes74ba2232018-08-27 15:19:27 -07002886 bits |= DESCRIPTOR_REQ_VIEW_TYPE_3D;
2887 return bits;
Chris Forbes47567b72017-06-09 12:09:45 -07002888 case spv::DimCube:
Chris Forbes74ba2232018-08-27 15:19:27 -07002889 bits |= arrayed ? DESCRIPTOR_REQ_VIEW_TYPE_CUBE_ARRAY : DESCRIPTOR_REQ_VIEW_TYPE_CUBE;
2890 return bits;
Chris Forbes47567b72017-06-09 12:09:45 -07002891 case spv::DimSubpassData:
Chris Forbes74ba2232018-08-27 15:19:27 -07002892 bits |= msaa ? DESCRIPTOR_REQ_MULTI_SAMPLE : DESCRIPTOR_REQ_SINGLE_SAMPLE;
2893 return bits;
Chris Forbes47567b72017-06-09 12:09:45 -07002894 default: // buffer, etc.
Chris Forbes74ba2232018-08-27 15:19:27 -07002895 return bits;
Chris Forbes47567b72017-06-09 12:09:45 -07002896 }
2897 }
2898 default:
2899 return 0;
2900 }
2901 }
2902}
2903
2904// For given pipelineLayout verify that the set_layout_node at slot.first
2905// has the requested binding at slot.second and return ptr to that binding
Mark Lobodzinskica6ebe32019-04-25 11:43:37 -06002906static VkDescriptorSetLayoutBinding const *GetDescriptorBinding(PIPELINE_LAYOUT_STATE const *pipelineLayout,
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06002907 descriptor_slot_t slot) {
Chris Forbes47567b72017-06-09 12:09:45 -07002908 if (!pipelineLayout) return nullptr;
2909
2910 if (slot.first >= pipelineLayout->set_layouts.size()) return nullptr;
2911
2912 return pipelineLayout->set_layouts[slot.first]->GetDescriptorSetLayoutBindingPtrFromBinding(slot.second);
2913}
2914
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06002915static bool FindLocalSize(SHADER_MODULE_STATE const *src, uint32_t &local_size_x, uint32_t &local_size_y, uint32_t &local_size_z) {
Locke1ec6d952019-04-02 11:57:21 -06002916 for (auto insn : *src) {
2917 if (insn.opcode() == spv::OpEntryPoint) {
2918 auto executionModel = insn.word(1);
2919 auto entrypointStageBits = ExecutionModelToShaderStageFlagBits(executionModel);
2920 if (entrypointStageBits == VK_SHADER_STAGE_COMPUTE_BIT) {
2921 auto entrypoint_id = insn.word(2);
2922 for (auto insn1 : *src) {
2923 if (insn1.opcode() == spv::OpExecutionMode && insn1.word(1) == entrypoint_id &&
2924 insn1.word(2) == spv::ExecutionModeLocalSize) {
2925 local_size_x = insn1.word(3);
2926 local_size_y = insn1.word(4);
2927 local_size_z = insn1.word(5);
2928 return true;
2929 }
2930 }
2931 }
2932 }
2933 }
2934 return false;
2935}
2936
locke-lunargd9a069d2019-09-17 01:50:19 -06002937void ProcessExecutionModes(SHADER_MODULE_STATE const *src, const spirv_inst_iter &entrypoint, PIPELINE_STATE *pipeline) {
Jeff Bolz105d6492018-09-29 15:46:44 -05002938 auto entrypoint_id = entrypoint.word(2);
Chris Forbes0771b672018-03-22 21:13:46 -07002939 bool is_point_mode = false;
2940
2941 for (auto insn : *src) {
2942 if (insn.opcode() == spv::OpExecutionMode && insn.word(1) == entrypoint_id) {
2943 switch (insn.word(2)) {
2944 case spv::ExecutionModePointMode:
2945 // In tessellation shaders, PointMode is separate and trumps the tessellation topology.
2946 is_point_mode = true;
2947 break;
2948
2949 case spv::ExecutionModeOutputPoints:
2950 pipeline->topology_at_rasterizer = VK_PRIMITIVE_TOPOLOGY_POINT_LIST;
2951 break;
2952
2953 case spv::ExecutionModeIsolines:
2954 case spv::ExecutionModeOutputLineStrip:
2955 pipeline->topology_at_rasterizer = VK_PRIMITIVE_TOPOLOGY_LINE_STRIP;
2956 break;
2957
2958 case spv::ExecutionModeTriangles:
2959 case spv::ExecutionModeQuads:
2960 case spv::ExecutionModeOutputTriangleStrip:
2961 pipeline->topology_at_rasterizer = VK_PRIMITIVE_TOPOLOGY_TRIANGLE_STRIP;
2962 break;
2963 }
2964 }
2965 }
2966
2967 if (is_point_mode) pipeline->topology_at_rasterizer = VK_PRIMITIVE_TOPOLOGY_POINT_LIST;
2968}
2969
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06002970// If PointList topology is specified in the pipeline, verify that a shader geometry stage writes PointSize
2971// o If there is only a vertex shader : gl_PointSize must be written when using points
2972// o If there is a geometry or tessellation shader:
2973// - If shaderTessellationAndGeometryPointSize feature is enabled:
2974// * gl_PointSize must be written in the final geometry stage
2975// - If shaderTessellationAndGeometryPointSize feature is disabled:
2976// * gl_PointSize must NOT be written and a default of 1.0 is assumed
Mark Lobodzinski3c59d972019-04-25 11:28:14 -06002977bool CoreChecks::ValidatePointListShaderState(const PIPELINE_STATE *pipeline, SHADER_MODULE_STATE const *src,
John Zulaufac4c6e12019-07-01 16:05:58 -06002978 spirv_inst_iter entrypoint, VkShaderStageFlagBits stage) const {
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06002979 if (pipeline->topology_at_rasterizer != VK_PRIMITIVE_TOPOLOGY_POINT_LIST) {
2980 return false;
2981 }
2982
2983 bool pointsize_written = false;
2984 bool skip = false;
2985
2986 // Search for PointSize built-in decorations
2987 std::vector<uint32_t> pointsize_builtin_offsets;
2988 spirv_inst_iter insn = entrypoint;
2989 while (!pointsize_written && (insn.opcode() != spv::OpFunction)) {
2990 if (insn.opcode() == spv::OpMemberDecorate) {
2991 if (insn.word(3) == spv::DecorationBuiltIn) {
2992 if (insn.word(4) == spv::BuiltInPointSize) {
2993 pointsize_written = IsPointSizeWritten(src, insn, entrypoint);
2994 }
2995 }
2996 } else if (insn.opcode() == spv::OpDecorate) {
2997 if (insn.word(2) == spv::DecorationBuiltIn) {
2998 if (insn.word(3) == spv::BuiltInPointSize) {
2999 pointsize_written = IsPointSizeWritten(src, insn, entrypoint);
3000 }
3001 }
3002 }
3003
3004 insn++;
3005 }
3006
3007 if ((stage == VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT || stage == VK_SHADER_STAGE_GEOMETRY_BIT) &&
Mark Lobodzinskid7b03cc2019-04-19 14:23:10 -06003008 !enabled_features.core.shaderTessellationAndGeometryPointSize) {
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003009 if (pointsize_written) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003010 skip |= LogError(pipeline->pipeline, kVUID_Core_Shader_PointSizeBuiltInOverSpecified,
3011 "Pipeline topology is set to POINT_LIST and geometry or tessellation shaders write PointSize which "
3012 "is prohibited when the shaderTessellationAndGeometryPointSize feature is not enabled.");
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003013 }
3014 } else if (!pointsize_written) {
3015 skip |=
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003016 LogError(pipeline->pipeline, kVUID_Core_Shader_MissingPointSizeBuiltIn,
3017 "Pipeline topology is set to POINT_LIST, but PointSize is not written to in the shader corresponding to %s.",
3018 string_VkShaderStageFlagBits(stage));
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003019 }
3020 return skip;
3021}
John Zulauf14c355b2019-06-27 16:09:37 -06003022
3023bool CoreChecks::ValidatePipelineShaderStage(VkPipelineShaderStageCreateInfo const *pStage, const PIPELINE_STATE *pipeline,
3024 const PIPELINE_STATE::StageState &stage_state, const SHADER_MODULE_STATE *module,
John Zulaufac4c6e12019-07-01 16:05:58 -06003025 const spirv_inst_iter &entrypoint, bool check_point_size) const {
John Zulauf14c355b2019-06-27 16:09:37 -06003026 bool skip = false;
3027
3028 // Check the module
3029 if (!module->has_valid_spirv) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003030 skip |= LogError(device, "VUID-VkPipelineShaderStageCreateInfo-module-parameter",
3031 "%s does not contain valid spirv for stage %s.",
3032 report_data->FormatHandle(module->vk_shader_module).c_str(), string_VkShaderStageFlagBits(pStage->stage));
John Zulauf14c355b2019-06-27 16:09:37 -06003033 }
3034
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003035 // If specialization-constant values are given and specialization-constant instructions are present in the shader, the
3036 // specializations should be applied and validated.
3037 if (pStage->pSpecializationInfo != nullptr && pStage->pSpecializationInfo->mapEntryCount > 0 &&
3038 pStage->pSpecializationInfo->pMapEntries != nullptr && module->has_specialization_constants) {
3039 // Gather the specialization-constant values.
3040 auto const &specialization_info = pStage->pSpecializationInfo;
Jeremy Hayes521221d2020-01-15 16:48:49 -07003041 auto const &specialization_data = reinterpret_cast<uint8_t const *>(specialization_info->pData);
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003042 std::unordered_map<uint32_t, std::vector<uint32_t>> id_value_map;
3043 id_value_map.reserve(specialization_info->mapEntryCount);
3044 for (auto i = 0u; i < specialization_info->mapEntryCount; ++i) {
3045 auto const &map_entry = specialization_info->pMapEntries[i];
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003046
Jeremy Hayes521221d2020-01-15 16:48:49 -07003047 // Expect only scalar types.
3048 assert(map_entry.size == 1 || map_entry.size == 2 || map_entry.size == 4 || map_entry.size == 8);
3049 auto entry = id_value_map.emplace(map_entry.constantID, std::vector<uint32_t>(map_entry.size > 4 ? 2 : 1));
3050 memcpy(entry.first->second.data(), specialization_data + map_entry.offset, map_entry.size);
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003051 }
3052
3053 // Apply the specialization-constant values and revalidate the shader module.
Tony-LunarG8a51b7d2020-07-01 15:57:23 -06003054 spv_target_env spirv_environment = PickSpirvEnv(api_version, (device_extensions.vk_khr_spirv_1_4 != kNotEnabled));
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003055 spvtools::Optimizer optimizer(spirv_environment);
3056 spvtools::MessageConsumer consumer = [&skip, &module, &pStage, this](spv_message_level_t level, const char *source,
3057 const spv_position_t &position, const char *message) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003058 skip |= LogError(
3059 device, "VUID-VkPipelineShaderStageCreateInfo-module-parameter", "%s does not contain valid spirv for stage %s. %s",
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003060 report_data->FormatHandle(module->vk_shader_module).c_str(), string_VkShaderStageFlagBits(pStage->stage), message);
3061 };
3062 optimizer.SetMessageConsumer(consumer);
3063 optimizer.RegisterPass(spvtools::CreateSetSpecConstantDefaultValuePass(id_value_map));
3064 optimizer.RegisterPass(spvtools::CreateFreezeSpecConstantValuePass());
3065 std::vector<uint32_t> specialized_spirv;
3066 auto const optimized =
3067 optimizer.Run(module->words.data(), module->words.size(), &specialized_spirv, spvtools::ValidatorOptions(), true);
3068 assert(optimized == true);
3069
3070 if (optimized) {
3071 spv_context ctx = spvContextCreate(spirv_environment);
3072 spv_const_binary_t binary{specialized_spirv.data(), specialized_spirv.size()};
3073 spv_diagnostic diag = nullptr;
Tony-LunarG9fe69a42020-07-23 15:09:37 -06003074 spvtools::ValidatorOptions options;
3075 AdjustValidatorOptions(device_extensions, enabled_features, options);
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003076 auto const spv_valid = spvValidateWithOptions(ctx, options, &binary, &diag);
3077 if (spv_valid != SPV_SUCCESS) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003078 skip |= LogError(device, "VUID-VkPipelineShaderStageCreateInfo-module-parameter",
3079 "After specialization was applied, %s does not contain valid spirv for stage %s.",
3080 report_data->FormatHandle(module->vk_shader_module).c_str(),
3081 string_VkShaderStageFlagBits(pStage->stage));
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003082 }
3083
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003084 spvDiagnosticDestroy(diag);
3085 spvContextDestroy(ctx);
3086 }
3087 }
3088
John Zulauf14c355b2019-06-27 16:09:37 -06003089 // Check the entrypoint
3090 if (entrypoint == module->end()) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003091 skip |=
3092 LogError(device, "VUID-VkPipelineShaderStageCreateInfo-pName-00707", "No entrypoint found named `%s` for stage %s..",
3093 pStage->pName, string_VkShaderStageFlagBits(pStage->stage));
John Zulauf14c355b2019-06-27 16:09:37 -06003094 }
3095 if (skip) return true; // no point continuing beyond here, any analysis is just going to be garbage.
3096
3097 // Mark accessible ids
3098 auto &accessible_ids = stage_state.accessible_ids;
3099
Chris Forbes47567b72017-06-09 12:09:45 -07003100 // Validate descriptor set layout against what the entrypoint actually uses
John Zulauf14c355b2019-06-27 16:09:37 -06003101 bool has_writable_descriptor = stage_state.has_writable_descriptor;
3102 auto &descriptor_uses = stage_state.descriptor_uses;
Chris Forbes47567b72017-06-09 12:09:45 -07003103
Chris Forbes349b3132018-03-07 11:38:08 -08003104 // Validate shader capabilities against enabled device features
Jeff Bolzee743412019-06-20 22:24:32 -05003105 skip |= ValidateShaderCapabilities(module, pStage->stage);
3106 skip |= ValidateShaderStageWritableDescriptor(pStage->stage, has_writable_descriptor);
Jeff Bolze9ee3d82019-05-29 13:45:13 -05003107 skip |= ValidateShaderStageInputOutputLimits(module, pStage, pipeline, entrypoint);
sfricke-samsungdc96f302020-03-18 20:42:10 -07003108 skip |= ValidateShaderStageMaxResources(pStage->stage, pipeline);
Jeff Bolz526f2d52019-09-18 13:18:08 -05003109 skip |= ValidateShaderStageGroupNonUniform(module, pStage->stage);
Attilio Provenzanoc5d50102019-03-25 17:40:37 +00003110 skip |= ValidateExecutionModes(module, entrypoint);
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07003111 skip |= ValidateSpecializationOffsets(pStage);
3112 skip |= ValidatePushConstantUsage(pipeline->pipeline_layout->push_constant_ranges.get(), module, accessible_ids, pStage->stage);
Jeff Bolze54ae892018-09-08 12:16:29 -05003113 if (check_point_size && !pipeline->graphicsPipelineCI.pRasterizationState->rasterizerDiscardEnable) {
Mark Lobodzinski518eadc2019-03-09 12:07:30 -07003114 skip |= ValidatePointListShaderState(pipeline, module, entrypoint, pStage->stage);
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003115 }
Jeff Bolze4356752019-03-07 11:23:46 -06003116 skip |= ValidateCooperativeMatrix(module, pStage, pipeline);
Chris Forbes47567b72017-06-09 12:09:45 -07003117
3118 // Validate descriptor use
3119 for (auto use : descriptor_uses) {
Chris Forbes47567b72017-06-09 12:09:45 -07003120 // Verify given pipelineLayout has requested setLayout with requested binding
Jeff Bolze7fc67b2019-10-04 12:29:31 -05003121 const auto &binding = GetDescriptorBinding(pipeline->pipeline_layout.get(), use.first);
Chris Forbes47567b72017-06-09 12:09:45 -07003122 unsigned required_descriptor_count;
Jeff Bolze54ae892018-09-08 12:16:29 -05003123 std::set<uint32_t> descriptor_types = TypeToDescriptorTypeSet(module, use.second.type_id, required_descriptor_count);
Chris Forbes47567b72017-06-09 12:09:45 -07003124
3125 if (!binding) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003126 skip |= LogError(device, kVUID_Core_Shader_MissingDescriptor,
3127 "Shader uses descriptor slot %u.%u (expected `%s`) but not declared in pipeline layout",
3128 use.first.first, use.first.second, string_descriptorTypes(descriptor_types).c_str());
Chris Forbes47567b72017-06-09 12:09:45 -07003129 } else if (~binding->stageFlags & pStage->stage) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003130 skip |= LogError(device, kVUID_Core_Shader_DescriptorNotAccessibleFromStage,
3131 "Shader uses descriptor slot %u.%u but descriptor not accessible from stage %s", use.first.first,
3132 use.first.second, string_VkShaderStageFlagBits(pStage->stage));
Jeff Bolze54ae892018-09-08 12:16:29 -05003133 } else if (descriptor_types.find(binding->descriptorType) == descriptor_types.end()) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003134 skip |= LogError(device, kVUID_Core_Shader_DescriptorTypeMismatch,
3135 "Type mismatch on descriptor slot %u.%u (expected `%s`) but descriptor of type %s", use.first.first,
3136 use.first.second, string_descriptorTypes(descriptor_types).c_str(),
3137 string_VkDescriptorType(binding->descriptorType));
Chris Forbes47567b72017-06-09 12:09:45 -07003138 } else if (binding->descriptorCount < required_descriptor_count) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003139 skip |= LogError(device, kVUID_Core_Shader_DescriptorTypeMismatch,
3140 "Shader expects at least %u descriptors for binding %u.%u but only %u provided",
3141 required_descriptor_count, use.first.first, use.first.second, binding->descriptorCount);
Chris Forbes47567b72017-06-09 12:09:45 -07003142 }
3143 }
3144
3145 // Validate use of input attachments against subpass structure
3146 if (pStage->stage == VK_SHADER_STAGE_FRAGMENT_BIT) {
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003147 auto input_attachment_uses = CollectInterfaceByInputAttachmentIndex(module, accessible_ids);
Chris Forbes47567b72017-06-09 12:09:45 -07003148
Petr Krause91f7a12017-12-14 20:57:36 +01003149 auto rpci = pipeline->rp_state->createInfo.ptr();
Chris Forbes47567b72017-06-09 12:09:45 -07003150 auto subpass = pipeline->graphicsPipelineCI.subpass;
3151
3152 for (auto use : input_attachment_uses) {
3153 auto input_attachments = rpci->pSubpasses[subpass].pInputAttachments;
3154 auto index = (input_attachments && use.first < rpci->pSubpasses[subpass].inputAttachmentCount)
Dave Houltona9df0ce2018-02-07 10:51:23 -07003155 ? input_attachments[use.first].attachment
3156 : VK_ATTACHMENT_UNUSED;
Chris Forbes47567b72017-06-09 12:09:45 -07003157
3158 if (index == VK_ATTACHMENT_UNUSED) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003159 skip |= LogError(device, kVUID_Core_Shader_MissingInputAttachment,
3160 "Shader consumes input attachment index %d but not provided in subpass", use.first);
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003161 } else if (!(GetFormatType(rpci->pAttachments[index].format) & GetFundamentalType(module, use.second.type_id))) {
Chris Forbes47567b72017-06-09 12:09:45 -07003162 skip |=
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003163 LogError(device, kVUID_Core_Shader_InputAttachmentTypeMismatch,
3164 "Subpass input attachment %u format of %s does not match type used in shader `%s`", use.first,
3165 string_VkFormat(rpci->pAttachments[index].format), DescribeType(module, use.second.type_id).c_str());
Chris Forbes47567b72017-06-09 12:09:45 -07003166 }
3167 }
3168 }
Lockeaa8fdc02019-04-02 11:59:20 -06003169 if (pStage->stage == VK_SHADER_STAGE_COMPUTE_BIT) {
3170 skip |= ValidateComputeWorkGroupSizes(module);
3171 }
Chris Forbes47567b72017-06-09 12:09:45 -07003172 return skip;
3173}
3174
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07003175bool CoreChecks::ValidateInterfaceBetweenStages(SHADER_MODULE_STATE const *producer, spirv_inst_iter producer_entrypoint,
3176 shader_stage_attributes const *producer_stage, SHADER_MODULE_STATE const *consumer,
3177 spirv_inst_iter consumer_entrypoint,
3178 shader_stage_attributes const *consumer_stage) const {
Chris Forbes47567b72017-06-09 12:09:45 -07003179 bool skip = false;
3180
3181 auto outputs =
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003182 CollectInterfaceByLocation(producer, producer_entrypoint, spv::StorageClassOutput, producer_stage->arrayed_output);
3183 auto inputs = CollectInterfaceByLocation(consumer, consumer_entrypoint, spv::StorageClassInput, consumer_stage->arrayed_input);
Chris Forbes47567b72017-06-09 12:09:45 -07003184
3185 auto a_it = outputs.begin();
3186 auto b_it = inputs.begin();
3187
3188 // Maps sorted by key (location); walk them together to find mismatches
3189 while ((outputs.size() > 0 && a_it != outputs.end()) || (inputs.size() && b_it != inputs.end())) {
3190 bool a_at_end = outputs.size() == 0 || a_it == outputs.end();
3191 bool b_at_end = inputs.size() == 0 || b_it == inputs.end();
3192 auto a_first = a_at_end ? std::make_pair(0u, 0u) : a_it->first;
3193 auto b_first = b_at_end ? std::make_pair(0u, 0u) : b_it->first;
3194
3195 if (b_at_end || ((!a_at_end) && (a_first < b_first))) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003196 skip |= LogPerformanceWarning(producer->vk_shader_module, kVUID_Core_Shader_OutputNotConsumed,
3197 "%s writes to output location %u.%u which is not consumed by %s", producer_stage->name,
3198 a_first.first, a_first.second, consumer_stage->name);
Chris Forbes47567b72017-06-09 12:09:45 -07003199 a_it++;
3200 } else if (a_at_end || a_first > b_first) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003201 skip |= LogError(consumer->vk_shader_module, kVUID_Core_Shader_InputNotProduced,
3202 "%s consumes input location %u.%u which is not written by %s", consumer_stage->name, b_first.first,
3203 b_first.second, producer_stage->name);
Chris Forbes47567b72017-06-09 12:09:45 -07003204 b_it++;
3205 } else {
3206 // subtleties of arrayed interfaces:
3207 // - if is_patch, then the member is not arrayed, even though the interface may be.
3208 // - if is_block_member, then the extra array level of an arrayed interface is not
3209 // expressed in the member type -- it's expressed in the block type.
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003210 if (!TypesMatch(producer, consumer, a_it->second.type_id, b_it->second.type_id,
3211 producer_stage->arrayed_output && !a_it->second.is_patch && !a_it->second.is_block_member,
3212 consumer_stage->arrayed_input && !b_it->second.is_patch && !b_it->second.is_block_member, true)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003213 skip |= LogError(producer->vk_shader_module, kVUID_Core_Shader_InterfaceTypeMismatch,
3214 "Type mismatch on location %u.%u: '%s' vs '%s'", a_first.first, a_first.second,
3215 DescribeType(producer, a_it->second.type_id).c_str(),
3216 DescribeType(consumer, b_it->second.type_id).c_str());
Chris Forbes47567b72017-06-09 12:09:45 -07003217 }
3218 if (a_it->second.is_patch != b_it->second.is_patch) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003219 skip |= LogError(producer->vk_shader_module, kVUID_Core_Shader_InterfaceTypeMismatch,
3220 "Decoration mismatch on location %u.%u: is per-%s in %s stage but per-%s in %s stage",
3221 a_first.first, a_first.second, a_it->second.is_patch ? "patch" : "vertex", producer_stage->name,
3222 b_it->second.is_patch ? "patch" : "vertex", consumer_stage->name);
Chris Forbes47567b72017-06-09 12:09:45 -07003223 }
3224 if (a_it->second.is_relaxed_precision != b_it->second.is_relaxed_precision) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003225 skip |= LogError(producer->vk_shader_module, kVUID_Core_Shader_InterfaceTypeMismatch,
3226 "Decoration mismatch on location %u.%u: %s and %s stages differ in precision", a_first.first,
3227 a_first.second, producer_stage->name, consumer_stage->name);
Chris Forbes47567b72017-06-09 12:09:45 -07003228 }
3229 a_it++;
3230 b_it++;
3231 }
3232 }
3233
Ari Suonpaa696b3432019-03-11 14:02:57 +02003234 if (consumer_stage->stage != VK_SHADER_STAGE_FRAGMENT_BIT) {
3235 auto builtins_producer = CollectBuiltinBlockMembers(producer, producer_entrypoint, spv::StorageClassOutput);
3236 auto builtins_consumer = CollectBuiltinBlockMembers(consumer, consumer_entrypoint, spv::StorageClassInput);
3237
3238 if (!builtins_producer.empty() && !builtins_consumer.empty()) {
3239 if (builtins_producer.size() != builtins_consumer.size()) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003240 skip |= LogError(producer->vk_shader_module, kVUID_Core_Shader_InterfaceTypeMismatch,
3241 "Number of elements inside builtin block differ between stages (%s %d vs %s %d).",
3242 producer_stage->name, (int)builtins_producer.size(), consumer_stage->name,
3243 (int)builtins_consumer.size());
Ari Suonpaa696b3432019-03-11 14:02:57 +02003244 } else {
3245 auto it_producer = builtins_producer.begin();
3246 auto it_consumer = builtins_consumer.begin();
3247 while (it_producer != builtins_producer.end() && it_consumer != builtins_consumer.end()) {
3248 if (*it_producer != *it_consumer) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003249 skip |= LogError(producer->vk_shader_module, kVUID_Core_Shader_InterfaceTypeMismatch,
3250 "Builtin variable inside block doesn't match between %s and %s.", producer_stage->name,
3251 consumer_stage->name);
Ari Suonpaa696b3432019-03-11 14:02:57 +02003252 break;
3253 }
3254 it_producer++;
3255 it_consumer++;
3256 }
3257 }
3258 }
3259 }
3260
Chris Forbes47567b72017-06-09 12:09:45 -07003261 return skip;
3262}
3263
John Zulauf14c355b2019-06-27 16:09:37 -06003264static inline uint32_t DetermineFinalGeomStage(const PIPELINE_STATE *pipeline, const VkGraphicsPipelineCreateInfo *pCreateInfo) {
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003265 uint32_t stage_mask = 0;
3266 if (pipeline->topology_at_rasterizer == VK_PRIMITIVE_TOPOLOGY_POINT_LIST) {
3267 for (uint32_t i = 0; i < pCreateInfo->stageCount; i++) {
3268 stage_mask |= pCreateInfo->pStages[i].stage;
3269 }
3270 // Determine which shader in which PointSize should be written (the final geometry stage)
Jeff Bolz105d6492018-09-29 15:46:44 -05003271 if (stage_mask & VK_SHADER_STAGE_MESH_BIT_NV) {
3272 stage_mask = VK_SHADER_STAGE_MESH_BIT_NV;
3273 } else if (stage_mask & VK_SHADER_STAGE_GEOMETRY_BIT) {
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003274 stage_mask = VK_SHADER_STAGE_GEOMETRY_BIT;
3275 } else if (stage_mask & VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT) {
3276 stage_mask = VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT;
3277 } else if (stage_mask & VK_SHADER_STAGE_VERTEX_BIT) {
3278 stage_mask = VK_SHADER_STAGE_VERTEX_BIT;
Mark Lobodzinski2c984cc2018-07-31 09:57:46 -06003279 }
3280 }
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003281 return stage_mask;
Mark Lobodzinski2c984cc2018-07-31 09:57:46 -06003282}
3283
Chris Forbes47567b72017-06-09 12:09:45 -07003284// Validate that the shaders used by the given pipeline and store the active_slots
3285// that are actually used by the pipeline into pPipeline->active_slots
John Zulaufac4c6e12019-07-01 16:05:58 -06003286bool CoreChecks::ValidateGraphicsPipelineShaderState(const PIPELINE_STATE *pipeline) const {
Chris Forbesa400a8a2017-07-20 13:10:24 -07003287 auto pCreateInfo = pipeline->graphicsPipelineCI.ptr();
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003288 int vertex_stage = GetShaderStageId(VK_SHADER_STAGE_VERTEX_BIT);
3289 int fragment_stage = GetShaderStageId(VK_SHADER_STAGE_FRAGMENT_BIT);
Chris Forbes47567b72017-06-09 12:09:45 -07003290
John Zulauf14c355b2019-06-27 16:09:37 -06003291 const SHADER_MODULE_STATE *shaders[32];
Chris Forbes47567b72017-06-09 12:09:45 -07003292 memset(shaders, 0, sizeof(shaders));
Jeff Bolz7e35c392018-09-04 15:30:41 -05003293 spirv_inst_iter entrypoints[32];
Chris Forbes47567b72017-06-09 12:09:45 -07003294 memset(entrypoints, 0, sizeof(entrypoints));
3295 bool skip = false;
3296
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003297 uint32_t pointlist_stage_mask = DetermineFinalGeomStage(pipeline, pCreateInfo);
3298
Chris Forbes47567b72017-06-09 12:09:45 -07003299 for (uint32_t i = 0; i < pCreateInfo->stageCount; i++) {
3300 auto pStage = &pCreateInfo->pStages[i];
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003301 auto stage_id = GetShaderStageId(pStage->stage);
John Zulauf14c355b2019-06-27 16:09:37 -06003302 shaders[stage_id] = GetShaderModuleState(pStage->module);
3303 entrypoints[stage_id] = FindEntrypoint(shaders[stage_id], pStage->pName, pStage->stage);
3304 skip |= ValidatePipelineShaderStage(pStage, pipeline, pipeline->stage_state[i], shaders[stage_id], entrypoints[stage_id],
Mark Lobodzinski1b4a8ed2018-08-07 08:47:05 -06003305 (pointlist_stage_mask == pStage->stage));
Chris Forbes47567b72017-06-09 12:09:45 -07003306 }
3307
3308 // if the shader stages are no good individually, cross-stage validation is pointless.
3309 if (skip) return true;
3310
3311 auto vi = pCreateInfo->pVertexInputState;
3312
3313 if (vi) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07003314 skip |= ValidateViConsistency(vi);
Chris Forbes47567b72017-06-09 12:09:45 -07003315 }
3316
3317 if (shaders[vertex_stage] && shaders[vertex_stage]->has_valid_spirv) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07003318 skip |= ValidateViAgainstVsInputs(vi, shaders[vertex_stage], entrypoints[vertex_stage]);
Chris Forbes47567b72017-06-09 12:09:45 -07003319 }
3320
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003321 int producer = GetShaderStageId(VK_SHADER_STAGE_VERTEX_BIT);
3322 int consumer = GetShaderStageId(VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT);
Chris Forbes47567b72017-06-09 12:09:45 -07003323
3324 while (!shaders[producer] && producer != fragment_stage) {
3325 producer++;
3326 consumer++;
3327 }
3328
3329 for (; producer != fragment_stage && consumer <= fragment_stage; consumer++) {
3330 assert(shaders[producer]);
Chris Forbesdbb43fc2018-02-16 16:59:23 -08003331 if (shaders[consumer]) {
3332 if (shaders[consumer]->has_valid_spirv && shaders[producer]->has_valid_spirv) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07003333 skip |= ValidateInterfaceBetweenStages(shaders[producer], entrypoints[producer], &shader_stage_attribs[producer],
3334 shaders[consumer], entrypoints[consumer], &shader_stage_attribs[consumer]);
Chris Forbesdbb43fc2018-02-16 16:59:23 -08003335 }
Chris Forbes47567b72017-06-09 12:09:45 -07003336
3337 producer = consumer;
3338 }
3339 }
3340
3341 if (shaders[fragment_stage] && shaders[fragment_stage]->has_valid_spirv) {
Mark Lobodzinskid8d658e2020-01-30 15:05:51 -07003342 skip |= ValidateFsOutputsAgainstRenderPass(shaders[fragment_stage], entrypoints[fragment_stage], pipeline,
Shannon McPhersonc06c33d2018-06-28 17:21:12 -06003343 pCreateInfo->subpass);
Chris Forbes47567b72017-06-09 12:09:45 -07003344 }
3345
3346 return skip;
3347}
3348
sfricke-samsunge72a85e2020-02-29 21:48:37 -08003349bool CoreChecks::ValidateComputePipelineShaderState(PIPELINE_STATE *pipeline) const {
John Zulauf14c355b2019-06-27 16:09:37 -06003350 const auto &stage = *pipeline->computePipelineCI.stage.ptr();
Chris Forbes47567b72017-06-09 12:09:45 -07003351
John Zulauf14c355b2019-06-27 16:09:37 -06003352 const SHADER_MODULE_STATE *module = GetShaderModuleState(stage.module);
3353 const spirv_inst_iter entrypoint = FindEntrypoint(module, stage.pName, stage.stage);
Chris Forbes47567b72017-06-09 12:09:45 -07003354
John Zulauf14c355b2019-06-27 16:09:37 -06003355 return ValidatePipelineShaderStage(&stage, pipeline, pipeline->stage_state[0], module, entrypoint, false);
Chris Forbes47567b72017-06-09 12:09:45 -07003356}
Chris Forbes4ae55b32017-06-09 14:42:56 -07003357
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003358bool CoreChecks::ValidateRayTracingPipeline(PIPELINE_STATE *pipeline, bool isKHR) const {
John Zulaufe4474e72019-07-01 17:28:27 -06003359 bool skip = false;
Jason Macnak15f95e82019-08-21 21:52:02 -04003360
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003361 if (isKHR) {
3362 if (pipeline->raytracingPipelineCI.maxRecursionDepth > phys_dev_ext_props.ray_tracing_propsKHR.maxRecursionDepth) {
3363 skip |= LogError(device, "VUID-VkRayTracingPipelineCreateInfoKHR-maxRecursionDepth-03464", ": %d > %d",
3364 pipeline->raytracingPipelineCI.maxRecursionDepth,
3365 phys_dev_ext_props.ray_tracing_propsKHR.maxRecursionDepth);
3366 }
sourav parmar83c31b12020-05-06 12:30:54 -07003367 for (uint32_t i = 0; i < pipeline->raytracingPipelineCI.libraries.libraryCount; ++i) {
3368 const PIPELINE_STATE *pLibrary_pipelinestate = GetPipelineState(pipeline->raytracingPipelineCI.libraries.pLibraries[i]);
3369 if (pLibrary_pipelinestate->raytracingPipelineCI.maxRecursionDepth !=
3370 pipeline->raytracingPipelineCI.maxRecursionDepth) {
3371 skip |= LogError(
3372 device, "VUID-VkRayTracingPipelineCreateInfoKHR-pLibraries-03467",
3373 "vkCreateRayTracingPipelinesKHR: Each element (%d) of the pLibraries member of libraries must have been"
3374 "created with the value of maxRecursionDepth (%d) equal to that in this pipeline (%d) .",
3375 i, pLibrary_pipelinestate->raytracingPipelineCI.maxRecursionDepth,
3376 pipeline->raytracingPipelineCI.maxRecursionDepth);
3377 }
3378 if (pLibrary_pipelinestate->raytracingPipelineCI.pLibraryInterface->maxAttributeSize !=
3379 pipeline->raytracingPipelineCI.pLibraryInterface->maxAttributeSize ||
3380 pLibrary_pipelinestate->raytracingPipelineCI.pLibraryInterface->maxPayloadSize !=
3381 pipeline->raytracingPipelineCI.pLibraryInterface->maxPayloadSize ||
3382 pLibrary_pipelinestate->raytracingPipelineCI.pLibraryInterface->maxCallableSize !=
3383 pipeline->raytracingPipelineCI.pLibraryInterface->maxCallableSize) {
3384 skip |=
3385 LogError(device, "VUID-VkRayTracingPipelineCreateInfoKHR-pLibraries-03469",
3386 "vkCreateRayTracingPipelinesKHR: Each element of the pLibraries member of libraries must have been "
3387 "created with values of the maxPayloadSize,"
3388 "maxAttributeSize, and maxCallableSize members of pLibraryInterface equal to those in this pipeline.");
3389 }
3390 }
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003391 } else {
3392 if (pipeline->raytracingPipelineCI.maxRecursionDepth > phys_dev_ext_props.ray_tracing_propsNV.maxRecursionDepth) {
3393 skip |= LogError(device, "VUID-VkRayTracingPipelineCreateInfoNV-maxRecursionDepth-03457", ": %d > %d",
3394 pipeline->raytracingPipelineCI.maxRecursionDepth,
3395 phys_dev_ext_props.ray_tracing_propsNV.maxRecursionDepth);
3396 }
Jason Macnak15f95e82019-08-21 21:52:02 -04003397 }
Jason Macnak15f95e82019-08-21 21:52:02 -04003398 const auto *stages = pipeline->raytracingPipelineCI.ptr()->pStages;
3399 const auto *groups = pipeline->raytracingPipelineCI.ptr()->pGroups;
3400
3401 uint32_t raygen_stages_found = 0;
John Zulaufe4474e72019-07-01 17:28:27 -06003402 for (uint32_t stage_index = 0; stage_index < pipeline->raytracingPipelineCI.stageCount; stage_index++) {
Jason Macnak15f95e82019-08-21 21:52:02 -04003403 const auto &stage = stages[stage_index];
Jeff Bolzfbe51582018-09-13 10:01:35 -05003404
John Zulaufe4474e72019-07-01 17:28:27 -06003405 const SHADER_MODULE_STATE *module = GetShaderModuleState(stage.module);
3406 const spirv_inst_iter entrypoint = FindEntrypoint(module, stage.pName, stage.stage);
Jeff Bolzfbe51582018-09-13 10:01:35 -05003407
John Zulaufe4474e72019-07-01 17:28:27 -06003408 skip |= ValidatePipelineShaderStage(&stage, pipeline, pipeline->stage_state[stage_index], module, entrypoint, false);
Jason Macnak15f95e82019-08-21 21:52:02 -04003409
3410 if (stage.stage == VK_SHADER_STAGE_RAYGEN_BIT_NV) {
3411 raygen_stages_found++;
3412 }
3413 }
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003414 if (raygen_stages_found == 0) {
3415 skip |= LogError(
3416 device,
3417 isKHR ? "VUID-VkRayTracingPipelineCreateInfoKHR-stage-03425" : "VUID-VkRayTracingPipelineCreateInfoNV-stage-03425",
3418 " : zero raygen stages specified");
Jason Macnak15f95e82019-08-21 21:52:02 -04003419 }
3420
3421 for (uint32_t group_index = 0; group_index < pipeline->raytracingPipelineCI.groupCount; group_index++) {
3422 const auto &group = groups[group_index];
3423
3424 if (group.type == VK_RAY_TRACING_SHADER_GROUP_TYPE_GENERAL_NV) {
3425 if (group.generalShader >= pipeline->raytracingPipelineCI.stageCount ||
3426 (stages[group.generalShader].stage != VK_SHADER_STAGE_RAYGEN_BIT_NV &&
3427 stages[group.generalShader].stage != VK_SHADER_STAGE_MISS_BIT_NV &&
3428 stages[group.generalShader].stage != VK_SHADER_STAGE_CALLABLE_BIT_NV)) {
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003429 skip |= LogError(device,
3430 isKHR ? "VUID-VkRayTracingShaderGroupCreateInfoKHR-type-03474"
3431 : "VUID-VkRayTracingShaderGroupCreateInfoNV-type-02413",
3432 ": pGroups[%d]", group_index);
Jason Macnak15f95e82019-08-21 21:52:02 -04003433 }
3434 if (group.anyHitShader != VK_SHADER_UNUSED_NV || group.closestHitShader != VK_SHADER_UNUSED_NV ||
3435 group.intersectionShader != VK_SHADER_UNUSED_NV) {
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003436 skip |= LogError(device,
3437 isKHR ? "VUID-VkRayTracingShaderGroupCreateInfoKHR-type-03475"
3438 : "VUID-VkRayTracingShaderGroupCreateInfoNV-type-02414",
3439 ": pGroups[%d]", group_index);
Jason Macnak15f95e82019-08-21 21:52:02 -04003440 }
3441 } else if (group.type == VK_RAY_TRACING_SHADER_GROUP_TYPE_PROCEDURAL_HIT_GROUP_NV) {
3442 if (group.intersectionShader >= pipeline->raytracingPipelineCI.stageCount ||
3443 stages[group.intersectionShader].stage != VK_SHADER_STAGE_INTERSECTION_BIT_NV) {
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003444 skip |= LogError(device,
3445 isKHR ? "VUID-VkRayTracingShaderGroupCreateInfoKHR-type-03476"
3446 : "VUID-VkRayTracingShaderGroupCreateInfoNV-type-02415",
3447 ": pGroups[%d]", group_index);
Jason Macnak15f95e82019-08-21 21:52:02 -04003448 }
3449 } else if (group.type == VK_RAY_TRACING_SHADER_GROUP_TYPE_TRIANGLES_HIT_GROUP_NV) {
3450 if (group.intersectionShader != VK_SHADER_UNUSED_NV) {
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003451 skip |= LogError(device,
3452 isKHR ? "VUID-VkRayTracingShaderGroupCreateInfoKHR-type-03477"
3453 : "VUID-VkRayTracingShaderGroupCreateInfoNV-type-02416",
3454 ": pGroups[%d]", group_index);
Jason Macnak15f95e82019-08-21 21:52:02 -04003455 }
3456 }
3457
3458 if (group.type == VK_RAY_TRACING_SHADER_GROUP_TYPE_PROCEDURAL_HIT_GROUP_NV ||
3459 group.type == VK_RAY_TRACING_SHADER_GROUP_TYPE_TRIANGLES_HIT_GROUP_NV) {
3460 if (group.anyHitShader != VK_SHADER_UNUSED_NV && (group.anyHitShader >= pipeline->raytracingPipelineCI.stageCount ||
3461 stages[group.anyHitShader].stage != VK_SHADER_STAGE_ANY_HIT_BIT_NV)) {
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003462 skip |= LogError(device,
3463 isKHR ? "VUID-VkRayTracingShaderGroupCreateInfoKHR-anyHitShader-03479"
3464 : "VUID-VkRayTracingShaderGroupCreateInfoNV-anyHitShader-02418",
3465 ": pGroups[%d]", group_index);
Jason Macnak15f95e82019-08-21 21:52:02 -04003466 }
3467 if (group.closestHitShader != VK_SHADER_UNUSED_NV &&
3468 (group.closestHitShader >= pipeline->raytracingPipelineCI.stageCount ||
3469 stages[group.closestHitShader].stage != VK_SHADER_STAGE_CLOSEST_HIT_BIT_NV)) {
Jeff Bolz443c2ca2020-03-19 12:11:51 -05003470 skip |= LogError(device,
3471 isKHR ? "VUID-VkRayTracingShaderGroupCreateInfoKHR-closestHitShader-03478"
3472 : "VUID-VkRayTracingShaderGroupCreateInfoNV-closestHitShader-02417",
3473 ": pGroups[%d]", group_index);
Jason Macnak15f95e82019-08-21 21:52:02 -04003474 }
3475 }
John Zulaufe4474e72019-07-01 17:28:27 -06003476 }
3477 return skip;
Jeff Bolzfbe51582018-09-13 10:01:35 -05003478}
3479
Dave Houltona9df0ce2018-02-07 10:51:23 -07003480uint32_t ValidationCache::MakeShaderHash(VkShaderModuleCreateInfo const *smci) { return XXH32(smci->pCode, smci->codeSize, 0); }
Chris Forbes9a61e082017-07-24 15:35:29 -07003481
Dave Houltona9df0ce2018-02-07 10:51:23 -07003482static ValidationCache *GetValidationCacheInfo(VkShaderModuleCreateInfo const *pCreateInfo) {
John Zulauf25ea2432019-04-05 10:07:38 -06003483 const auto validation_cache_ci = lvl_find_in_chain<VkShaderModuleValidationCacheCreateInfoEXT>(pCreateInfo->pNext);
3484 if (validation_cache_ci) {
John Zulauf146ee802019-04-05 15:31:06 -06003485 return CastFromHandle<ValidationCache *>(validation_cache_ci->validationCache);
Chris Forbes9a61e082017-07-24 15:35:29 -07003486 }
Chris Forbes9a61e082017-07-24 15:35:29 -07003487 return nullptr;
3488}
3489
Mark Lobodzinskib56bbb92019-02-18 11:49:59 -07003490bool CoreChecks::PreCallValidateCreateShaderModule(VkDevice device, const VkShaderModuleCreateInfo *pCreateInfo,
Jeff Bolz5c801d12019-10-09 10:38:45 -05003491 const VkAllocationCallbacks *pAllocator, VkShaderModule *pShaderModule) const {
Chris Forbes4ae55b32017-06-09 14:42:56 -07003492 bool skip = false;
3493 spv_result_t spv_valid = SPV_SUCCESS;
Chris Forbes4ae55b32017-06-09 14:42:56 -07003494
Mark Lobodzinski90eea5b2020-05-15 12:54:00 -06003495 if (disabled[shader_validation]) {
Chris Forbes4ae55b32017-06-09 14:42:56 -07003496 return false;
3497 }
3498
Mark Lobodzinskif45e45f2019-04-19 14:15:39 -06003499 auto have_glsl_shader = device_extensions.vk_nv_glsl_shader;
Chris Forbes4ae55b32017-06-09 14:42:56 -07003500
3501 if (!have_glsl_shader && (pCreateInfo->codeSize % 4)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003502 skip |= LogError(device, "VUID-VkShaderModuleCreateInfo-pCode-01376",
3503 "SPIR-V module not valid: Codesize must be a multiple of 4 but is " PRINTF_SIZE_T_SPECIFIER ".",
3504 pCreateInfo->codeSize);
Chris Forbes4ae55b32017-06-09 14:42:56 -07003505 } else {
Chris Forbes9a61e082017-07-24 15:35:29 -07003506 auto cache = GetValidationCacheInfo(pCreateInfo);
3507 uint32_t hash = 0;
3508 if (cache) {
3509 hash = ValidationCache::MakeShaderHash(pCreateInfo);
Dave Houltona9df0ce2018-02-07 10:51:23 -07003510 if (cache->Contains(hash)) return false;
Chris Forbes9a61e082017-07-24 15:35:29 -07003511 }
3512
Jeremy Hayesb3e4d532019-08-16 10:08:49 -06003513 // Use SPIRV-Tools validator to try and catch any issues with the module itself. If specialization constants are present,
3514 // the default values will be used during validation.
Tony-LunarG8a51b7d2020-07-01 15:57:23 -06003515 spv_target_env spirv_environment = PickSpirvEnv(api_version, (device_extensions.vk_khr_spirv_1_4 != kNotEnabled));
Dave Houlton0ea2d012018-06-21 14:00:26 -06003516 spv_context ctx = spvContextCreate(spirv_environment);
Dave Houltona9df0ce2018-02-07 10:51:23 -07003517 spv_const_binary_t binary{pCreateInfo->pCode, pCreateInfo->codeSize / sizeof(uint32_t)};
Chris Forbes4ae55b32017-06-09 14:42:56 -07003518 spv_diagnostic diag = nullptr;
Tony-LunarG9fe69a42020-07-23 15:09:37 -06003519 spvtools::ValidatorOptions options;
3520 AdjustValidatorOptions(device_extensions, enabled_features, options);
Karl Schultzfda1b382018-08-08 18:56:11 -06003521 spv_valid = spvValidateWithOptions(ctx, options, &binary, &diag);
Chris Forbes4ae55b32017-06-09 14:42:56 -07003522 if (spv_valid != SPV_SUCCESS) {
3523 if (!have_glsl_shader || (pCreateInfo->pCode[0] == spv::MagicNumber)) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003524 if (spv_valid == SPV_WARNING) {
3525 skip |= LogWarning(device, kVUID_Core_Shader_InconsistentSpirv, "SPIR-V module not valid: %s",
3526 diag && diag->error ? diag->error : "(no error text)");
3527 } else {
3528 skip |= LogError(device, kVUID_Core_Shader_InconsistentSpirv, "SPIR-V module not valid: %s",
3529 diag && diag->error ? diag->error : "(no error text)");
3530 }
Chris Forbes4ae55b32017-06-09 14:42:56 -07003531 }
Chris Forbes9a61e082017-07-24 15:35:29 -07003532 } else {
3533 if (cache) {
3534 cache->Insert(hash);
3535 }
Chris Forbes4ae55b32017-06-09 14:42:56 -07003536 }
3537
3538 spvDiagnosticDestroy(diag);
3539 spvContextDestroy(ctx);
3540 }
3541
Chris Forbes4ae55b32017-06-09 14:42:56 -07003542 return skip;
Mark Lobodzinski01734072019-02-13 17:39:15 -07003543}
3544
John Zulaufac4c6e12019-07-01 16:05:58 -06003545bool CoreChecks::ValidateComputeWorkGroupSizes(const SHADER_MODULE_STATE *shader) const {
Lockeaa8fdc02019-04-02 11:59:20 -06003546 bool skip = false;
3547 uint32_t local_size_x = 0;
3548 uint32_t local_size_y = 0;
3549 uint32_t local_size_z = 0;
3550 if (FindLocalSize(shader, local_size_x, local_size_y, local_size_z)) {
3551 if (local_size_x > phys_dev_props.limits.maxComputeWorkGroupSize[0]) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003552 skip |= LogError(shader->vk_shader_module, "UNASSIGNED-features-limits-maxComputeWorkGroupSize",
3553 "%s local_size_x (%" PRIu32 ") exceeds device limit maxComputeWorkGroupSize[0] (%" PRIu32 ").",
3554 report_data->FormatHandle(shader->vk_shader_module).c_str(), local_size_x,
3555 phys_dev_props.limits.maxComputeWorkGroupSize[0]);
Lockeaa8fdc02019-04-02 11:59:20 -06003556 }
3557 if (local_size_y > phys_dev_props.limits.maxComputeWorkGroupSize[1]) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003558 skip |= LogError(shader->vk_shader_module, "UNASSIGNED-features-limits-maxComputeWorkGroupSize",
3559 "%s local_size_y (%" PRIu32 ") exceeds device limit maxComputeWorkGroupSize[1] (%" PRIu32 ").",
3560 report_data->FormatHandle(shader->vk_shader_module).c_str(), local_size_x,
3561 phys_dev_props.limits.maxComputeWorkGroupSize[1]);
Lockeaa8fdc02019-04-02 11:59:20 -06003562 }
3563 if (local_size_z > phys_dev_props.limits.maxComputeWorkGroupSize[2]) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003564 skip |= LogError(shader->vk_shader_module, "UNASSIGNED-features-limits-maxComputeWorkGroupSize",
3565 "%s local_size_z (%" PRIu32 ") exceeds device limit maxComputeWorkGroupSize[2] (%" PRIu32 ").",
3566 report_data->FormatHandle(shader->vk_shader_module).c_str(), local_size_x,
3567 phys_dev_props.limits.maxComputeWorkGroupSize[2]);
Lockeaa8fdc02019-04-02 11:59:20 -06003568 }
3569
3570 uint32_t limit = phys_dev_props.limits.maxComputeWorkGroupInvocations;
3571 uint64_t invocations = local_size_x * local_size_y;
3572 // Prevent overflow.
3573 bool fail = false;
3574 if (invocations > UINT32_MAX || invocations > limit) {
3575 fail = true;
3576 }
3577 if (!fail) {
3578 invocations *= local_size_z;
3579 if (invocations > UINT32_MAX || invocations > limit) {
3580 fail = true;
3581 }
3582 }
3583 if (fail) {
Mark Lobodzinski12b9be92020-01-30 15:25:55 -07003584 skip |= LogError(shader->vk_shader_module, "UNASSIGNED-features-limits-maxComputeWorkGroupInvocations",
3585 "%s local_size (%" PRIu32 ", %" PRIu32 ", %" PRIu32
3586 ") exceeds device limit maxComputeWorkGroupInvocations (%" PRIu32 ").",
3587 report_data->FormatHandle(shader->vk_shader_module).c_str(), local_size_x, local_size_y, local_size_z,
3588 limit);
Lockeaa8fdc02019-04-02 11:59:20 -06003589 }
3590 }
3591 return skip;
3592}
Tony-LunarG8a51b7d2020-07-01 15:57:23 -06003593
3594spv_target_env PickSpirvEnv(uint32_t api_version, bool spirv_1_4) {
3595 if (api_version >= VK_API_VERSION_1_2) {
3596 return SPV_ENV_VULKAN_1_2;
3597 } else if (api_version >= VK_API_VERSION_1_1) {
3598 if (spirv_1_4) {
3599 return SPV_ENV_VULKAN_1_1_SPIRV_1_4;
3600 } else {
3601 return SPV_ENV_VULKAN_1_1;
3602 }
3603 }
3604 return SPV_ENV_VULKAN_1_0;
3605}
Tony-LunarG9fe69a42020-07-23 15:09:37 -06003606
3607void AdjustValidatorOptions(const DeviceExtensions device_extensions, const DeviceFeatures enabled_features,
3608 spvtools::ValidatorOptions &options) {
3609 if (device_extensions.vk_khr_relaxed_block_layout) {
3610 options.SetRelaxBlockLayout(true);
3611 }
3612 if (device_extensions.vk_khr_uniform_buffer_standard_layout && enabled_features.core12.uniformBufferStandardLayout == VK_TRUE) {
3613 options.SetUniformBufferStandardLayout(true);
3614 }
3615 if (device_extensions.vk_ext_scalar_block_layout && enabled_features.core12.scalarBlockLayout == VK_TRUE) {
3616 options.SetScalarBlockLayout(true);
3617 }
3618}