blob: c896f28c3804f920fc6ad22303bd0e511374382e [file] [log] [blame]
sfricke-samsungdb3f3f82022-01-18 06:41:15 -08001/* Copyright (c) 2021-2022 The Khronos Group Inc.
sfricke-samsung962cad92021-04-13 00:46:29 -07002 *
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at
6 *
7 * http://www.apache.org/licenses/LICENSE-2.0
8 *
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
14 *
15 * Author: Spencer Fricke <s.fricke@samsung.com>
16 */
17
18#include "shader_module.h"
19
20#include <sstream>
21#include <string>
22
23#include "vk_layer_data.h"
24#include "vk_layer_utils.h"
Jeremy Gebben5d970742021-05-31 16:04:14 -060025#include "pipeline_state.h"
26#include "descriptor_sets.h"
sfricke-samsung3c5dee22021-10-14 09:58:14 -070027#include "spirv_grammar_helper.h"
sfricke-samsung962cad92021-04-13 00:46:29 -070028
29void decoration_set::merge(decoration_set const &other) {
30 if (other.flags & location_bit) location = other.location;
31 if (other.flags & component_bit) component = other.component;
32 if (other.flags & input_attachment_index_bit) input_attachment_index = other.input_attachment_index;
33 if (other.flags & descriptor_set_bit) descriptor_set = other.descriptor_set;
34 if (other.flags & binding_bit) binding = other.binding;
35 if (other.flags & builtin_bit) builtin = other.builtin;
36 flags |= other.flags;
37}
38
39void decoration_set::add(uint32_t decoration, uint32_t value) {
40 switch (decoration) {
41 case spv::DecorationLocation:
42 flags |= location_bit;
43 location = value;
44 break;
45 case spv::DecorationPatch:
46 flags |= patch_bit;
47 break;
48 case spv::DecorationRelaxedPrecision:
49 flags |= relaxed_precision_bit;
50 break;
51 case spv::DecorationBlock:
52 flags |= block_bit;
53 break;
54 case spv::DecorationBufferBlock:
55 flags |= buffer_block_bit;
56 break;
57 case spv::DecorationComponent:
58 flags |= component_bit;
59 component = value;
60 break;
61 case spv::DecorationInputAttachmentIndex:
62 flags |= input_attachment_index_bit;
63 input_attachment_index = value;
64 break;
65 case spv::DecorationDescriptorSet:
66 flags |= descriptor_set_bit;
67 descriptor_set = value;
68 break;
69 case spv::DecorationBinding:
70 flags |= binding_bit;
71 binding = value;
72 break;
73 case spv::DecorationNonWritable:
74 flags |= nonwritable_bit;
75 break;
76 case spv::DecorationBuiltIn:
77 flags |= builtin_bit;
78 builtin = value;
79 break;
Lionel Landwerlin38d2e122021-07-21 14:21:47 +030080 case spv::DecorationNonReadable:
81 flags |= nonreadable_bit;
82 break;
ziga-lunarg9e94e112021-09-27 00:21:10 +020083 case spv::DecorationPerVertexNV:
84 flags |= per_vertex_bit;
85 break;
86 case spv::DecorationPassthroughNV:
87 flags |= passthrough_bit;
88 break;
sfricke-samsung962cad92021-04-13 00:46:29 -070089 }
90}
91
92std::string shader_struct_member::GetLocationDesc(uint32_t index_used_bytes) const {
93 std::string desc = "";
94 if (array_length_hierarchy.size() > 0) {
95 desc += " index:";
96 for (const auto block_size : array_block_size) {
97 desc += "[";
98 desc += std::to_string(index_used_bytes / (block_size * size));
99 desc += "]";
100 index_used_bytes = index_used_bytes % (block_size * size);
101 }
102 }
103 const int struct_members_size = static_cast<int>(struct_members.size());
104 if (struct_members_size > 0) {
105 desc += " member:";
106 for (int i = struct_members_size - 1; i >= 0; --i) {
107 if (index_used_bytes > struct_members[i].offset) {
108 desc += std::to_string(i);
109 desc += struct_members[i].GetLocationDesc(index_used_bytes - struct_members[i].offset);
110 break;
111 }
112 }
113 } else {
114 desc += " offset:";
115 desc += std::to_string(index_used_bytes);
116 }
117 return desc;
118}
119
120static unsigned ExecutionModelToShaderStageFlagBits(unsigned mode) {
121 switch (mode) {
122 case spv::ExecutionModelVertex:
123 return VK_SHADER_STAGE_VERTEX_BIT;
124 case spv::ExecutionModelTessellationControl:
125 return VK_SHADER_STAGE_TESSELLATION_CONTROL_BIT;
126 case spv::ExecutionModelTessellationEvaluation:
127 return VK_SHADER_STAGE_TESSELLATION_EVALUATION_BIT;
128 case spv::ExecutionModelGeometry:
129 return VK_SHADER_STAGE_GEOMETRY_BIT;
130 case spv::ExecutionModelFragment:
131 return VK_SHADER_STAGE_FRAGMENT_BIT;
132 case spv::ExecutionModelGLCompute:
133 return VK_SHADER_STAGE_COMPUTE_BIT;
134 case spv::ExecutionModelRayGenerationNV:
135 return VK_SHADER_STAGE_RAYGEN_BIT_NV;
136 case spv::ExecutionModelAnyHitNV:
137 return VK_SHADER_STAGE_ANY_HIT_BIT_NV;
138 case spv::ExecutionModelClosestHitNV:
139 return VK_SHADER_STAGE_CLOSEST_HIT_BIT_NV;
140 case spv::ExecutionModelMissNV:
141 return VK_SHADER_STAGE_MISS_BIT_NV;
142 case spv::ExecutionModelIntersectionNV:
143 return VK_SHADER_STAGE_INTERSECTION_BIT_NV;
144 case spv::ExecutionModelCallableNV:
145 return VK_SHADER_STAGE_CALLABLE_BIT_NV;
146 case spv::ExecutionModelTaskNV:
147 return VK_SHADER_STAGE_TASK_BIT_NV;
148 case spv::ExecutionModelMeshNV:
149 return VK_SHADER_STAGE_MESH_BIT_NV;
150 default:
151 return 0;
152 }
153}
154
155// For some analyses, we need to know about all ids referenced by the static call tree of a particular entrypoint. This is
156// important for identifying the set of shader resources actually used by an entrypoint, for example.
157// Note: we only explore parts of the image which might actually contain ids we care about for the above analyses.
158// - NOT the shader input/output interfaces.
159//
160// TODO: The set of interesting opcodes here was determined by eyeballing the SPIRV spec. It might be worth
161// converting parts of this to be generated from the machine-readable spec instead.
162layer_data::unordered_set<uint32_t> SHADER_MODULE_STATE::MarkAccessibleIds(spirv_inst_iter entrypoint) const {
163 layer_data::unordered_set<uint32_t> ids;
Jeremy Gebben84b838b2021-08-23 08:41:39 -0600164 if (entrypoint == end() || !has_valid_spirv) {
165 return ids;
166 }
sfricke-samsung962cad92021-04-13 00:46:29 -0700167 layer_data::unordered_set<uint32_t> worklist;
168 worklist.insert(entrypoint.word(2));
169
170 while (!worklist.empty()) {
171 auto id_iter = worklist.begin();
172 auto id = *id_iter;
173 worklist.erase(id_iter);
174
175 auto insn = get_def(id);
176 if (insn == end()) {
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -0600177 // ID is something we didn't collect in SpirvStaticData. that's OK -- we'll stumble across all kinds of things here
sfricke-samsung962cad92021-04-13 00:46:29 -0700178 // that we may not care about.
179 continue;
180 }
181
182 // Try to add to the output set
183 if (!ids.insert(id).second) {
184 continue; // If we already saw this id, we don't want to walk it again.
185 }
186
187 switch (insn.opcode()) {
188 case spv::OpFunction:
189 // Scan whole body of the function, enlisting anything interesting
190 while (++insn, insn.opcode() != spv::OpFunctionEnd) {
191 switch (insn.opcode()) {
192 case spv::OpLoad:
193 worklist.insert(insn.word(3)); // ptr
194 break;
195 case spv::OpStore:
196 worklist.insert(insn.word(1)); // ptr
197 break;
198 case spv::OpAccessChain:
199 case spv::OpInBoundsAccessChain:
200 worklist.insert(insn.word(3)); // base ptr
201 break;
202 case spv::OpSampledImage:
203 case spv::OpImageSampleImplicitLod:
204 case spv::OpImageSampleExplicitLod:
205 case spv::OpImageSampleDrefImplicitLod:
206 case spv::OpImageSampleDrefExplicitLod:
207 case spv::OpImageSampleProjImplicitLod:
208 case spv::OpImageSampleProjExplicitLod:
209 case spv::OpImageSampleProjDrefImplicitLod:
210 case spv::OpImageSampleProjDrefExplicitLod:
211 case spv::OpImageFetch:
212 case spv::OpImageGather:
213 case spv::OpImageDrefGather:
214 case spv::OpImageRead:
215 case spv::OpImage:
216 case spv::OpImageQueryFormat:
217 case spv::OpImageQueryOrder:
218 case spv::OpImageQuerySizeLod:
219 case spv::OpImageQuerySize:
220 case spv::OpImageQueryLod:
221 case spv::OpImageQueryLevels:
222 case spv::OpImageQuerySamples:
223 case spv::OpImageSparseSampleImplicitLod:
224 case spv::OpImageSparseSampleExplicitLod:
225 case spv::OpImageSparseSampleDrefImplicitLod:
226 case spv::OpImageSparseSampleDrefExplicitLod:
227 case spv::OpImageSparseSampleProjImplicitLod:
228 case spv::OpImageSparseSampleProjExplicitLod:
229 case spv::OpImageSparseSampleProjDrefImplicitLod:
230 case spv::OpImageSparseSampleProjDrefExplicitLod:
231 case spv::OpImageSparseFetch:
232 case spv::OpImageSparseGather:
233 case spv::OpImageSparseDrefGather:
234 case spv::OpImageTexelPointer:
235 worklist.insert(insn.word(3)); // Image or sampled image
236 break;
237 case spv::OpImageWrite:
238 worklist.insert(insn.word(1)); // Image -- different operand order to above
239 break;
240 case spv::OpFunctionCall:
241 for (uint32_t i = 3; i < insn.len(); i++) {
242 worklist.insert(insn.word(i)); // fn itself, and all args
243 }
244 break;
245
246 case spv::OpExtInst:
247 for (uint32_t i = 5; i < insn.len(); i++) {
248 worklist.insert(insn.word(i)); // Operands to ext inst
249 }
250 break;
251
252 default: {
253 if (AtomicOperation(insn.opcode())) {
254 if (insn.opcode() == spv::OpAtomicStore) {
255 worklist.insert(insn.word(1)); // ptr
256 } else {
257 worklist.insert(insn.word(3)); // ptr
258 }
259 }
260 break;
261 }
262 }
263 }
264 break;
265 }
266 }
267
268 return ids;
269}
270
Jeremy Gebben84b838b2021-08-23 08:41:39 -0600271layer_data::optional<VkPrimitiveTopology> SHADER_MODULE_STATE::GetTopology(const spirv_inst_iter &entrypoint) const {
272 layer_data::optional<VkPrimitiveTopology> result;
273
sfricke-samsung962cad92021-04-13 00:46:29 -0700274 auto entrypoint_id = entrypoint.word(2);
275 bool is_point_mode = false;
276
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -0600277 auto it = static_data_.execution_mode_inst.find(entrypoint_id);
278 if (it != static_data_.execution_mode_inst.end()) {
sfricke-samsung962cad92021-04-13 00:46:29 -0700279 for (auto insn : it->second) {
280 switch (insn.word(2)) {
281 case spv::ExecutionModePointMode:
282 // In tessellation shaders, PointMode is separate and trumps the tessellation topology.
283 is_point_mode = true;
284 break;
285
286 case spv::ExecutionModeOutputPoints:
Jeremy Gebben84b838b2021-08-23 08:41:39 -0600287 result.emplace(VK_PRIMITIVE_TOPOLOGY_POINT_LIST);
sfricke-samsung962cad92021-04-13 00:46:29 -0700288 break;
289
290 case spv::ExecutionModeIsolines:
291 case spv::ExecutionModeOutputLineStrip:
Ricardo Garcia122f8f02021-09-28 16:47:19 +0200292 case spv::ExecutionModeOutputLinesNV:
Jeremy Gebben84b838b2021-08-23 08:41:39 -0600293 result.emplace(VK_PRIMITIVE_TOPOLOGY_LINE_STRIP);
sfricke-samsung962cad92021-04-13 00:46:29 -0700294 break;
295
296 case spv::ExecutionModeTriangles:
297 case spv::ExecutionModeQuads:
298 case spv::ExecutionModeOutputTriangleStrip:
299 case spv::ExecutionModeOutputTrianglesNV:
Jeremy Gebben84b838b2021-08-23 08:41:39 -0600300 result.emplace(VK_PRIMITIVE_TOPOLOGY_TRIANGLE_STRIP);
sfricke-samsung962cad92021-04-13 00:46:29 -0700301 break;
302 }
303 }
304 }
305
Jeremy Gebben84b838b2021-08-23 08:41:39 -0600306 if (is_point_mode) {
307 result.emplace(VK_PRIMITIVE_TOPOLOGY_POINT_LIST);
308 }
309
310 return result;
sfricke-samsung962cad92021-04-13 00:46:29 -0700311}
312
sfricke-samsungef15e482022-01-26 11:32:49 -0800313SHADER_MODULE_STATE::SpirvStaticData::SpirvStaticData(const SHADER_MODULE_STATE &module_state) {
314 for (auto insn : module_state) {
sfricke-samsung962cad92021-04-13 00:46:29 -0700315 switch (insn.opcode()) {
316 // Types
317 case spv::OpTypeVoid:
318 case spv::OpTypeBool:
319 case spv::OpTypeInt:
320 case spv::OpTypeFloat:
321 case spv::OpTypeVector:
322 case spv::OpTypeMatrix:
323 case spv::OpTypeImage:
324 case spv::OpTypeSampler:
325 case spv::OpTypeSampledImage:
326 case spv::OpTypeArray:
327 case spv::OpTypeRuntimeArray:
328 case spv::OpTypeStruct:
329 case spv::OpTypeOpaque:
330 case spv::OpTypePointer:
331 case spv::OpTypeFunction:
332 case spv::OpTypeEvent:
333 case spv::OpTypeDeviceEvent:
334 case spv::OpTypeReserveId:
335 case spv::OpTypeQueue:
336 case spv::OpTypePipe:
337 case spv::OpTypeAccelerationStructureNV:
338 case spv::OpTypeCooperativeMatrixNV:
339 def_index[insn.word(1)] = insn.offset();
340 break;
341
342 // Fixed constants
343 case spv::OpConstantTrue:
344 case spv::OpConstantFalse:
345 case spv::OpConstant:
346 case spv::OpConstantComposite:
347 case spv::OpConstantSampler:
348 case spv::OpConstantNull:
349 def_index[insn.word(2)] = insn.offset();
350 break;
351
352 // Specialization constants
353 case spv::OpSpecConstantTrue:
354 case spv::OpSpecConstantFalse:
355 case spv::OpSpecConstant:
356 case spv::OpSpecConstantComposite:
357 case spv::OpSpecConstantOp:
358 def_index[insn.word(2)] = insn.offset();
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -0600359 has_specialization_constants = true;
sfricke-samsung962cad92021-04-13 00:46:29 -0700360 break;
361
sfricke-samsung58b84352021-07-31 21:41:04 -0700362 // Have a result that can be a pointer
sfricke-samsung962cad92021-04-13 00:46:29 -0700363 case spv::OpVariable:
sfricke-samsung58b84352021-07-31 21:41:04 -0700364 case spv::OpAccessChain:
365 case spv::OpInBoundsAccessChain:
366 case spv::OpFunctionParameter:
367 case spv::OpImageTexelPointer:
sfricke-samsung962cad92021-04-13 00:46:29 -0700368 def_index[insn.word(2)] = insn.offset();
369 break;
370
sfricke-samsungdb3f3f82022-01-18 06:41:15 -0800371 // Will need to extract loads for SAMPLED_IMAGE and SAMPLER
372 case spv::OpSampledImage:
373 def_index[insn.word(2)] = insn.offset();
374 break;
375
sfricke-samsung962cad92021-04-13 00:46:29 -0700376 // Functions
377 case spv::OpFunction:
378 def_index[insn.word(2)] = insn.offset();
sfricke-samsung962cad92021-04-13 00:46:29 -0700379 break;
380
381 // Decorations
382 case spv::OpDecorate: {
383 auto target_id = insn.word(1);
384 decorations[target_id].add(insn.word(2), insn.len() > 3u ? insn.word(3) : 0u);
385 decoration_inst.push_back(insn);
386 if (insn.word(2) == spv::DecorationBuiltIn) {
387 builtin_decoration_list.emplace_back(insn.offset(), static_cast<spv::BuiltIn>(insn.word(3)));
Nathaniel Cesariocf69bda2021-06-22 13:23:42 -0600388 } else if (insn.word(2) == spv::DecorationSpecId) {
389 spec_const_map[insn.word(3)] = target_id;
sfricke-samsung962cad92021-04-13 00:46:29 -0700390 }
391
392 } break;
393 case spv::OpGroupDecorate: {
394 auto const &src = decorations[insn.word(1)];
395 for (auto i = 2u; i < insn.len(); i++) decorations[insn.word(i)].merge(src);
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -0600396 has_group_decoration = true;
397 } break;
398 case spv::OpDecorationGroup:
399 case spv::OpGroupMemberDecorate: {
400 has_group_decoration = true;
sfricke-samsung962cad92021-04-13 00:46:29 -0700401 } break;
402 case spv::OpMemberDecorate: {
403 member_decoration_inst.push_back(insn);
404 if (insn.word(3) == spv::DecorationBuiltIn) {
405 builtin_decoration_list.emplace_back(insn.offset(), static_cast<spv::BuiltIn>(insn.word(4)));
406 }
407 } break;
408
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -0600409 // Copy operations
410 case spv::OpCopyLogical:
411 case spv::OpCopyObject: {
412 def_index[insn.word(2)] = insn.offset();
413 break;
414 }
sfricke-samsung962cad92021-04-13 00:46:29 -0700415
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -0600416 // Execution Mode
417 case spv::OpExecutionMode: {
418 execution_mode_inst[insn.word(1)].push_back(insn);
419 } break;
420
421 case spv::OpLoad: {
422 def_index[insn.word(2)] = insn.offset();
423 } break;
424
425 default:
426 if (AtomicOperation(insn.opcode()) == true) {
427 // All atomics have a pointer referenced
428 spirv_inst_iter access;
429 if (insn.opcode() == spv::OpAtomicStore) {
sfricke-samsungef15e482022-01-26 11:32:49 -0800430 access = module_state.get_def(insn.word(1));
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -0600431 } else {
sfricke-samsungef15e482022-01-26 11:32:49 -0800432 access = module_state.get_def(insn.word(3));
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -0600433 def_index[insn.word(2)] = insn.offset();
434 }
435
436 atomic_instruction atomic;
437
sfricke-samsungef15e482022-01-26 11:32:49 -0800438 auto pointer = module_state.get_def(access.word(1));
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -0600439 // spirv-val should catch if not pointer
440 assert(pointer.opcode() == spv::OpTypePointer);
441 atomic.storage_class = pointer.word(2);
442
sfricke-samsungef15e482022-01-26 11:32:49 -0800443 auto data_type = module_state.get_def(pointer.word(3));
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -0600444 atomic.type = data_type.opcode();
445
446 // TODO - Should have a proper GetBitWidth like spirv-val does
447 assert(data_type.opcode() == spv::OpTypeFloat || data_type.opcode() == spv::OpTypeInt);
448 atomic.bit_width = data_type.word(2);
449
450 atomic_inst[insn.offset()] = atomic;
451 }
452 // We don't care about any other defs for now.
453 break;
454 }
455 }
456
sfricke-samsungef15e482022-01-26 11:32:49 -0800457 entry_points = SHADER_MODULE_STATE::ProcessEntryPoints(module_state);
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -0600458 multiple_entry_points = entry_points.size() > 1;
459}
460
461// static
462std::unordered_multimap<std::string, SHADER_MODULE_STATE::EntryPoint> SHADER_MODULE_STATE::ProcessEntryPoints(
sfricke-samsungef15e482022-01-26 11:32:49 -0800463 const SHADER_MODULE_STATE &module_state) {
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -0600464 std::unordered_multimap<std::string, SHADER_MODULE_STATE::EntryPoint> entry_points;
465 function_set func_set = {};
466 EntryPoint *entry_point = nullptr;
467
sfricke-samsungef15e482022-01-26 11:32:49 -0800468 for (auto insn : module_state) {
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -0600469 // offset is not 0, it means it's updated and the offset is in a Function.
470 if (func_set.offset) {
471 func_set.op_lists.emplace(insn.opcode(), insn.offset());
472 } else if (entry_point) {
473 entry_point->decorate_list.emplace(insn.opcode(), insn.offset());
474 }
475
476 switch (insn.opcode()) {
477 // Functions
478 case spv::OpFunction:
479 func_set.id = insn.word(2);
480 func_set.offset = insn.offset();
481 func_set.op_lists.clear();
482 break;
483
484 // Entry points ... add to the entrypoint table
485 case spv::OpEntryPoint: {
sfricke-samsung962cad92021-04-13 00:46:29 -0700486 // Entry points do not have an id (the id is the function id) and thus need their own table
487 auto entrypoint_name = reinterpret_cast<char const *>(&insn.word(3));
488 auto execution_model = insn.word(1);
489 auto entrypoint_stage = ExecutionModelToShaderStageFlagBits(execution_model);
490 entry_points.emplace(entrypoint_name,
491 EntryPoint{insn.offset(), static_cast<VkShaderStageFlagBits>(entrypoint_stage)});
492
493 auto range = entry_points.equal_range(entrypoint_name);
494 for (auto it = range.first; it != range.second; ++it) {
495 if (it->second.offset == insn.offset()) {
496 entry_point = &(it->second);
497 break;
498 }
499 }
500 assert(entry_point != nullptr);
501 break;
502 }
503 case spv::OpFunctionEnd: {
504 assert(entry_point != nullptr);
505 func_set.length = insn.offset() - func_set.offset;
506 entry_point->function_set_list.emplace_back(func_set);
507 break;
508 }
sfricke-samsung962cad92021-04-13 00:46:29 -0700509 }
510 }
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -0600511
sfricke-samsungef15e482022-01-26 11:32:49 -0800512 SHADER_MODULE_STATE::SetPushConstantUsedInShader(module_state, entry_points);
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -0600513 return entry_points;
sfricke-samsung962cad92021-04-13 00:46:29 -0700514}
515
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -0600516void SHADER_MODULE_STATE::PreprocessShaderBinary(const spv_target_env env) {
517 if (static_data_.has_group_decoration) {
sfricke-samsung962cad92021-04-13 00:46:29 -0700518 spvtools::Optimizer optimizer(env);
519 optimizer.RegisterPass(spvtools::CreateFlattenDecorationPass());
520 std::vector<uint32_t> optimized_binary;
521 // Run optimizer to flatten decorations only, set skip_validation so as to not re-run validator
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -0600522 auto result = optimizer.Run(words.data(), words.size(), &optimized_binary, spvtools::ValidatorOptions(), true);
523
sfricke-samsung962cad92021-04-13 00:46:29 -0700524 if (result) {
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -0600525 // NOTE: We need to update words with the result from the spirv-tools optimizer.
526 // **THIS ONLY HAPPENS ON INITIALIZATION**. words should remain const for the lifetime
527 // of the SHADER_MODULE_STATE instance.
528 *const_cast<std::vector<uint32_t> *>(&words) = std::move(optimized_binary);
sfricke-samsung962cad92021-04-13 00:46:29 -0700529 }
530 }
sfricke-samsung962cad92021-04-13 00:46:29 -0700531}
532
sfricke-samsung58b84352021-07-31 21:41:04 -0700533char const *StorageClassName(unsigned sc) {
sfricke-samsung962cad92021-04-13 00:46:29 -0700534 switch (sc) {
535 case spv::StorageClassInput:
536 return "input";
537 case spv::StorageClassOutput:
538 return "output";
539 case spv::StorageClassUniformConstant:
540 return "const uniform";
541 case spv::StorageClassUniform:
542 return "uniform";
543 case spv::StorageClassWorkgroup:
544 return "workgroup local";
545 case spv::StorageClassCrossWorkgroup:
546 return "workgroup global";
547 case spv::StorageClassPrivate:
548 return "private global";
549 case spv::StorageClassFunction:
550 return "function";
551 case spv::StorageClassGeneric:
552 return "generic";
553 case spv::StorageClassAtomicCounter:
554 return "atomic counter";
555 case spv::StorageClassImage:
556 return "image";
557 case spv::StorageClassPushConstant:
558 return "push constant";
559 case spv::StorageClassStorageBuffer:
560 return "storage buffer";
561 default:
562 return "unknown";
563 }
564}
565
566void SHADER_MODULE_STATE::DescribeTypeInner(std::ostringstream &ss, unsigned type) const {
567 auto insn = get_def(type);
568 assert(insn != end());
569
570 switch (insn.opcode()) {
571 case spv::OpTypeBool:
572 ss << "bool";
573 break;
574 case spv::OpTypeInt:
575 ss << (insn.word(3) ? 's' : 'u') << "int" << insn.word(2);
576 break;
577 case spv::OpTypeFloat:
578 ss << "float" << insn.word(2);
579 break;
580 case spv::OpTypeVector:
581 ss << "vec" << insn.word(3) << " of ";
582 DescribeTypeInner(ss, insn.word(2));
583 break;
584 case spv::OpTypeMatrix:
585 ss << "mat" << insn.word(3) << " of ";
586 DescribeTypeInner(ss, insn.word(2));
587 break;
588 case spv::OpTypeArray:
589 ss << "arr[" << GetConstantValueById(insn.word(3)) << "] of ";
590 DescribeTypeInner(ss, insn.word(2));
591 break;
592 case spv::OpTypeRuntimeArray:
593 ss << "runtime arr[] of ";
594 DescribeTypeInner(ss, insn.word(2));
595 break;
596 case spv::OpTypePointer:
597 ss << "ptr to " << StorageClassName(insn.word(2)) << " ";
598 DescribeTypeInner(ss, insn.word(3));
599 break;
600 case spv::OpTypeStruct: {
601 ss << "struct of (";
602 for (unsigned i = 2; i < insn.len(); i++) {
603 DescribeTypeInner(ss, insn.word(i));
604 if (i == insn.len() - 1) {
605 ss << ")";
606 } else {
607 ss << ", ";
608 }
609 }
610 break;
611 }
612 case spv::OpTypeSampler:
613 ss << "sampler";
614 break;
615 case spv::OpTypeSampledImage:
616 ss << "sampler+";
617 DescribeTypeInner(ss, insn.word(2));
618 break;
619 case spv::OpTypeImage:
620 ss << "image(dim=" << insn.word(3) << ", sampled=" << insn.word(7) << ")";
621 break;
622 case spv::OpTypeAccelerationStructureNV:
623 ss << "accelerationStruture";
624 break;
625 default:
626 ss << "oddtype";
627 break;
628 }
629}
630
631std::string SHADER_MODULE_STATE::DescribeType(unsigned type) const {
632 std::ostringstream ss;
633 DescribeTypeInner(ss, type);
634 return ss.str();
635}
636
sfricke-samsung7a9bdca2022-01-24 14:38:03 -0800637std::string SHADER_MODULE_STATE::DescribeInstruction(const spirv_inst_iter &insn) const {
638 std::ostringstream ss;
639 const uint32_t opcode = insn.opcode();
640 uint32_t operand_offset = 1; // where to start printing operands
641 // common disassembled for SPIR-V is
642 // %result = Opcode %result_type %operands
643 if (OpcodeHasResult(opcode)) {
644 operand_offset++;
645 ss << "%" << (OpcodeHasType(opcode) ? insn.word(2) : insn.word(1)) << " = ";
646 }
647
648 ss << string_SpvOpcode(opcode);
649
650 if (OpcodeHasType(opcode)) {
651 operand_offset++;
652 ss << " %" << insn.word(1);
653 }
654
655 for (uint32_t i = operand_offset; i < insn.len(); i++) {
656 ss << " %" << insn.word(i);
657 }
658 return ss.str();
659}
660
sfricke-samsung962cad92021-04-13 00:46:29 -0700661const SHADER_MODULE_STATE::EntryPoint *SHADER_MODULE_STATE::FindEntrypointStruct(char const *name,
662 VkShaderStageFlagBits stageBits) const {
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -0600663 auto range = static_data_.entry_points.equal_range(name);
sfricke-samsung962cad92021-04-13 00:46:29 -0700664 for (auto it = range.first; it != range.second; ++it) {
665 if (it->second.stage == stageBits) {
666 return &(it->second);
667 }
668 }
669 return nullptr;
670}
671
672spirv_inst_iter SHADER_MODULE_STATE::FindEntrypoint(char const *name, VkShaderStageFlagBits stageBits) const {
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -0600673 auto range = static_data_.entry_points.equal_range(name);
sfricke-samsung962cad92021-04-13 00:46:29 -0700674 for (auto it = range.first; it != range.second; ++it) {
675 if (it->second.stage == stageBits) {
676 return at(it->second.offset);
677 }
678 }
679 return end();
680}
681
682// Because the following is legal, need the entry point
683// OpEntryPoint GLCompute %main "name_a"
684// OpEntryPoint GLCompute %main "name_b"
685bool SHADER_MODULE_STATE::FindLocalSize(const spirv_inst_iter &entrypoint, uint32_t &local_size_x, uint32_t &local_size_y,
686 uint32_t &local_size_z) const {
687 auto entrypoint_id = entrypoint.word(2);
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -0600688 auto it = static_data_.execution_mode_inst.find(entrypoint_id);
689 if (it != static_data_.execution_mode_inst.end()) {
sfricke-samsung962cad92021-04-13 00:46:29 -0700690 for (auto insn : it->second) {
691 // Future Note: For now, Vulkan doesn't have a valid mode that can makes use of OpExecutionModeId
692 // In the future if something like LocalSizeId is supported, the <id> will need to be checked also
693 assert(insn.opcode() == spv::OpExecutionMode);
694 if (insn.word(2) == spv::ExecutionModeLocalSize) {
695 local_size_x = insn.word(3);
696 local_size_y = insn.word(4);
697 local_size_z = insn.word(5);
698 return true;
699 }
700 }
701 }
702 return false;
703}
704
705// If the instruction at id is a constant or copy of a constant, returns a valid iterator pointing to that instruction.
706// Otherwise, returns src->end().
707spirv_inst_iter SHADER_MODULE_STATE::GetConstantDef(unsigned id) const {
708 auto value = get_def(id);
709
710 // If id is a copy, see where it was copied from
711 if ((end() != value) && ((value.opcode() == spv::OpCopyObject) || (value.opcode() == spv::OpCopyLogical))) {
712 id = value.word(3);
713 value = get_def(id);
714 }
715
716 if ((end() != value) && (value.opcode() == spv::OpConstant)) {
717 return value;
718 }
719 return end();
720}
721
722// Either returns the constant value described by the instruction at id, or 1
723uint32_t SHADER_MODULE_STATE::GetConstantValueById(unsigned id) const {
724 auto value = GetConstantDef(id);
725
726 if (end() == value) {
727 // TODO: Either ensure that the specialization transform is already performed on a module we're
728 // considering here, OR -- specialize on the fly now.
729 return 1;
730 }
731 return GetConstantValue(value);
732}
733
734// Returns an int32_t corresponding to the spv::Dim of the given resource, when positive, and corresponding to an unknown type, when
735// negative.
736int32_t SHADER_MODULE_STATE::GetShaderResourceDimensionality(const interface_var &resource) const {
737 auto type = get_def(resource.type_id);
738 while (true) {
739 switch (type.opcode()) {
740 case spv::OpTypeSampledImage:
741 type = get_def(type.word(2));
742 break;
743 case spv::OpTypePointer:
744 type = get_def(type.word(3));
745 break;
746 case spv::OpTypeImage:
747 return type.word(3);
748 default:
749 return -1;
750 }
751 }
752}
753
754unsigned SHADER_MODULE_STATE::GetLocationsConsumedByType(unsigned type, bool strip_array_level) const {
755 auto insn = get_def(type);
756 assert(insn != end());
757
758 switch (insn.opcode()) {
759 case spv::OpTypePointer:
760 // See through the ptr -- this is only ever at the toplevel for graphics shaders we're never actually passing
761 // pointers around.
762 return GetLocationsConsumedByType(insn.word(3), strip_array_level);
763 case spv::OpTypeArray:
764 if (strip_array_level) {
765 return GetLocationsConsumedByType(insn.word(2), false);
766 } else {
767 return GetConstantValueById(insn.word(3)) * GetLocationsConsumedByType(insn.word(2), false);
768 }
769 case spv::OpTypeMatrix:
770 // Num locations is the dimension * element size
771 return insn.word(3) * GetLocationsConsumedByType(insn.word(2), false);
772 case spv::OpTypeVector: {
773 auto scalar_type = get_def(insn.word(2));
774 auto bit_width =
775 (scalar_type.opcode() == spv::OpTypeInt || scalar_type.opcode() == spv::OpTypeFloat) ? scalar_type.word(2) : 32;
776
777 // Locations are 128-bit wide; 3- and 4-component vectors of 64 bit types require two.
778 return (bit_width * insn.word(3) + 127) / 128;
779 }
780 default:
781 // Everything else is just 1.
782 return 1;
783
784 // TODO: extend to handle 64bit scalar types, whose vectors may need multiple locations.
785 }
786}
787
788unsigned SHADER_MODULE_STATE::GetComponentsConsumedByType(unsigned type, bool strip_array_level) const {
789 auto insn = get_def(type);
790 assert(insn != end());
791
792 switch (insn.opcode()) {
793 case spv::OpTypePointer:
794 // See through the ptr -- this is only ever at the toplevel for graphics shaders we're never actually passing
795 // pointers around.
796 return GetComponentsConsumedByType(insn.word(3), strip_array_level);
797 case spv::OpTypeStruct: {
798 uint32_t sum = 0;
799 for (uint32_t i = 2; i < insn.len(); i++) { // i=2 to skip word(0) and word(1)=ID of struct
800 sum += GetComponentsConsumedByType(insn.word(i), false);
801 }
802 return sum;
803 }
804 case spv::OpTypeArray:
805 if (strip_array_level) {
806 return GetComponentsConsumedByType(insn.word(2), false);
807 } else {
808 return GetConstantValueById(insn.word(3)) * GetComponentsConsumedByType(insn.word(2), false);
809 }
810 case spv::OpTypeMatrix:
811 // Num locations is the dimension * element size
812 return insn.word(3) * GetComponentsConsumedByType(insn.word(2), false);
813 case spv::OpTypeVector: {
814 auto scalar_type = get_def(insn.word(2));
815 auto bit_width =
816 (scalar_type.opcode() == spv::OpTypeInt || scalar_type.opcode() == spv::OpTypeFloat) ? scalar_type.word(2) : 32;
817 // One component is 32-bit
818 return (bit_width * insn.word(3) + 31) / 32;
819 }
820 case spv::OpTypeFloat: {
821 auto bit_width = insn.word(2);
822 return (bit_width + 31) / 32;
823 }
824 case spv::OpTypeInt: {
825 auto bit_width = insn.word(2);
826 return (bit_width + 31) / 32;
827 }
828 case spv::OpConstant:
829 return GetComponentsConsumedByType(insn.word(1), false);
830 default:
831 return 0;
832 }
833}
834
835// characterizes a SPIR-V type appearing in an interface to a FF stage, for comparison to a VkFormat's characterization above.
836// also used for input attachments, as we statically know their format.
837unsigned SHADER_MODULE_STATE::GetFundamentalType(unsigned type) const {
838 auto insn = get_def(type);
839 assert(insn != end());
840
841 switch (insn.opcode()) {
842 case spv::OpTypeInt:
843 return insn.word(3) ? FORMAT_TYPE_SINT : FORMAT_TYPE_UINT;
844 case spv::OpTypeFloat:
845 return FORMAT_TYPE_FLOAT;
846 case spv::OpTypeVector:
847 case spv::OpTypeMatrix:
848 case spv::OpTypeArray:
849 case spv::OpTypeRuntimeArray:
850 case spv::OpTypeImage:
851 return GetFundamentalType(insn.word(2));
852 case spv::OpTypePointer:
853 return GetFundamentalType(insn.word(3));
854
855 default:
856 return 0;
857 }
858}
859
860spirv_inst_iter SHADER_MODULE_STATE::GetStructType(spirv_inst_iter def, bool is_array_of_verts) const {
861 while (true) {
862 if (def.opcode() == spv::OpTypePointer) {
863 def = get_def(def.word(3));
864 } else if (def.opcode() == spv::OpTypeArray && is_array_of_verts) {
865 def = get_def(def.word(2));
866 is_array_of_verts = false;
867 } else if (def.opcode() == spv::OpTypeStruct) {
868 return def;
869 } else {
870 return end();
871 }
872 }
873}
874
sfricke-samsungad55ccc2022-01-19 20:06:17 -0800875void SHADER_MODULE_STATE::DefineStructMember(const spirv_inst_iter &it, const std::vector<uint32_t> &member_decorate_offsets,
sfricke-samsung962cad92021-04-13 00:46:29 -0700876 shader_struct_member &data) const {
877 const auto struct_it = GetStructType(it, false);
878 assert(struct_it != end());
879 data.size = 0;
880
881 shader_struct_member data1;
882 uint32_t i = 2;
883 uint32_t local_offset = 0;
884 std::vector<uint32_t> offsets;
885 offsets.resize(struct_it.len() - i);
886
887 // The members of struct in SPRIV_R aren't always sort, so we need to know their order.
sfricke-samsungad55ccc2022-01-19 20:06:17 -0800888 for (const auto offset : member_decorate_offsets) {
sfricke-samsung962cad92021-04-13 00:46:29 -0700889 const auto member_decorate = at(offset);
890 if (member_decorate.word(1) != struct_it.word(1)) {
891 continue;
892 }
893
894 offsets[member_decorate.word(2)] = member_decorate.word(4);
895 }
896
897 for (const auto offset : offsets) {
898 local_offset = offset;
899 data1 = {};
900 data1.root = data.root;
901 data1.offset = local_offset;
902 auto def_member = get_def(struct_it.word(i));
903
904 // Array could be multi-dimensional
905 while (def_member.opcode() == spv::OpTypeArray) {
906 const auto len_id = def_member.word(3);
907 const auto def_len = get_def(len_id);
908 data1.array_length_hierarchy.emplace_back(def_len.word(3)); // array length
909 def_member = get_def(def_member.word(2));
910 }
911
912 if (def_member.opcode() == spv::OpTypeStruct) {
sfricke-samsungad55ccc2022-01-19 20:06:17 -0800913 DefineStructMember(def_member, member_decorate_offsets, data1);
sfricke-samsung962cad92021-04-13 00:46:29 -0700914 } else if (def_member.opcode() == spv::OpTypePointer) {
915 if (def_member.word(2) == spv::StorageClassPhysicalStorageBuffer) {
916 // If it's a pointer with PhysicalStorageBuffer class, this member is essentially a uint64_t containing an address
917 // that "points to something."
918 data1.size = 8;
919 } else {
920 // If it's OpTypePointer. it means the member is a buffer, the type will be TypePointer, and then struct
sfricke-samsungad55ccc2022-01-19 20:06:17 -0800921 DefineStructMember(def_member, member_decorate_offsets, data1);
sfricke-samsung962cad92021-04-13 00:46:29 -0700922 }
923 } else {
924 if (def_member.opcode() == spv::OpTypeMatrix) {
925 data1.array_length_hierarchy.emplace_back(def_member.word(3)); // matrix's columns. matrix's row is vector.
926 def_member = get_def(def_member.word(2));
927 }
928
929 if (def_member.opcode() == spv::OpTypeVector) {
930 data1.array_length_hierarchy.emplace_back(def_member.word(3)); // vector length
931 def_member = get_def(def_member.word(2));
932 }
933
934 // Get scalar type size. The value in SPRV-R is bit. It needs to translate to byte.
935 data1.size = (def_member.word(2) / 8);
936 }
937 const auto array_length_hierarchy_szie = data1.array_length_hierarchy.size();
938 if (array_length_hierarchy_szie > 0) {
939 data1.array_block_size.resize(array_length_hierarchy_szie, 1);
940
941 for (int i2 = static_cast<int>(array_length_hierarchy_szie - 1); i2 > 0; --i2) {
942 data1.array_block_size[i2 - 1] = data1.array_length_hierarchy[i2] * data1.array_block_size[i2];
943 }
944 }
945 data.struct_members.emplace_back(data1);
946 ++i;
947 }
948 uint32_t total_array_length = 1;
949 for (const auto length : data1.array_length_hierarchy) {
950 total_array_length *= length;
951 }
952 data.size = local_offset + data1.size * total_array_length;
953}
954
955static uint32_t UpdateOffset(uint32_t offset, const std::vector<uint32_t> &array_indices, const shader_struct_member &data) {
956 int array_indices_size = static_cast<int>(array_indices.size());
957 if (array_indices_size) {
958 uint32_t array_index = 0;
959 uint32_t i = 0;
960 for (const auto index : array_indices) {
961 array_index += (data.array_block_size[i] * index);
962 ++i;
963 }
964 offset += (array_index * data.size);
965 }
966 return offset;
967}
968
969static void SetUsedBytes(uint32_t offset, const std::vector<uint32_t> &array_indices, const shader_struct_member &data) {
970 int array_indices_size = static_cast<int>(array_indices.size());
971 uint32_t block_memory_size = data.size;
972 for (uint32_t i = static_cast<int>(array_indices_size); i < data.array_length_hierarchy.size(); ++i) {
973 block_memory_size *= data.array_length_hierarchy[i];
974 }
975
976 offset = UpdateOffset(offset, array_indices, data);
977
978 uint32_t end = offset + block_memory_size;
979 auto used_bytes = data.GetUsedbytes();
980 if (used_bytes->size() < end) {
981 used_bytes->resize(end, 0);
982 }
983 std::memset(used_bytes->data() + offset, true, static_cast<std::size_t>(block_memory_size));
984}
985
986void SHADER_MODULE_STATE::RunUsedArray(uint32_t offset, std::vector<uint32_t> array_indices, uint32_t access_chain_word_index,
987 spirv_inst_iter &access_chain_it, const shader_struct_member &data) const {
988 if (access_chain_word_index < access_chain_it.len()) {
989 if (data.array_length_hierarchy.size() > array_indices.size()) {
990 auto def_it = get_def(access_chain_it.word(access_chain_word_index));
991 ++access_chain_word_index;
992
993 if (def_it != end() && def_it.opcode() == spv::OpConstant) {
994 array_indices.emplace_back(def_it.word(3));
995 RunUsedArray(offset, array_indices, access_chain_word_index, access_chain_it, data);
996 } else {
997 // If it is a variable, set the all array is used.
998 if (access_chain_word_index < access_chain_it.len()) {
999 uint32_t array_length = data.array_length_hierarchy[array_indices.size()];
1000 for (uint32_t i = 0; i < array_length; ++i) {
1001 auto array_indices2 = array_indices;
1002 array_indices2.emplace_back(i);
1003 RunUsedArray(offset, array_indices2, access_chain_word_index, access_chain_it, data);
1004 }
1005 } else {
1006 SetUsedBytes(offset, array_indices, data);
1007 }
1008 }
1009 } else {
1010 offset = UpdateOffset(offset, array_indices, data);
1011 RunUsedStruct(offset, access_chain_word_index, access_chain_it, data);
1012 }
1013 } else {
1014 SetUsedBytes(offset, array_indices, data);
1015 }
1016}
1017
1018void SHADER_MODULE_STATE::RunUsedStruct(uint32_t offset, uint32_t access_chain_word_index, spirv_inst_iter &access_chain_it,
1019 const shader_struct_member &data) const {
1020 std::vector<uint32_t> array_indices_emptry;
1021
1022 if (access_chain_word_index < access_chain_it.len()) {
1023 auto strcut_member_index = GetConstantValueById(access_chain_it.word(access_chain_word_index));
1024 ++access_chain_word_index;
1025
1026 auto data1 = data.struct_members[strcut_member_index];
1027 RunUsedArray(offset + data1.offset, array_indices_emptry, access_chain_word_index, access_chain_it, data1);
1028 }
1029}
1030
1031void SHADER_MODULE_STATE::SetUsedStructMember(const uint32_t variable_id, const std::vector<function_set> &function_set_list,
1032 const shader_struct_member &data) const {
1033 for (const auto &func_set : function_set_list) {
1034 auto range = func_set.op_lists.equal_range(spv::OpAccessChain);
1035 for (auto it = range.first; it != range.second; ++it) {
1036 auto access_chain = at(it->second);
1037 if (access_chain.word(3) == variable_id) {
1038 RunUsedStruct(0, 4, access_chain, data);
1039 }
1040 }
1041 }
1042}
1043
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -06001044// static
1045void SHADER_MODULE_STATE::SetPushConstantUsedInShader(
sfricke-samsungef15e482022-01-26 11:32:49 -08001046 const SHADER_MODULE_STATE &module_state, std::unordered_multimap<std::string, SHADER_MODULE_STATE::EntryPoint> &entry_points) {
sfricke-samsung962cad92021-04-13 00:46:29 -07001047 for (auto &entrypoint : entry_points) {
1048 auto range = entrypoint.second.decorate_list.equal_range(spv::OpVariable);
1049 for (auto it = range.first; it != range.second; ++it) {
sfricke-samsungef15e482022-01-26 11:32:49 -08001050 const auto def_insn = module_state.at(it->second);
sfricke-samsung962cad92021-04-13 00:46:29 -07001051
1052 if (def_insn.word(3) == spv::StorageClassPushConstant) {
sfricke-samsungef15e482022-01-26 11:32:49 -08001053 spirv_inst_iter type = module_state.get_def(def_insn.word(1));
sfricke-samsung962cad92021-04-13 00:46:29 -07001054 const auto range2 = entrypoint.second.decorate_list.equal_range(spv::OpMemberDecorate);
1055 std::vector<uint32_t> offsets;
1056
1057 for (auto it2 = range2.first; it2 != range2.second; ++it2) {
sfricke-samsungef15e482022-01-26 11:32:49 -08001058 auto member_decorate = module_state.at(it2->second);
sfricke-samsung962cad92021-04-13 00:46:29 -07001059 if (member_decorate.len() == 5 && member_decorate.word(3) == spv::DecorationOffset) {
1060 offsets.emplace_back(member_decorate.offset());
1061 }
1062 }
1063 entrypoint.second.push_constant_used_in_shader.root = &entrypoint.second.push_constant_used_in_shader;
sfricke-samsungef15e482022-01-26 11:32:49 -08001064 module_state.DefineStructMember(type, offsets, entrypoint.second.push_constant_used_in_shader);
1065 module_state.SetUsedStructMember(def_insn.word(2), entrypoint.second.function_set_list,
1066 entrypoint.second.push_constant_used_in_shader);
sfricke-samsung962cad92021-04-13 00:46:29 -07001067 }
1068 }
1069 }
1070}
1071
1072uint32_t SHADER_MODULE_STATE::DescriptorTypeToReqs(uint32_t type_id) const {
1073 auto type = get_def(type_id);
1074
1075 while (true) {
1076 switch (type.opcode()) {
1077 case spv::OpTypeArray:
1078 case spv::OpTypeRuntimeArray:
1079 case spv::OpTypeSampledImage:
1080 type = get_def(type.word(2));
1081 break;
1082 case spv::OpTypePointer:
1083 type = get_def(type.word(3));
1084 break;
1085 case spv::OpTypeImage: {
1086 auto dim = type.word(3);
1087 auto arrayed = type.word(5);
1088 auto msaa = type.word(6);
1089
1090 uint32_t bits = 0;
1091 switch (GetFundamentalType(type.word(2))) {
1092 case FORMAT_TYPE_FLOAT:
1093 bits = DESCRIPTOR_REQ_COMPONENT_TYPE_FLOAT;
1094 break;
1095 case FORMAT_TYPE_UINT:
1096 bits = DESCRIPTOR_REQ_COMPONENT_TYPE_UINT;
1097 break;
1098 case FORMAT_TYPE_SINT:
1099 bits = DESCRIPTOR_REQ_COMPONENT_TYPE_SINT;
1100 break;
1101 default:
1102 break;
1103 }
1104
1105 switch (dim) {
1106 case spv::Dim1D:
1107 bits |= arrayed ? DESCRIPTOR_REQ_VIEW_TYPE_1D_ARRAY : DESCRIPTOR_REQ_VIEW_TYPE_1D;
1108 return bits;
1109 case spv::Dim2D:
1110 bits |= msaa ? DESCRIPTOR_REQ_MULTI_SAMPLE : DESCRIPTOR_REQ_SINGLE_SAMPLE;
1111 bits |= arrayed ? DESCRIPTOR_REQ_VIEW_TYPE_2D_ARRAY : DESCRIPTOR_REQ_VIEW_TYPE_2D;
1112 return bits;
1113 case spv::Dim3D:
1114 bits |= DESCRIPTOR_REQ_VIEW_TYPE_3D;
1115 return bits;
1116 case spv::DimCube:
1117 bits |= arrayed ? DESCRIPTOR_REQ_VIEW_TYPE_CUBE_ARRAY : DESCRIPTOR_REQ_VIEW_TYPE_CUBE;
1118 return bits;
1119 case spv::DimSubpassData:
1120 bits |= msaa ? DESCRIPTOR_REQ_MULTI_SAMPLE : DESCRIPTOR_REQ_SINGLE_SAMPLE;
1121 return bits;
1122 default: // buffer, etc.
1123 return bits;
1124 }
1125 }
1126 default:
1127 return 0;
1128 }
1129 }
1130}
1131
1132// For some built-in analysis we need to know if the variable decorated with as the built-in was actually written to.
1133// This function examines instructions in the static call tree for a write to this variable.
1134bool SHADER_MODULE_STATE::IsBuiltInWritten(spirv_inst_iter builtin_instr, spirv_inst_iter entrypoint) const {
1135 auto type = builtin_instr.opcode();
1136 uint32_t target_id = builtin_instr.word(1);
1137 bool init_complete = false;
Nathaniel Cesario80c0e0f2021-10-14 13:25:54 -06001138 uint32_t target_member_offset = 0;
sfricke-samsung962cad92021-04-13 00:46:29 -07001139
1140 if (type == spv::OpMemberDecorate) {
1141 // Built-in is part of a structure -- examine instructions up to first function body to get initial IDs
1142 auto insn = entrypoint;
1143 while (!init_complete && (insn.opcode() != spv::OpFunction)) {
1144 switch (insn.opcode()) {
1145 case spv::OpTypePointer:
Nathaniel Cesario58fc2282021-08-18 12:20:40 -06001146 if (insn.word(2) == spv::StorageClassOutput) {
1147 const auto type_id = insn.word(3);
1148 if (type_id == target_id) {
1149 target_id = insn.word(1);
1150 } else {
1151 // If the output is an array, check if the element type is what we're looking for
1152 const auto type_insn = get_def(type_id);
1153 if ((type_insn.opcode() == spv::OpTypeArray) && (type_insn.word(2) == target_id)) {
1154 target_id = insn.word(1);
Nathaniel Cesario80c0e0f2021-10-14 13:25:54 -06001155 target_member_offset = 1;
Nathaniel Cesario58fc2282021-08-18 12:20:40 -06001156 }
1157 }
sfricke-samsung962cad92021-04-13 00:46:29 -07001158 }
1159 break;
1160 case spv::OpVariable:
1161 if (insn.word(1) == target_id) {
1162 target_id = insn.word(2);
1163 init_complete = true;
1164 }
1165 break;
1166 }
1167 insn++;
1168 }
1169 }
1170
1171 if (!init_complete && (type == spv::OpMemberDecorate)) return false;
1172
1173 bool found_write = false;
1174 layer_data::unordered_set<uint32_t> worklist;
1175 worklist.insert(entrypoint.word(2));
1176
1177 // Follow instructions in call graph looking for writes to target
1178 while (!worklist.empty() && !found_write) {
1179 auto id_iter = worklist.begin();
1180 auto id = *id_iter;
1181 worklist.erase(id_iter);
1182
1183 auto insn = get_def(id);
1184 if (insn == end()) {
1185 continue;
1186 }
1187
1188 if (insn.opcode() == spv::OpFunction) {
1189 // Scan body of function looking for other function calls or items in our ID chain
Nathaniel Cesario58fc2282021-08-18 12:20:40 -06001190 while (++insn, (insn.opcode() != spv::OpFunctionEnd) && !found_write) {
sfricke-samsung962cad92021-04-13 00:46:29 -07001191 switch (insn.opcode()) {
1192 case spv::OpAccessChain:
1193 if (insn.word(3) == target_id) {
1194 if (type == spv::OpMemberDecorate) {
Nathaniel Cesario80c0e0f2021-10-14 13:25:54 -06001195 // Get the target member of the struct
1196 // NOTE: this will only work for structs and arrays of structs. Deeper levels of nesting (e.g.,
1197 // arrays of structs of structs) is not currently supported.
1198 const auto value_itr = GetConstantDef(insn.word(4 + target_member_offset));
1199 if (value_itr != end()) {
1200 auto value = GetConstantValue(value_itr);
1201 if (value == builtin_instr.word(2)) {
1202 target_id = insn.word(2);
1203 }
sfricke-samsung962cad92021-04-13 00:46:29 -07001204 }
1205 } else {
1206 target_id = insn.word(2);
1207 }
1208 }
1209 break;
1210 case spv::OpStore:
1211 if (insn.word(1) == target_id) {
1212 found_write = true;
1213 }
1214 break;
1215 case spv::OpFunctionCall:
1216 worklist.insert(insn.word(3));
1217 break;
1218 }
1219 }
1220 }
1221 }
1222 return found_write;
1223}
1224
1225// Used by the collection functions to help aid in state tracking
1226struct shader_module_used_operators {
1227 bool updated;
sfricke-samsungad55ccc2022-01-19 20:06:17 -08001228 std::vector<unsigned> image_read_members;
1229 std::vector<unsigned> image_write_members;
sfricke-samsung962cad92021-04-13 00:46:29 -07001230 std::vector<unsigned> atomic_members;
1231 std::vector<unsigned> store_members;
1232 std::vector<unsigned> atomic_store_members;
1233 std::vector<unsigned> sampler_implicitLod_dref_proj_members; // sampler Load id
1234 std::vector<unsigned> sampler_bias_offset_members; // sampler Load id
Lionel Landwerlincdbe8682021-12-08 15:10:37 +02001235 std::vector<unsigned> image_dref_members;
sfricke-samsungad55ccc2022-01-19 20:06:17 -08001236 std::vector<std::pair<unsigned, unsigned>> sampled_image_members; // <image,sampler> Load id
sfricke-samsung962cad92021-04-13 00:46:29 -07001237 layer_data::unordered_map<unsigned, unsigned> load_members;
1238 layer_data::unordered_map<unsigned, std::pair<unsigned, unsigned>> accesschain_members;
1239 layer_data::unordered_map<unsigned, unsigned> image_texel_pointer_members;
1240
1241 shader_module_used_operators() : updated(false) {}
1242
1243 bool CheckImageOperandsBiasOffset(uint32_t type) {
1244 return type & (spv::ImageOperandsBiasMask | spv::ImageOperandsConstOffsetMask | spv::ImageOperandsOffsetMask |
1245 spv::ImageOperandsConstOffsetsMask)
1246 ? true
1247 : false;
1248 }
1249
sfricke-samsungef15e482022-01-26 11:32:49 -08001250 void update(SHADER_MODULE_STATE const *module_state) {
sfricke-samsung962cad92021-04-13 00:46:29 -07001251 if (updated) return;
1252 updated = true;
1253
sfricke-samsungef15e482022-01-26 11:32:49 -08001254 for (auto insn : *module_state) {
sfricke-samsung962cad92021-04-13 00:46:29 -07001255 switch (insn.opcode()) {
1256 case spv::OpImageSampleImplicitLod:
1257 case spv::OpImageSampleProjImplicitLod:
1258 case spv::OpImageSampleProjExplicitLod:
1259 case spv::OpImageSparseSampleImplicitLod:
1260 case spv::OpImageSparseSampleProjImplicitLod:
1261 case spv::OpImageSparseSampleProjExplicitLod: {
sfricke-samsungdb3f3f82022-01-18 06:41:15 -08001262 // combined image samples are just OpLoad, but also can be separate image and sampler
sfricke-samsungef15e482022-01-26 11:32:49 -08001263 auto id = module_state->get_def(insn.word(3)); // <id> Sampled Image
sfricke-samsungdb3f3f82022-01-18 06:41:15 -08001264 auto load_id = (id.opcode() == spv::OpSampledImage) ? id.word(4) : insn.word(3);
1265 sampler_implicitLod_dref_proj_members.emplace_back(load_id);
sfricke-samsung962cad92021-04-13 00:46:29 -07001266 // ImageOperands in index: 5
1267 if (insn.len() > 5 && CheckImageOperandsBiasOffset(insn.word(5))) {
sfricke-samsungdb3f3f82022-01-18 06:41:15 -08001268 sampler_bias_offset_members.emplace_back(load_id);
sfricke-samsung962cad92021-04-13 00:46:29 -07001269 }
1270 break;
1271 }
Lionel Landwerlincdbe8682021-12-08 15:10:37 +02001272 case spv::OpImageDrefGather:
1273 case spv::OpImageSparseDrefGather: {
sfricke-samsungdb3f3f82022-01-18 06:41:15 -08001274 // combined image samples are just OpLoad, but also can be separate image and sampler
sfricke-samsungef15e482022-01-26 11:32:49 -08001275 auto id = module_state->get_def(insn.word(3)); // <id> Sampled Image
sfricke-samsungdb3f3f82022-01-18 06:41:15 -08001276 auto load_id = (id.opcode() == spv::OpSampledImage) ? id.word(3) : insn.word(3);
1277 image_dref_members.emplace_back(load_id);
Lionel Landwerlincdbe8682021-12-08 15:10:37 +02001278 break;
1279 }
sfricke-samsung962cad92021-04-13 00:46:29 -07001280 case spv::OpImageSampleDrefImplicitLod:
1281 case spv::OpImageSampleDrefExplicitLod:
1282 case spv::OpImageSampleProjDrefImplicitLod:
1283 case spv::OpImageSampleProjDrefExplicitLod:
1284 case spv::OpImageSparseSampleDrefImplicitLod:
1285 case spv::OpImageSparseSampleDrefExplicitLod:
1286 case spv::OpImageSparseSampleProjDrefImplicitLod:
1287 case spv::OpImageSparseSampleProjDrefExplicitLod: {
sfricke-samsungdb3f3f82022-01-18 06:41:15 -08001288 // combined image samples are just OpLoad, but also can be separate image and sampler
sfricke-samsungef15e482022-01-26 11:32:49 -08001289 auto id = module_state->get_def(insn.word(3)); // <id> Sampled Image
sfricke-samsungdb3f3f82022-01-18 06:41:15 -08001290 auto sampler_load_id = (id.opcode() == spv::OpSampledImage) ? id.word(4) : insn.word(3);
1291 auto image_load_id = (id.opcode() == spv::OpSampledImage) ? id.word(3) : insn.word(3);
1292
1293 image_dref_members.emplace_back(image_load_id);
1294 sampler_implicitLod_dref_proj_members.emplace_back(sampler_load_id);
sfricke-samsung962cad92021-04-13 00:46:29 -07001295 // ImageOperands in index: 6
1296 if (insn.len() > 6 && CheckImageOperandsBiasOffset(insn.word(6))) {
sfricke-samsungdb3f3f82022-01-18 06:41:15 -08001297 sampler_bias_offset_members.emplace_back(sampler_load_id);
sfricke-samsung962cad92021-04-13 00:46:29 -07001298 }
1299 break;
1300 }
1301 case spv::OpImageSampleExplicitLod:
1302 case spv::OpImageSparseSampleExplicitLod: {
1303 // ImageOperands in index: 5
1304 if (insn.len() > 5 && CheckImageOperandsBiasOffset(insn.word(5))) {
sfricke-samsungdb3f3f82022-01-18 06:41:15 -08001305 // combined image samples are just OpLoad, but also can be separate image and sampler
sfricke-samsungef15e482022-01-26 11:32:49 -08001306 auto id = module_state->get_def(insn.word(3)); // <id> Sampled Image
sfricke-samsungdb3f3f82022-01-18 06:41:15 -08001307 auto load_id = (id.opcode() == spv::OpSampledImage) ? id.word(4) : insn.word(3);
1308 sampler_bias_offset_members.emplace_back(load_id);
sfricke-samsung962cad92021-04-13 00:46:29 -07001309 }
1310 break;
1311 }
1312 case spv::OpStore: {
1313 store_members.emplace_back(insn.word(1)); // object id or AccessChain id
1314 break;
1315 }
Lionel Landwerlinbc7401b2021-12-07 15:43:05 +02001316 case spv::OpImageRead:
1317 case spv::OpImageSparseRead: {
sfricke-samsungad55ccc2022-01-19 20:06:17 -08001318 image_read_members.emplace_back(insn.word(3)); // Load id
Lionel Landwerlinbc7401b2021-12-07 15:43:05 +02001319 break;
1320 }
sfricke-samsung962cad92021-04-13 00:46:29 -07001321 case spv::OpImageWrite: {
sfricke-samsungad55ccc2022-01-19 20:06:17 -08001322 image_write_members.emplace_back(insn.word(1)); // Load id
sfricke-samsung962cad92021-04-13 00:46:29 -07001323 break;
1324 }
1325 case spv::OpSampledImage: {
1326 // 3: image load id, 4: sampler load id
sfricke-samsungad55ccc2022-01-19 20:06:17 -08001327 sampled_image_members.emplace_back(std::pair<unsigned, unsigned>(insn.word(3), insn.word(4)));
sfricke-samsung962cad92021-04-13 00:46:29 -07001328 break;
1329 }
1330 case spv::OpLoad: {
1331 // 2: Load id, 3: object id or AccessChain id
1332 load_members.emplace(insn.word(2), insn.word(3));
1333 break;
1334 }
1335 case spv::OpAccessChain: {
1336 if (insn.len() == 4) {
1337 // If it is for struct, the length is only 4.
1338 // 2: AccessChain id, 3: object id
1339 accesschain_members.emplace(insn.word(2), std::pair<unsigned, unsigned>(insn.word(3), 0));
1340 } else {
1341 // 2: AccessChain id, 3: object id, 4: object id of array index
1342 accesschain_members.emplace(insn.word(2), std::pair<unsigned, unsigned>(insn.word(3), insn.word(4)));
1343 }
1344 break;
1345 }
1346 case spv::OpImageTexelPointer: {
1347 // 2: ImageTexelPointer id, 3: object id
1348 image_texel_pointer_members.emplace(insn.word(2), insn.word(3));
1349 break;
1350 }
1351 default: {
1352 if (AtomicOperation(insn.opcode())) {
1353 if (insn.opcode() == spv::OpAtomicStore) {
1354 atomic_store_members.emplace_back(insn.word(1)); // ImageTexelPointer id
1355 } else {
1356 atomic_members.emplace_back(insn.word(3)); // ImageTexelPointer id
1357 }
1358 }
1359 break;
1360 }
1361 }
1362 }
1363 }
1364};
1365
1366static bool CheckObjectIDFromOpLoad(uint32_t object_id, const std::vector<unsigned> &operator_members,
1367 const layer_data::unordered_map<unsigned, unsigned> &load_members,
1368 const layer_data::unordered_map<unsigned, std::pair<unsigned, unsigned>> &accesschain_members) {
1369 for (auto load_id : operator_members) {
1370 if (object_id == load_id) return true;
1371 auto load_it = load_members.find(load_id);
1372 if (load_it == load_members.end()) {
1373 continue;
1374 }
1375 if (load_it->second == object_id) {
1376 return true;
1377 }
1378
1379 auto accesschain_it = accesschain_members.find(load_it->second);
1380 if (accesschain_it == accesschain_members.end()) {
1381 continue;
1382 }
1383 if (accesschain_it->second.first == object_id) {
1384 return true;
1385 }
1386 }
1387 return false;
1388}
1389
1390// Takes a OpVariable and looks at the the descriptor type it uses. This will find things such as if the variable is writable, image
1391// atomic operation, matching images to samplers, etc
1392void SHADER_MODULE_STATE::IsSpecificDescriptorType(const spirv_inst_iter &id_it, bool is_storage_buffer, bool is_check_writable,
1393 interface_var &out_interface_var,
1394 shader_module_used_operators &used_operators) const {
1395 uint32_t type_id = id_it.word(1);
1396 unsigned int id = id_it.word(2);
1397
1398 auto type = get_def(type_id);
1399
1400 // Strip off any array or ptrs. Where we remove array levels, adjust the descriptor count for each dimension.
1401 while (type.opcode() == spv::OpTypeArray || type.opcode() == spv::OpTypePointer || type.opcode() == spv::OpTypeRuntimeArray ||
1402 type.opcode() == spv::OpTypeSampledImage) {
1403 if (type.opcode() == spv::OpTypeArray || type.opcode() == spv::OpTypeRuntimeArray ||
1404 type.opcode() == spv::OpTypeSampledImage) {
1405 type = get_def(type.word(2)); // Element type
1406 } else {
1407 type = get_def(type.word(3)); // Pointer type
1408 }
1409 }
Lionel Landwerlinbc7401b2021-12-07 15:43:05 +02001410
sfricke-samsung962cad92021-04-13 00:46:29 -07001411 switch (type.opcode()) {
1412 case spv::OpTypeImage: {
1413 auto dim = type.word(3);
1414 if (dim != spv::DimSubpassData) {
1415 used_operators.update(this);
1416
Lionel Landwerlinbc7401b2021-12-07 15:43:05 +02001417 // Sampled == 2 indicates used without a sampler (a storage image)
1418 bool is_image_without_format = false;
1419 if (type.word(7) == 2) is_image_without_format = type.word(8) == spv::ImageFormatUnknown;
1420
sfricke-samsungad55ccc2022-01-19 20:06:17 -08001421 if (CheckObjectIDFromOpLoad(id, used_operators.image_write_members, used_operators.load_members,
sfricke-samsung962cad92021-04-13 00:46:29 -07001422 used_operators.accesschain_members)) {
1423 out_interface_var.is_writable = true;
Lionel Landwerlinbc7401b2021-12-07 15:43:05 +02001424 if (is_image_without_format) out_interface_var.is_write_without_format = true;
1425 }
sfricke-samsungad55ccc2022-01-19 20:06:17 -08001426 if (CheckObjectIDFromOpLoad(id, used_operators.image_read_members, used_operators.load_members,
Lionel Landwerlinbc7401b2021-12-07 15:43:05 +02001427 used_operators.accesschain_members)) {
1428 out_interface_var.is_readable = true;
1429 if (is_image_without_format) out_interface_var.is_read_without_format = true;
sfricke-samsung962cad92021-04-13 00:46:29 -07001430 }
1431 if (CheckObjectIDFromOpLoad(id, used_operators.sampler_implicitLod_dref_proj_members, used_operators.load_members,
1432 used_operators.accesschain_members)) {
1433 out_interface_var.is_sampler_implicitLod_dref_proj = true;
1434 }
1435 if (CheckObjectIDFromOpLoad(id, used_operators.sampler_bias_offset_members, used_operators.load_members,
1436 used_operators.accesschain_members)) {
1437 out_interface_var.is_sampler_bias_offset = true;
1438 }
1439 if (CheckObjectIDFromOpLoad(id, used_operators.atomic_members, used_operators.image_texel_pointer_members,
1440 used_operators.accesschain_members) ||
1441 CheckObjectIDFromOpLoad(id, used_operators.atomic_store_members, used_operators.image_texel_pointer_members,
1442 used_operators.accesschain_members)) {
1443 out_interface_var.is_atomic_operation = true;
1444 }
Lionel Landwerlincdbe8682021-12-08 15:10:37 +02001445 if (CheckObjectIDFromOpLoad(id, used_operators.image_dref_members, used_operators.load_members,
1446 used_operators.accesschain_members)) {
1447 out_interface_var.is_dref_operation = true;
1448 }
sfricke-samsung962cad92021-04-13 00:46:29 -07001449
sfricke-samsungad55ccc2022-01-19 20:06:17 -08001450 for (auto &itp_id : used_operators.sampled_image_members) {
sfricke-samsung962cad92021-04-13 00:46:29 -07001451 // Find if image id match.
1452 uint32_t image_index = 0;
1453 auto load_it = used_operators.load_members.find(itp_id.first);
1454 if (load_it == used_operators.load_members.end()) {
1455 continue;
1456 } else {
1457 if (load_it->second != id) {
1458 auto accesschain_it = used_operators.accesschain_members.find(load_it->second);
1459 if (accesschain_it == used_operators.accesschain_members.end()) {
1460 continue;
1461 } else {
1462 if (accesschain_it->second.first != id) {
1463 continue;
1464 }
1465
1466 const auto const_itr = GetConstantDef(accesschain_it->second.second);
1467 if (const_itr == end()) {
1468 // access chain index not a constant, skip.
1469 break;
1470 }
1471 image_index = GetConstantValue(const_itr);
1472 }
1473 }
1474 }
1475 // Find sampler's set binding.
1476 load_it = used_operators.load_members.find(itp_id.second);
1477 if (load_it == used_operators.load_members.end()) {
1478 continue;
1479 } else {
1480 uint32_t sampler_id = load_it->second;
1481 uint32_t sampler_index = 0;
1482 auto accesschain_it = used_operators.accesschain_members.find(load_it->second);
1483
1484 if (accesschain_it != used_operators.accesschain_members.end()) {
1485 const auto const_itr = GetConstantDef(accesschain_it->second.second);
1486 if (const_itr == end()) {
1487 // access chain index representing sampler index is not a constant, skip.
1488 break;
1489 }
1490 sampler_id = const_itr.offset();
1491 sampler_index = GetConstantValue(const_itr);
1492 }
1493 auto sampler_dec = get_decorations(sampler_id);
1494 if (image_index >= out_interface_var.samplers_used_by_image.size()) {
1495 out_interface_var.samplers_used_by_image.resize(image_index + 1);
1496 }
sfricke-samsungdb3f3f82022-01-18 06:41:15 -08001497
1498 // Need to check again for these properties in case not using a combined image sampler
1499 if (CheckObjectIDFromOpLoad(sampler_id, used_operators.sampler_implicitLod_dref_proj_members,
1500 used_operators.load_members, used_operators.accesschain_members)) {
1501 out_interface_var.is_sampler_implicitLod_dref_proj = true;
1502 }
1503 if (CheckObjectIDFromOpLoad(sampler_id, used_operators.sampler_bias_offset_members,
1504 used_operators.load_members, used_operators.accesschain_members)) {
1505 out_interface_var.is_sampler_bias_offset = true;
1506 }
1507
sfricke-samsung962cad92021-04-13 00:46:29 -07001508 out_interface_var.samplers_used_by_image[image_index].emplace(
Jeremy Gebben7fc88a22021-08-25 13:30:45 -06001509 SamplerUsedByImage{DescriptorSlot{sampler_dec.descriptor_set, sampler_dec.binding}, sampler_index});
sfricke-samsung962cad92021-04-13 00:46:29 -07001510 }
1511 }
1512 }
1513 return;
1514 }
1515
1516 case spv::OpTypeStruct: {
1517 layer_data::unordered_set<unsigned> nonwritable_members;
1518 if (get_decorations(type.word(1)).flags & decoration_set::buffer_block_bit) is_storage_buffer = true;
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -06001519 for (auto insn : static_data_.member_decoration_inst) {
sfricke-samsung962cad92021-04-13 00:46:29 -07001520 if (insn.word(1) == type.word(1) && insn.word(3) == spv::DecorationNonWritable) {
1521 nonwritable_members.insert(insn.word(2));
1522 }
1523 }
1524
1525 // A buffer is writable if it's either flavor of storage buffer, and has any member not decorated
1526 // as nonwritable.
1527 if (is_storage_buffer && nonwritable_members.size() != type.len() - 2) {
1528 used_operators.update(this);
1529
1530 for (auto oid : used_operators.store_members) {
1531 if (id == oid) {
1532 out_interface_var.is_writable = true;
1533 return;
1534 }
1535 auto accesschain_it = used_operators.accesschain_members.find(oid);
1536 if (accesschain_it == used_operators.accesschain_members.end()) {
1537 continue;
1538 }
1539 if (accesschain_it->second.first == id) {
1540 out_interface_var.is_writable = true;
1541 return;
1542 }
1543 }
1544 if (CheckObjectIDFromOpLoad(id, used_operators.atomic_store_members, used_operators.image_texel_pointer_members,
1545 used_operators.accesschain_members)) {
1546 out_interface_var.is_writable = true;
1547 return;
1548 }
1549 }
1550 }
1551 }
1552}
1553
Jeremy Gebben7fc88a22021-08-25 13:30:45 -06001554std::vector<std::pair<DescriptorSlot, interface_var>> SHADER_MODULE_STATE::CollectInterfaceByDescriptorSlot(
Jeremy Gebben84b838b2021-08-23 08:41:39 -06001555 layer_data::unordered_set<uint32_t> const &accessible_ids) const {
Jeremy Gebben7fc88a22021-08-25 13:30:45 -06001556 std::vector<std::pair<DescriptorSlot, interface_var>> out;
sfricke-samsung962cad92021-04-13 00:46:29 -07001557 shader_module_used_operators operators;
1558
1559 for (auto id : accessible_ids) {
1560 auto insn = get_def(id);
1561 assert(insn != end());
1562
1563 if (insn.opcode() == spv::OpVariable &&
Lionel Landwerlin6a9f89c2021-12-07 15:46:46 +02001564 (insn.word(3) == spv::StorageClassUniform ||
1565 insn.word(3) == spv::StorageClassUniformConstant ||
sfricke-samsung962cad92021-04-13 00:46:29 -07001566 insn.word(3) == spv::StorageClassStorageBuffer)) {
1567 auto d = get_decorations(insn.word(2));
1568 unsigned set = d.descriptor_set;
1569 unsigned binding = d.binding;
1570
1571 interface_var v = {};
1572 v.id = insn.word(2);
1573 v.type_id = insn.word(1);
1574
1575 IsSpecificDescriptorType(insn, insn.word(3) == spv::StorageClassStorageBuffer,
1576 !(d.flags & decoration_set::nonwritable_bit), v, operators);
Jeremy Gebben84b838b2021-08-23 08:41:39 -06001577 out.emplace_back(DescriptorSlot{set, binding}, v);
sfricke-samsung962cad92021-04-13 00:46:29 -07001578 }
1579 }
1580
1581 return out;
1582}
1583
1584layer_data::unordered_set<uint32_t> SHADER_MODULE_STATE::CollectWritableOutputLocationinFS(
Jeremy Gebben84b838b2021-08-23 08:41:39 -06001585 const spirv_inst_iter &entrypoint) const {
sfricke-samsung962cad92021-04-13 00:46:29 -07001586 layer_data::unordered_set<uint32_t> location_list;
sfricke-samsung962cad92021-04-13 00:46:29 -07001587 const auto outputs = CollectInterfaceByLocation(entrypoint, spv::StorageClassOutput, false);
1588 layer_data::unordered_set<unsigned> store_members;
1589 layer_data::unordered_map<unsigned, unsigned> accesschain_members;
1590
1591 for (auto insn : *this) {
1592 switch (insn.opcode()) {
1593 case spv::OpStore:
1594 case spv::OpAtomicStore: {
1595 store_members.insert(insn.word(1)); // object id or AccessChain id
1596 break;
1597 }
1598 case spv::OpAccessChain: {
1599 // 2: AccessChain id, 3: object id
1600 if (insn.word(3)) accesschain_members.emplace(insn.word(2), insn.word(3));
1601 break;
1602 }
1603 default:
1604 break;
1605 }
1606 }
1607 if (store_members.empty()) {
1608 return location_list;
1609 }
1610 for (auto output : outputs) {
1611 auto store_it = store_members.find(output.second.id);
1612 if (store_it != store_members.end()) {
1613 location_list.insert(output.first.first);
1614 store_members.erase(store_it);
1615 continue;
1616 }
1617 store_it = store_members.begin();
1618 while (store_it != store_members.end()) {
1619 auto accesschain_it = accesschain_members.find(*store_it);
1620 if (accesschain_it == accesschain_members.end()) {
1621 ++store_it;
1622 continue;
1623 }
1624 if (accesschain_it->second == output.second.id) {
1625 location_list.insert(output.first.first);
1626 store_members.erase(store_it);
1627 accesschain_members.erase(accesschain_it);
1628 break;
1629 }
1630 ++store_it;
1631 }
1632 }
1633 return location_list;
1634}
1635
1636bool SHADER_MODULE_STATE::CollectInterfaceBlockMembers(std::map<location_t, interface_var> *out, bool is_array_of_verts,
ziga-lunarg9e94e112021-09-27 00:21:10 +02001637 uint32_t id, uint32_t type_id, bool is_patch,
1638 uint32_t /*first_location*/) const {
sfricke-samsung962cad92021-04-13 00:46:29 -07001639 // Walk down the type_id presented, trying to determine whether it's actually an interface block.
1640 auto type = GetStructType(get_def(type_id), is_array_of_verts && !is_patch);
1641 if (type == end() || !(get_decorations(type.word(1)).flags & decoration_set::block_bit)) {
1642 // This isn't an interface block.
1643 return false;
1644 }
1645
1646 layer_data::unordered_map<unsigned, unsigned> member_components;
1647 layer_data::unordered_map<unsigned, unsigned> member_relaxed_precision;
1648 layer_data::unordered_map<unsigned, unsigned> member_patch;
1649
1650 // Walk all the OpMemberDecorate for type's result id -- first pass, collect components.
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -06001651 for (auto insn : static_data_.member_decoration_inst) {
sfricke-samsung962cad92021-04-13 00:46:29 -07001652 if (insn.word(1) == type.word(1)) {
1653 unsigned member_index = insn.word(2);
1654
1655 if (insn.word(3) == spv::DecorationComponent) {
1656 unsigned component = insn.word(4);
1657 member_components[member_index] = component;
1658 }
1659
1660 if (insn.word(3) == spv::DecorationRelaxedPrecision) {
1661 member_relaxed_precision[member_index] = 1;
1662 }
1663
1664 if (insn.word(3) == spv::DecorationPatch) {
1665 member_patch[member_index] = 1;
1666 }
1667 }
1668 }
1669
1670 // TODO: correctly handle location assignment from outside
1671
1672 // Second pass -- produce the output, from Location decorations
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -06001673 for (auto insn : static_data_.member_decoration_inst) {
sfricke-samsung962cad92021-04-13 00:46:29 -07001674 if (insn.word(1) == type.word(1)) {
1675 unsigned member_index = insn.word(2);
1676 unsigned member_type_id = type.word(2 + member_index);
1677
1678 if (insn.word(3) == spv::DecorationLocation) {
1679 unsigned location = insn.word(4);
1680 unsigned num_locations = GetLocationsConsumedByType(member_type_id, false);
1681 auto component_it = member_components.find(member_index);
1682 unsigned component = component_it == member_components.end() ? 0 : component_it->second;
1683 bool is_relaxed_precision = member_relaxed_precision.find(member_index) != member_relaxed_precision.end();
1684 bool member_is_patch = is_patch || member_patch.count(member_index) > 0;
1685
1686 for (unsigned int offset = 0; offset < num_locations; offset++) {
1687 interface_var v = {};
1688 v.id = id;
1689 // TODO: member index in interface_var too?
1690 v.type_id = member_type_id;
1691 v.offset = offset;
1692 v.is_patch = member_is_patch;
1693 v.is_block_member = true;
1694 v.is_relaxed_precision = is_relaxed_precision;
1695 (*out)[std::make_pair(location + offset, component)] = v;
1696 }
1697 }
1698 }
1699 }
1700
1701 return true;
1702}
1703
1704std::map<location_t, interface_var> SHADER_MODULE_STATE::CollectInterfaceByLocation(spirv_inst_iter entrypoint,
1705 spv::StorageClass sinterface,
1706 bool is_array_of_verts) const {
1707 // TODO: handle index=1 dual source outputs from FS -- two vars will have the same location, and we DON'T want to clobber.
1708
1709 std::map<location_t, interface_var> out;
1710
1711 for (uint32_t iid : FindEntrypointInterfaces(entrypoint)) {
1712 auto insn = get_def(iid);
1713 assert(insn != end());
1714 assert(insn.opcode() == spv::OpVariable);
1715
ziga-lunarg9e94e112021-09-27 00:21:10 +02001716 const auto d = get_decorations(iid);
1717 bool passthrough = sinterface == spv::StorageClassOutput && insn.word(3) == spv::StorageClassInput &&
1718 (d.flags & decoration_set::passthrough_bit) != 0;
1719 if (insn.word(3) == static_cast<uint32_t>(sinterface) || passthrough) {
sfricke-samsung962cad92021-04-13 00:46:29 -07001720 unsigned id = insn.word(2);
1721 unsigned type = insn.word(1);
1722
ziga-lunarg9e94e112021-09-27 00:21:10 +02001723 auto location = d.location;
sfricke-samsung962cad92021-04-13 00:46:29 -07001724 int builtin = d.builtin;
1725 unsigned component = d.component;
1726 bool is_patch = (d.flags & decoration_set::patch_bit) != 0;
1727 bool is_relaxed_precision = (d.flags & decoration_set::relaxed_precision_bit) != 0;
ziga-lunarg9e94e112021-09-27 00:21:10 +02001728 bool is_per_vertex = (d.flags & decoration_set::per_vertex_bit) != 0;
sfricke-samsung962cad92021-04-13 00:46:29 -07001729
1730 if (builtin != -1) {
1731 continue;
ziga-lunarg9e94e112021-09-27 00:21:10 +02001732 } else if (!CollectInterfaceBlockMembers(&out, is_array_of_verts, id, type, is_patch, location) ||
1733 location != decoration_set::kInvalidValue) {
sfricke-samsung962cad92021-04-13 00:46:29 -07001734 // A user-defined interface variable, with a location. Where a variable occupied multiple locations, emit
1735 // one result for each.
ziga-lunarg9e94e112021-09-27 00:21:10 +02001736 unsigned num_locations = GetLocationsConsumedByType(type, (is_array_of_verts && !is_patch) || is_per_vertex);
sfricke-samsung962cad92021-04-13 00:46:29 -07001737 for (unsigned int offset = 0; offset < num_locations; offset++) {
1738 interface_var v = {};
1739 v.id = id;
1740 v.type_id = type;
1741 v.offset = offset;
1742 v.is_patch = is_patch;
1743 v.is_relaxed_precision = is_relaxed_precision;
1744 out[std::make_pair(location + offset, component)] = v;
1745 }
1746 }
1747 }
1748 }
1749
1750 return out;
1751}
1752
1753std::vector<uint32_t> SHADER_MODULE_STATE::CollectBuiltinBlockMembers(spirv_inst_iter entrypoint, uint32_t storageClass) const {
sfricke-samsung962cad92021-04-13 00:46:29 -07001754 // Find all interface variables belonging to the entrypoint and matching the storage class
sfricke-samsung0df5ee72021-07-24 23:27:16 -07001755 std::vector<uint32_t> variables;
sfricke-samsung962cad92021-04-13 00:46:29 -07001756 for (uint32_t id : FindEntrypointInterfaces(entrypoint)) {
1757 auto def = get_def(id);
1758 assert(def != end());
1759 assert(def.opcode() == spv::OpVariable);
1760
1761 if (def.word(3) == storageClass) variables.push_back(def.word(1));
1762 }
1763
1764 // Find all members belonging to the builtin block selected
1765 std::vector<uint32_t> builtin_block_members;
1766 for (auto &var : variables) {
1767 auto def = get_def(get_def(var).word(3));
1768
1769 // It could be an array of IO blocks. The element type should be the struct defining the block contents
1770 if (def.opcode() == spv::OpTypeArray) def = get_def(def.word(2));
1771
1772 // Now find all members belonging to the struct defining the IO block
1773 if (def.opcode() == spv::OpTypeStruct) {
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -06001774 for (auto set : static_data_.builtin_decoration_list) {
sfricke-samsung0df5ee72021-07-24 23:27:16 -07001775 auto insn = at(set.offset);
1776 if ((insn.opcode() == spv::OpMemberDecorate) && (def.word(1) == insn.word(1))) {
1777 // Start with undefined builtin for each struct member.
1778 // But only when confirmed the struct is the built-in inteface block (can only be one per shader)
1779 if (builtin_block_members.size() == 0) {
1780 builtin_block_members.resize(def.len() - 2, spv::BuiltInMax);
sfricke-samsung962cad92021-04-13 00:46:29 -07001781 }
sfricke-samsung0df5ee72021-07-24 23:27:16 -07001782 auto struct_index = insn.word(2);
1783 assert(struct_index < builtin_block_members.size());
1784 builtin_block_members[struct_index] = insn.word(4);
sfricke-samsung962cad92021-04-13 00:46:29 -07001785 }
1786 }
1787 }
1788 }
1789
1790 return builtin_block_members;
1791}
1792
1793std::vector<std::pair<uint32_t, interface_var>> SHADER_MODULE_STATE::CollectInterfaceByInputAttachmentIndex(
1794 layer_data::unordered_set<uint32_t> const &accessible_ids) const {
1795 std::vector<std::pair<uint32_t, interface_var>> out;
1796
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -06001797 for (auto insn : static_data_.decoration_inst) {
sfricke-samsung962cad92021-04-13 00:46:29 -07001798 if (insn.word(2) == spv::DecorationInputAttachmentIndex) {
1799 auto attachment_index = insn.word(3);
1800 auto id = insn.word(1);
1801
1802 if (accessible_ids.count(id)) {
1803 auto def = get_def(id);
1804 assert(def != end());
1805 if (def.opcode() == spv::OpVariable && def.word(3) == spv::StorageClassUniformConstant) {
1806 auto num_locations = GetLocationsConsumedByType(def.word(1), false);
1807 for (unsigned int offset = 0; offset < num_locations; offset++) {
1808 interface_var v = {};
1809 v.id = id;
1810 v.type_id = def.word(1);
1811 v.offset = offset;
1812 out.emplace_back(attachment_index + offset, v);
1813 }
1814 }
1815 }
1816 }
1817 }
1818
1819 return out;
1820}
1821
ziga-lunarg8346fe82021-08-22 17:30:50 +02001822uint32_t SHADER_MODULE_STATE::GetNumComponentsInBaseType(const spirv_inst_iter &iter) const {
1823 const uint32_t opcode = iter.opcode();
1824 if (opcode == spv::OpTypeFloat || opcode == spv::OpTypeInt) {
1825 return 1;
1826 } else if (opcode == spv::OpTypeVector) {
1827 const uint32_t component_count = iter.word(3);
1828 return component_count;
1829 } else if (opcode == spv::OpTypeMatrix) {
1830 const auto column_type = get_def(iter.word(2));
1831 const uint32_t vector_length = GetNumComponentsInBaseType(column_type);
1832 const uint32_t column_count = iter.word(3);
1833 return vector_length * column_count;
1834 } else if (opcode == spv::OpTypeArray) {
1835 const auto element_type = get_def(iter.word(2));
1836 const uint32_t element_length = GetNumComponentsInBaseType(element_type);
1837 return element_length;
1838 } else if (opcode == spv::OpTypeStruct) {
1839 uint32_t total_size = 0;
1840 for (uint32_t i = 2; i < iter.len(); ++i) {
1841 total_size += GetNumComponentsInBaseType(get_def(iter.word(i)));
1842 }
1843 return total_size;
1844 } else if (opcode == spv::OpTypePointer) {
1845 const auto type = get_def(iter.word(3));
1846 return GetNumComponentsInBaseType(type);
1847 }
1848 return 0;
1849}
1850
ziga-lunarg2818f492021-08-12 14:30:51 +02001851std::array<uint32_t, 3> SHADER_MODULE_STATE::GetWorkgroupSize(
1852 VkPipelineShaderStageCreateInfo const *pStage, const std::unordered_map<uint32_t, std::vector<uint32_t>>& id_value_map) const {
1853 std::array<uint32_t, 3> work_group_size = {1, 1, 1};
1854
1855 uint32_t work_group_size_id = std::numeric_limits<uint32_t>::max();
1856
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -06001857 for (const auto &builtin : static_data_.builtin_decoration_list) {
ziga-lunarg2818f492021-08-12 14:30:51 +02001858 if (builtin.builtin == spv::BuiltInWorkgroupSize) {
1859 work_group_size_id = at(builtin.offset).word(1);
1860 break;
1861 }
1862 }
1863 for (auto insn : *this) {
1864 uint32_t opcode = insn.opcode();
1865 if (opcode == spv::OpSpecConstantComposite) { // WorkGroupSize must be a composite
1866 uint32_t result_id = insn.word(2);
1867 if (result_id == work_group_size_id) {
1868 uint32_t result_type_id = insn.word(1);
1869 auto result_type = get_def(result_type_id);
1870 if (result_type.opcode() == spv::OpTypeVector) {
1871 uint32_t component_count = result_type.word(3);
1872 for (uint32_t i = 0; i < component_count; ++i) {
1873 auto constituent = get_def(insn.word(3 + i));
Nathaniel Cesario77cd59b2021-10-11 23:52:24 -06001874 for (const auto &sc : static_data_.spec_const_map) {
ziga-lunarg2818f492021-08-12 14:30:51 +02001875 if (sc.second == constituent.word(2)) {
1876 const auto iter = id_value_map.find(sc.first);
1877 if (iter != id_value_map.cend()) {
1878 work_group_size[i] = *iter->second.begin();
1879 }
1880 break;
1881 }
1882 }
1883 }
1884 }
1885 }
1886 }
1887 }
1888
1889 return work_group_size;
1890}
1891
ziga-lunarga26b3602021-08-08 15:53:00 +02001892uint32_t SHADER_MODULE_STATE::GetTypeBitsSize(const spirv_inst_iter &iter) const {
1893 const uint32_t opcode = iter.opcode();
1894 if (opcode == spv::OpTypeFloat || opcode == spv::OpTypeInt) {
1895 return iter.word(2);
1896 } else if (opcode == spv::OpTypeVector) {
1897 const auto component_type = get_def(iter.word(2));
1898 uint32_t scalar_width = GetTypeBitsSize(component_type);
1899 uint32_t component_count = iter.word(3);
1900 return scalar_width * component_count;
1901 } else if (opcode == spv::OpTypeMatrix) {
1902 const auto column_type = get_def(iter.word(2));
1903 uint32_t vector_width = GetTypeBitsSize(column_type);
1904 uint32_t column_count = iter.word(3);
1905 return vector_width * column_count;
1906 } else if (opcode == spv::OpTypeArray) {
1907 const auto element_type = get_def(iter.word(2));
1908 uint32_t element_width = GetTypeBitsSize(element_type);
1909 const auto length_type = get_def(iter.word(3));
1910 uint32_t length = GetConstantValue(length_type);
1911 return element_width * length;
1912 } else if (opcode == spv::OpTypeStruct) {
1913 uint32_t total_size = 0;
1914 for (uint32_t i = 2; i < iter.len(); ++i) {
1915 total_size += GetTypeBitsSize(get_def(iter.word(i)));
1916 }
1917 return total_size;
ziga-lunarg8346fe82021-08-22 17:30:50 +02001918 } else if (opcode == spv::OpTypePointer) {
1919 const auto type = get_def(iter.word(3));
1920 return GetTypeBitsSize(type);
ziga-lunargef2c3172021-11-07 10:35:29 +01001921 } else if (opcode == spv::OpVariable) {
1922 const auto type = get_def(iter.word(1));
1923 return GetTypeBitsSize(type);
ziga-lunarga26b3602021-08-08 15:53:00 +02001924 }
1925 return 0;
1926}
1927
1928uint32_t SHADER_MODULE_STATE::GetTypeBytesSize(const spirv_inst_iter &iter) const { return GetTypeBitsSize(iter) / 8; }
1929
ziga-lunarg19fc6ae2021-09-09 00:05:19 +02001930// Returns the base type (float, int or unsigned int) or struct (can have multiple different base types inside)
ziga-lunarg8346fe82021-08-22 17:30:50 +02001931uint32_t SHADER_MODULE_STATE::GetBaseType(const spirv_inst_iter &iter) const {
1932 const uint32_t opcode = iter.opcode();
1933 if (opcode == spv::OpTypeFloat || opcode == spv::OpTypeInt || opcode == spv::OpTypeStruct) {
1934 return iter.word(1);
1935 } else if (opcode == spv::OpTypeVector) {
1936 const auto& component_type = get_def(iter.word(2));
1937 return GetBaseType(component_type);
1938 } else if (opcode == spv::OpTypeMatrix) {
1939 const auto& column_type = get_def(iter.word(2));
1940 return GetBaseType(column_type);
1941 } else if (opcode == spv::OpTypeArray) {
1942 const auto& element_type = get_def(iter.word(2));
1943 return GetBaseType(element_type);
1944 } else if (opcode == spv::OpTypePointer) {
1945 const auto& type = get_def(iter.word(3));
1946 return GetBaseType(type);
1947 }
1948 return 0;
1949}
1950
sfricke-samsunga6c1ddc2022-01-23 14:15:40 -08001951// Returns type_id if id has type or zero otherwise
1952uint32_t SHADER_MODULE_STATE::GetTypeId(uint32_t id) const {
1953 const auto type = get_def(id);
1954 return OpcodeHasType(type.opcode()) ? type.word(1) : 0;
1955}
1956
ziga-lunarga26b3602021-08-08 15:53:00 +02001957uint32_t SHADER_MODULE_STATE::CalcComputeSharedMemory(VkShaderStageFlagBits stage,
1958 const spirv_inst_iter &insn) const {
1959 if (stage == VK_SHADER_STAGE_COMPUTE_BIT && insn.opcode() == spv::OpVariable) {
1960 uint32_t storage_class = insn.word(3);
1961 if (storage_class == spv::StorageClassWorkgroup) { // StorageClass Workgroup is shared memory
1962 uint32_t result_type_id = insn.word(1);
1963 auto result_type = get_def(result_type_id);
1964 auto type = get_def(result_type.word(3));
1965 return GetTypeBytesSize(type);
1966 }
1967 }
1968
1969 return 0;
1970}
1971
sfricke-samsung962cad92021-04-13 00:46:29 -07001972// Assumes itr points to an OpConstant instruction
1973uint32_t GetConstantValue(const spirv_inst_iter &itr) { return itr.word(3); }
1974
1975std::vector<uint32_t> FindEntrypointInterfaces(const spirv_inst_iter &entrypoint) {
1976 assert(entrypoint.opcode() == spv::OpEntryPoint);
1977
1978 std::vector<uint32_t> interfaces;
1979 // Find the end of the entrypoint's name string. additional zero bytes follow the actual null terminator, to fill out the
1980 // rest of the word - so we only need to look at the last byte in the word to determine which word contains the terminator.
1981 uint32_t word = 3;
1982 while (entrypoint.word(word) & 0xff000000u) {
1983 ++word;
1984 }
1985 ++word;
1986
1987 for (; word < entrypoint.len(); word++) interfaces.push_back(entrypoint.word(word));
1988
1989 return interfaces;
1990}