// Copyright 2018 The Clspv Authors. All rights reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

// This translation unit defines all Clspv command line option variables.

#include <cstdint>

#include "llvm/PassRegistry.h"
#include "llvm/Support/CommandLine.h"

#include "Passes.h"
#include "clspv/Option.h"

David Neto482550a2018-03-24 05:21:07 -070023namespace {
David Neto862b7d82018-06-14 18:48:37 -040024
Alan Bakeraf289ab2018-08-29 11:26:44 -040025llvm::cl::opt<bool>
26 inline_entry_points("inline-entry-points", llvm::cl::init(false),
27 llvm::cl::desc("Exhaustively inline entry points."));
28
Alan Baker0dd3fd22018-08-24 11:03:12 -040029llvm::cl::opt<bool> no_inline_single_call_site(
30 "no-inline-single", llvm::cl::init(false),
31 llvm::cl::desc("Disable inlining functions with single call sites."));
32
David Netoc5fb5242018-07-30 13:28:31 -040033// Should the compiler try to use direct resource accesses within helper
David Neto862b7d82018-06-14 18:48:37 -040034// functions instead of passing pointers via function arguments?
David Netoc5fb5242018-07-30 13:28:31 -040035llvm::cl::opt<bool> no_direct_resource_access(
36 "no-dra", llvm::cl::init(false),
David Neto862b7d82018-06-14 18:48:37 -040037 llvm::cl::desc(
David Netoc5fb5242018-07-30 13:28:31 -040038 "No Direct Resource Access: Avoid rewriting helper functions "
39 "to access resources directly instead of by pointers "
40 "in function arguments. Affects kernel arguments of type "
41 "pointer-to-global, pointer-to-constant, image, and sampler."));
David Neto862b7d82018-06-14 18:48:37 -040042
Alan Bakerfc6888e2018-08-20 20:54:33 -040043llvm::cl::opt<bool> no_share_module_scope_variables(
44 "no-smsv", llvm::cl::init(false),
45 llvm::cl::desc("No Share Module Scope Variables: Avoid de-duplicating "
46 "module scope variables."));
47
David Neto482550a2018-03-24 05:21:07 -070048// By default, reuse the same descriptor set number for all arguments.
49// To turn that off, use -distinct-kernel-descriptor-sets
50llvm::cl::opt<bool> distinct_kernel_descriptor_sets(
51 "distinct-kernel-descriptor-sets", llvm::cl::init(false),
Alan Bakerfc6888e2018-08-20 20:54:33 -040052 llvm::cl::desc("Each kernel uses its own descriptor set for its arguments. "
53 "Turns off direct-resource-access optimizations."));
David Neto482550a2018-03-24 05:21:07 -070054
55// TODO(dneto): As per Neil Henning suggestion, might not need this if
56// you can trace the pointer back far enough to see that it's 32-bit
57// aligned. However, even in the vstore_half case, you'll probably get
58// better performance if you can rely on SPV_KHR_16bit_storage since in
59// the alternate case you're using a (relaxed) atomic, and therefore
60// have to write through to the cache.
61llvm::cl::opt<bool> f16bit_storage(
62 "f16bit_storage", llvm::cl::init(false),
63 llvm::cl::desc("Assume the target supports SPV_KHR_16bit_storage"));
64
David Netob6e2e062018-04-25 10:32:06 -040065llvm::cl::opt<bool> hack_initializers(
66 "hack-initializers", llvm::cl::init(false),
67 llvm::cl::desc(
68 "At the start of each kernel, explicitly write the initializer "
69 "value for a compiler-generated variable containing the workgroup "
70 "size. Required by some drivers to make the get_global_size builtin "
71 "function work when used with non-constant dimension index."));
72
David Neto862b7d82018-06-14 18:48:37 -040073llvm::cl::opt<bool> hack_dis(
74 "hack-dis", llvm::cl::init(false),
Alan Bakerfc6888e2018-08-20 20:54:33 -040075 llvm::cl::desc("Force use of a distinct image or sampler variable for each "
76 "image or sampler kernel argument. This prevents sharing "
77 "of resource variables."));
David Neto862b7d82018-06-14 18:48:37 -040078
David Neto482550a2018-03-24 05:21:07 -070079llvm::cl::opt<bool> hack_inserts(
80 "hack-inserts", llvm::cl::init(false),
81 llvm::cl::desc(
82 "Avoid all single-index OpCompositInsert instructions "
83 "into struct types by using complete composite construction and "
84 "extractions"));
85
David Neto3a0df832018-08-03 14:35:42 -040086llvm::cl::opt<bool> hack_signed_compare_fixup(
87 "hack-scf", llvm::cl::init(false),
88 llvm::cl::desc("Rewrite signed integer comparisons to use other kinds of "
89 "instructions"));
90
David Neto482550a2018-03-24 05:21:07 -070091// Some drivers don't like to see constant composite values constructed
92// from scalar Undef values. Replace numeric scalar and vector Undef with
93// corresponding OpConstantNull. We need to keep Undef for image values,
94// for example. In the LLVM domain, image values are passed as pointer to
95// struct.
96// See https://github.com/google/clspv/issues/95
97llvm::cl::opt<bool> hack_undef(
98 "hack-undef", llvm::cl::init(false),
99 llvm::cl::desc("Use OpConstantNull instead of OpUndef for floating point, "
100 "integer, or vectors of them"));
101
Alan Baker33376ea2018-08-30 12:02:31 -0400102llvm::cl::opt<bool> hack_phis(
103 "hack-phis", llvm::cl::init(false),
104 llvm::cl::desc(
105 "Scalarize phi instructions of struct type before code generation"));
106
alan-baker3fa76d92018-11-12 14:54:40 -0500107llvm::cl::opt<bool> hack_block_order(
108 "hack-block-order", llvm::cl::init(false),
109 llvm::cl::desc("Order basic blocks using structured order"));
110
David Neto482550a2018-03-24 05:21:07 -0700111llvm::cl::opt<bool>
112 pod_ubo("pod-ubo", llvm::cl::init(false),
113 llvm::cl::desc("POD kernel arguments are in uniform buffers"));
114
alan-baker9b0ec3c2020-04-06 14:45:34 -0400115llvm::cl::opt<bool> pod_pushconstant(
116 "pod-pushconstant",
117 llvm::cl::desc("POD kernel arguments are in the push constant interface"),
118 llvm::cl::init(false));
119
David Neto85082642018-03-24 06:55:20 -0700120llvm::cl::opt<bool> module_constants_in_storage_buffer(
121 "module-constants-in-storage-buffer", llvm::cl::init(false),
122 llvm::cl::desc(
123 "Module-scope __constants are collected into a single storage buffer. "
124 "The binding and initialization data are reported in the descriptor "
125 "map."));
126
David Neto482550a2018-03-24 05:21:07 -0700127llvm::cl::opt<bool> show_ids("show-ids", llvm::cl::init(false),
128 llvm::cl::desc("Show SPIR-V IDs for functions"));
129
Alan Bakerfcda9482018-10-02 17:09:59 -0400130llvm::cl::opt<bool> constant_args_in_uniform_buffer(
131 "constant-args-ubo", llvm::cl::init(false),
132 llvm::cl::desc("Put pointer-to-constant kernel args in UBOs."));
133
alan-baker3d9e2012019-01-11 14:55:30 -0500134// Default to 64kB.
135llvm::cl::opt<int> maximum_ubo_size(
136 "max-ubo-size", llvm::cl::init(64 << 10),
137 llvm::cl::desc("Specify the maximum UBO array size in bytes."));
138
alan-baker9b0ec3c2020-04-06 14:45:34 -0400139llvm::cl::opt<int> maximum_pushconstant_size(
140 "max-pushconstant-size", llvm::cl::init(128),
141 llvm::cl::desc(
142 "Specify the maximum push constant interface size in bytes."));
143
alan-baker3d9e2012019-01-11 14:55:30 -0500144llvm::cl::opt<bool> relaxed_ubo_layout(
145 "relaxed-ubo-layout",
146 llvm::cl::desc("Allow UBO layouts, that do not satisfy the restriction "
147 "that ArrayStride is a multiple of array alignment. This "
148 "does not generate valid SPIR-V for the Vulkan environment; "
149 "however, some drivers may accept it."));
150
alan-bakera3e02382019-02-15 08:27:27 -0500151llvm::cl::opt<bool> std430_ubo_layout(
alan-baker4217b322019-03-06 08:56:12 -0500152 "std430-ubo-layout", llvm::cl::init(false),
alan-bakera3e02382019-02-15 08:27:27 -0500153 llvm::cl::desc("Allow UBO layouts that conform to std430 (SSBO) layout "
154 "requirements. This does not generate valid SPIR-V for the "
155 "Vulkan environment; however, some drivers may accept it."));
156
alan-baker4217b322019-03-06 08:56:12 -0500157llvm::cl::opt<bool> keep_unused_arguments(
158 "keep-unused-arguments", llvm::cl::init(false),
159 llvm::cl::desc("Do not remove unused non-kernel function arguments."));
160
alan-bakerace4e592019-04-09 08:43:22 -0400161llvm::cl::opt<bool> int8_support("int8", llvm::cl::init(true),
alan-bakerb39c8262019-03-08 14:03:37 -0500162 llvm::cl::desc("Allow 8-bit integers"));
163
Kévin Petitf0515712020-01-07 18:29:20 +0000164llvm::cl::opt<clspv::Option::SourceLanguage> cl_std(
165 "cl-std", llvm::cl::desc("Select OpenCL standard"),
166 llvm::cl::init(clspv::Option::SourceLanguage::OpenCL_C_12),
167 llvm::cl::values(clEnumValN(clspv::Option::SourceLanguage::OpenCL_C_10,
168 "CL1.0", "OpenCL C 1.0"),
169 clEnumValN(clspv::Option::SourceLanguage::OpenCL_C_11,
170 "CL1.1", "OpenCL C 1.1"),
171 clEnumValN(clspv::Option::SourceLanguage::OpenCL_C_12,
172 "CL1.2", "OpenCL C 1.2"),
173 clEnumValN(clspv::Option::SourceLanguage::OpenCL_C_20,
174 "CL2.0", "OpenCL C 2.0"),
175 clEnumValN(clspv::Option::SourceLanguage::OpenCL_CPP,
176 "CLC++", "C++ for OpenCL")));
Kévin Petita624c0c2019-05-07 20:27:43 +0800177
178static llvm::cl::opt<bool> images("images", llvm::cl::init(true),
179 llvm::cl::desc("Enable support for images"));
alan-baker09cb9802019-12-10 13:16:27 -0500180
Kévin Petitbbbda972020-03-03 19:16:31 +0000181static llvm::cl::opt<bool>
182 scalar_block_layout("scalar-block-layout", llvm::cl::init(false),
183 llvm::cl::desc("Assume VK_EXT_scalar_block_layout"));
184
185static llvm::cl::opt<bool> work_dim(
alan-bakerbed3a882020-04-21 14:42:41 -0400186 "work-dim", llvm::cl::init(true),
Kévin Petitbbbda972020-03-03 19:16:31 +0000187 llvm::cl::desc("Enable support for get_work_dim() built-in function"));
188
189static llvm::cl::opt<bool>
190 global_offset("global-offset", llvm::cl::init(false),
191 llvm::cl::desc("Enable support for global offsets"));
192
alan-baker09cb9802019-12-10 13:16:27 -0500193static bool use_sampler_map = false;
alan-baker9b0ec3c2020-04-06 14:45:34 -0400194
195static llvm::cl::opt<bool> cluster_non_pointer_kernel_args(
alan-baker374ce1a2020-04-07 20:37:20 -0400196 "cluster-pod-kernel-args", llvm::cl::init(true),
alan-baker9b0ec3c2020-04-06 14:45:34 -0400197 llvm::cl::desc("Collect plain-old-data kernel arguments into a struct in "
198 "a single storage buffer, using a binding number after "
199 "other arguments. Use this to reduce storage buffer "
200 "descriptors."));
201
David Neto482550a2018-03-24 05:21:07 -0700202} // namespace
203
204namespace clspv {
205namespace Option {
206
Alan Bakeraf289ab2018-08-29 11:26:44 -0400207bool InlineEntryPoints() { return inline_entry_points; }
Alan Baker0dd3fd22018-08-24 11:03:12 -0400208bool InlineSingleCallSite() { return !no_inline_single_call_site; }
David Netoc5fb5242018-07-30 13:28:31 -0400209bool DirectResourceAccess() {
210 return !(no_direct_resource_access || distinct_kernel_descriptor_sets);
211}
Alan Bakerfc6888e2018-08-20 20:54:33 -0400212bool ShareModuleScopeVariables() { return !no_share_module_scope_variables; }
David Neto482550a2018-03-24 05:21:07 -0700213bool DistinctKernelDescriptorSets() { return distinct_kernel_descriptor_sets; }
214bool F16BitStorage() { return f16bit_storage; }
David Neto862b7d82018-06-14 18:48:37 -0400215bool HackDistinctImageSampler() { return hack_dis; }
David Netob6e2e062018-04-25 10:32:06 -0400216bool HackInitializers() { return hack_initializers; }
David Neto482550a2018-03-24 05:21:07 -0700217bool HackInserts() { return hack_inserts; }
David Neto3a0df832018-08-03 14:35:42 -0400218bool HackSignedCompareFixup() { return hack_signed_compare_fixup; }
David Neto482550a2018-03-24 05:21:07 -0700219bool HackUndef() { return hack_undef; }
Alan Baker33376ea2018-08-30 12:02:31 -0400220bool HackPhis() { return hack_phis; }
alan-baker3fa76d92018-11-12 14:54:40 -0500221bool HackBlockOrder() { return hack_block_order; }
Alan Bakerfc6888e2018-08-20 20:54:33 -0400222bool ModuleConstantsInStorageBuffer() {
223 return module_constants_in_storage_buffer;
224}
David Neto482550a2018-03-24 05:21:07 -0700225bool PodArgsInUniformBuffer() { return pod_ubo; }
alan-baker9b0ec3c2020-04-06 14:45:34 -0400226bool PodArgsInPushConstants() { return pod_pushconstant; }
David Neto482550a2018-03-24 05:21:07 -0700227bool ShowIDs() { return show_ids; }
alan-baker3fa76d92018-11-12 14:54:40 -0500228bool ConstantArgsInUniformBuffer() { return constant_args_in_uniform_buffer; }
alan-baker3d9e2012019-01-11 14:55:30 -0500229uint64_t MaxUniformBufferSize() { return maximum_ubo_size; }
alan-baker9b0ec3c2020-04-06 14:45:34 -0400230uint32_t MaxPushConstantsSize() { return maximum_pushconstant_size; }
alan-baker3d9e2012019-01-11 14:55:30 -0500231bool RelaxedUniformBufferLayout() { return relaxed_ubo_layout; }
alan-bakera3e02382019-02-15 08:27:27 -0500232bool Std430UniformBufferLayout() { return std430_ubo_layout; }
alan-baker4217b322019-03-06 08:56:12 -0500233bool KeepUnusedArguments() { return keep_unused_arguments; }
alan-bakerb39c8262019-03-08 14:03:37 -0500234bool Int8Support() { return int8_support; }
Kévin Petita624c0c2019-05-07 20:27:43 +0800235bool ImageSupport() { return images; }
alan-baker09cb9802019-12-10 13:16:27 -0500236bool UseSamplerMap() { return use_sampler_map; }
237void SetUseSamplerMap(bool use) { use_sampler_map = use; }
Kévin Petitf0515712020-01-07 18:29:20 +0000238SourceLanguage Language() { return cl_std; }
Kévin Petitbbbda972020-03-03 19:16:31 +0000239bool ScalarBlockLayout() { return scalar_block_layout; }
240bool WorkDim() { return work_dim; }
241bool GlobalOffset() { return global_offset; }
alan-baker9b0ec3c2020-04-06 14:45:34 -0400242bool ClusterPodKernelArgs() { return cluster_non_pointer_kernel_args; }
David Neto482550a2018-03-24 05:21:07 -0700243
244} // namespace Option
245} // namespace clspv