Halide
Target.h
Go to the documentation of this file.
1 #ifndef HALIDE_TARGET_H
2 #define HALIDE_TARGET_H
3 
4 /** \file
5  * Defines the structure that describes a Halide target.
6  */
7 
8 #include <bitset>
9 #include <cstdint>
10 #include <string>
11 
12 #include "DeviceAPI.h"
13 #include "Type.h"
14 #include "runtime/HalideRuntime.h"
15 
16 namespace Halide {
17 
18 /** A struct representing a target machine and os to generate code for. */
19 struct Target {
20  /** The operating system used by the target. Determines which
21  * system calls to generate.
22  * Corresponds to os_name_map in Target.cpp. */
23  enum OS {
24  OSUnknown = 0,
27  OSX,
29  IOS,
34  } os = OSUnknown;
35 
36  /** The architecture used by the target. Determines the
37  * instruction set to use.
38  * Corresponds to arch_name_map in Target.cpp. */
39  enum Arch {
41  X86,
42  ARM,
47  } arch = ArchUnknown;
48 
49  /** The bit-width of the target machine. Must be 0 for unknown, or 32 or 64. */
50  int bits = 0;
51 
52  /** The bit-width of a vector register for targets where this is configurable and
53  * targeting a fixed size is desired. The default of 0 indicates no assumption of
54  * fixed size is allowed. */
55  int vector_bits = 0;
56 
57  /** The specific processor to be targeted, tuned for.
58  * Corresponds to processor_name_map in Target.cpp.
59  *
60  * New entries should be added to the end. */
61  enum Processor {
62  /// Do not tune for any specific CPU. In practice, this means that halide will decide the tune CPU based on the enabled features.
64  K8, /// Tune for AMD K8 Hammer CPU (AMD Family 0Fh, launched 2003).
65  K8_SSE3, /// Tune for later versions of AMD K8 CPU, with SSE3 support.
66  AMDFam10, /// Tune for AMD K10 "Barcelona" CPU (AMD Family 10h, launched 2007).
67  BtVer1, /// Tune for AMD Bobcat CPU (AMD Family 14h, launched 2011).
68  BdVer1, /// Tune for AMD Bulldozer CPU (AMD Family 15h, launched 2011).
69  BdVer2, /// Tune for AMD Piledriver CPU (AMD Family 15h (2nd-gen), launched 2012).
70  BdVer3, /// Tune for AMD Steamroller CPU (AMD Family 15h (3nd-gen), launched 2014).
71  BdVer4, /// Tune for AMD Excavator CPU (AMD Family 15h (4th-gen), launched 2015).
72  BtVer2, /// Tune for AMD Jaguar CPU (AMD Family 16h, launched 2013).
73  ZnVer1, /// Tune for AMD Zen CPU (AMD Family 17h, launched 2017).
74  ZnVer2, /// Tune for AMD Zen 2 CPU (AMD Family 17h, launched 2019).
75  ZnVer3, /// Tune for AMD Zen 3 CPU (AMD Family 19h, launched 2020).
77 
78  /** Optional features a target can have.
79  * Corresponds to feature_name_map in Target.cpp.
80  * See definitions in HalideRuntime.h for full information.
81  */
82  enum Feature {
111  OpenGLCompute = halide_target_feature_openglcompute, // NOTE: This feature is deprecated and will be removed in Halide 17.
171  };
172  Target() = default;
173  Target(OS o, Arch a, int b, Processor pt, const std::vector<Feature> &initial_features = std::vector<Feature>(),
174  int vb = 0)
175  : os(o), arch(a), bits(b), vector_bits(vb), processor_tune(pt) {
176  for (const auto &f : initial_features) {
177  set_feature(f);
178  }
179  }
180 
181  Target(OS o, Arch a, int b, const std::vector<Feature> &initial_features = std::vector<Feature>())
182  : Target(o, a, b, ProcessorGeneric, initial_features) {
183  }
184 
185  /** Given a string of the form used in HL_TARGET
186  * (e.g. "x86-64-avx"), construct the Target it specifies. Note
187  * that this always starts with the result of get_host_target(),
188  * replacing only the parts found in the target string, so if you
189  * omit (say) an OS specification, the host OS will be used
190  * instead. An empty string is exactly equivalent to
191  * get_host_target().
192  *
193  * Invalid target strings will fail with a user_error.
194  */
195  // @{
196  explicit Target(const std::string &s);
197  explicit Target(const char *s);
198  // @}
199 
200  /** Check if a target string is valid. */
201  static bool validate_target_string(const std::string &s);
202 
203  /** Return true if any of the arch/bits/os fields are "unknown"/0;
204  return false otherwise. */
205  bool has_unknowns() const;
206 
207  void set_feature(Feature f, bool value = true);
208 
209  void set_features(const std::vector<Feature> &features_to_set, bool value = true);
210 
211  bool has_feature(Feature f) const;
212 
213  inline bool has_feature(halide_target_feature_t f) const {
214  return has_feature((Feature)f);
215  }
216 
217  bool features_any_of(const std::vector<Feature> &test_features) const;
218 
219  bool features_all_of(const std::vector<Feature> &test_features) const;
220 
221  /** Return a copy of the target with the given feature set.
222  * This is convenient when enabling certain features (e.g. NoBoundsQuery)
223  * in an initialization list, where the target to be mutated may be
224  * a const reference. */
225  Target with_feature(Feature f) const;
226 
227  /** Return a copy of the target with the given feature cleared.
228  * This is convenient when disabling certain features (e.g. NoBoundsQuery)
229  * in an initialization list, where the target to be mutated may be
230  * a const reference. */
231  Target without_feature(Feature f) const;
232 
233  /** Is a fully feature GPU compute runtime enabled? I.e. is
234  * Func::gpu_tile and similar going to work? Currently includes
235  * CUDA, OpenCL, Metal and D3D12Compute. We do not include OpenGL,
236  * because it is not capable of gpgpu, and is not scheduled via
237  * Func::gpu_tile.
238  * TODO: Should OpenGLCompute be included here? */
239  bool has_gpu_feature() const;
240 
241  /** Does this target allow using a certain type. Generally all
242  * types except 64-bit float and int/uint should be supported by
243  * all backends.
244  *
245  * It is likely better to call the version below which takes a DeviceAPI.
246  */
247  bool supports_type(const Type &t) const;
248 
249  /** Does this target allow using a certain type on a certain device.
250  * This is the prefered version of this routine.
251  */
252  bool supports_type(const Type &t, DeviceAPI device) const;
253 
254  /** Returns whether a particular device API can be used with this
255  * Target. */
256  bool supports_device_api(DeviceAPI api) const;
257 
258  /** If this Target (including all Features) requires a specific DeviceAPI,
259  * return it. If it doesn't, return DeviceAPI::None. If the Target has
260  * features with multiple (different) DeviceAPI requirements, the result
261  * will be an arbitrary DeviceAPI. */
263 
264  bool operator==(const Target &other) const {
265  return os == other.os &&
266  arch == other.arch &&
267  bits == other.bits &&
268  processor_tune == other.processor_tune &&
269  features == other.features;
270  }
271 
272  bool operator!=(const Target &other) const {
273  return !(*this == other);
274  }
275 
276  /**
277  * Create a "greatest common denominator" runtime target that is compatible with
278  * both this target and \p other. Used by generators to conveniently select a suitable
279  * runtime when linking together multiple functions.
280  *
281  * @param other The other target from which we compute the gcd target.
282  * @param[out] result The gcd target if we return true, otherwise unmodified. Can be the same as *this.
283  * @return Whether it was possible to find a compatible target (true) or not.
284  */
285  bool get_runtime_compatible_target(const Target &other, Target &result);
286 
287  /** Convert the Target into a string form that can be reconstituted
288  * by merge_string(), which will always be of the form
289  *
290  * arch-bits-os-processor-feature1-feature2...featureN.
291  *
292  * Note that is guaranteed that Target(t1.to_string()) == t1,
293  * but not that Target(s).to_string() == s (since there can be
294  * multiple strings that parse to the same Target)...
295  * *unless* t1 contains 'unknown' fields (in which case you'll get a string
296  * that can't be parsed, which is intentional).
297  */
298  std::string to_string() const;
299 
300  /** Given a data type, return an estimate of the "natural" vector size
301  * for that data type when compiling for this Target. */
302  int natural_vector_size(const Halide::Type &t) const;
303 
304  /** Given a data type, return an estimate of the "natural" vector size
305  * for that data type when compiling for this Target. */
306  template<typename data_t>
307  int natural_vector_size() const {
308  return natural_vector_size(type_of<data_t>());
309  }
310 
311  /** Return true iff 64 bits and has_feature(LargeBuffers). */
312  bool has_large_buffers() const {
313  return bits == 64 && has_feature(LargeBuffers);
314  }
315 
316  /** Return the maximum buffer size in bytes supported on this
317  * Target. This is 2^31 - 1 except on 64-bit targets when the LargeBuffers
318  * feature is enabled, which expands the maximum to 2^63 - 1. */
320  if (has_large_buffers()) {
321  return (((uint64_t)1) << 63) - 1;
322  } else {
323  return (((uint64_t)1) << 31) - 1;
324  }
325  }
326 
327  /** Get the minimum cuda capability found as an integer. Returns
328  * 20 (our minimum supported cuda compute capability) if no cuda
329  * features are set. */
331 
332  /** Get the minimum Vulkan capability found as an integer. Returns
333  * 10 (our minimum supported Vulkan compute capability) if no Vulkan
334  * features are set. */
336 
337  /** Was libHalide compiled with support for this target? */
338  bool supported() const;
339 
340  /** Return a bitset of the Featuress set in this Target (set = 1).
341  * Note that while this happens to be the current internal representation,
342  * that might not always be the case. */
343  const std::bitset<FeatureEnd> &get_features_bitset() const {
344  return features;
345  }
346 
347  /** Return the name corresponding to a given Feature, in the form
348  * used to construct Target strings (e.g., Feature::Debug is "debug" and not "Debug"). */
349  static std::string feature_to_name(Target::Feature feature);
350 
351  /** Return the feature corresponding to a given name, in the form
352  * used to construct Target strings (e.g., Feature::Debug is "debug" and not "Debug").
353  * If the string is not a known feature name, return FeatureEnd. */
354  static Target::Feature feature_from_name(const std::string &name);
355 
356 private:
357  /** A bitmask that stores the active features. */
358  std::bitset<FeatureEnd> features;
359 };
360 
361 /** Return the target corresponding to the host machine. */
362 Target get_host_target();
363 
364 /** Return the target that Halide will use. If HL_TARGET is set it
365  * uses that. Otherwise calls \ref get_host_target */
367 
368 /** Return the target that Halide will use for jit-compilation. If
369  * HL_JIT_TARGET is set it uses that. Otherwise calls \ref
370  * get_host_target. Throws an error if the architecture, bit width,
371  * and OS of the target do not match the host target, so this is only
372  * useful for controlling the feature set. */
374 
375 /** Get the Target feature corresponding to a DeviceAPI. For device
376  * apis that do not correspond to any single target feature, returns
377  * Target::FeatureEnd */
379 
380 namespace Internal {
381 
382 void target_test();
383 }
384 
385 } // namespace Halide
386 
387 #endif
halide_target_feature_no_bounds_query
@ halide_target_feature_no_bounds_query
Disable the bounds querying functionality.
Definition: HalideRuntime.h:1311
Halide::Target::has_unknowns
bool has_unknowns() const
Return true if any of the arch/bits/os fields are "unknown"/0; return false otherwise.
Halide::Target::Android
@ Android
Definition: Target.h:28
Halide::Target::CLDoubles
@ CLDoubles
Definition: Target.h:108
halide_target_feature_cl_half
@ halide_target_feature_cl_half
Enable half support on OpenCL targets.
Definition: HalideRuntime.h:1370
halide_target_feature_t
halide_target_feature_t
Optional features a compilation Target can have.
Definition: HalideRuntime.h:1307
Halide::Target::has_feature
bool has_feature(Feature f) const
Halide::Target::CUDACapability30
@ CUDACapability30
Definition: Target.h:98
Halide::Target::WasmSatFloatToInt
@ WasmSatFloatToInt
Definition: Target.h:146
Halide::Target::features_all_of
bool features_all_of(const std::vector< Feature > &test_features) const
halide_target_feature_sve
@ halide_target_feature_sve
Enable ARM Scalable Vector Extensions.
Definition: HalideRuntime.h:1385
Halide::Target::SPIRV
@ SPIRV
Definition: Target.h:159
Halide::Target::HexagonDma
@ HexagonDma
Definition: Target.h:119
Halide::Target::NoNEON
@ NoNEON
Definition: Target.h:94
Halide::Target::MSAN
@ MSAN
Definition: Target.h:127
Halide::Target::AVX
@ AVX
Definition: Target.h:88
Halide::Target::operator!=
bool operator!=(const Target &other) const
Definition: Target.h:272
halide_target_feature_vulkan
@ halide_target_feature_vulkan
Enable Vulkan runtime support.
Definition: HalideRuntime.h:1396
Halide::Target::BdVer1
@ BdVer1
Tune for AMD Bobcat CPU (AMD Family 14h, launched 2011).
Definition: Target.h:68
Halide::Target::get_vulkan_capability_lower_bound
int get_vulkan_capability_lower_bound() const
Get the minimum Vulkan capability found as an integer.
Halide::get_host_target
Target get_host_target()
Return the target corresponding to the host machine.
halide_target_feature_asan
@ halide_target_feature_asan
Enable hooks for ASAN support.
Definition: HalideRuntime.h:1373
Halide::Target::ZnVer1
@ ZnVer1
Tune for AMD Jaguar CPU (AMD Family 16h, launched 2013).
Definition: Target.h:73
Halide::Target::VulkanFloat64
@ VulkanFloat64
Definition: Target.h:165
Halide::Target::vector_bits
int vector_bits
The bit-width of a vector register for targets where this is configurable and targeting a fixed size ...
Definition: Target.h:55
Halide::Target::FuzzFloatStores
@ FuzzFloatStores
Definition: Target.h:125
Halide::Target::BtVer2
@ BtVer2
Tune for AMD Excavator CPU (AMD Family 15h (4th-gen), launched 2015).
Definition: Target.h:72
halide_target_feature_vulkan_version10
@ halide_target_feature_vulkan_version10
Enable Vulkan v1.0 runtime target support.
Definition: HalideRuntime.h:1402
Halide::Target::SVE2
@ SVE2
Definition: Target.h:151
Halide::target_feature_for_device_api
Target::Feature target_feature_for_device_api(DeviceAPI api)
Get the Target feature corresponding to a DeviceAPI.
Halide::Target::Linux
@ Linux
Definition: Target.h:25
Halide::Target::BdVer3
@ BdVer3
Tune for AMD Piledriver CPU (AMD Family 15h (2nd-gen), launched 2012).
Definition: Target.h:70
Halide::Target::WebAssembly
@ WebAssembly
Definition: Target.h:45
Halide::Target::LLVMLargeCodeModel
@ LLVMLargeCodeModel
Definition: Target.h:154
Halide::Target::Profile
@ Profile
Definition: Target.h:114
Halide::Target::VulkanInt64
@ VulkanInt64
Definition: Target.h:163
halide_target_feature_sse41
@ halide_target_feature_sse41
Use SSE 4.1 and earlier instructions. Only relevant on x86.
Definition: HalideRuntime.h:1313
Halide::Target::get_features_bitset
const std::bitset< FeatureEnd > & get_features_bitset() const
Return a bitset of the Featuress set in this Target (set = 1).
Definition: Target.h:343
Halide::Target::feature_from_name
static Target::Feature feature_from_name(const std::string &name)
Return the feature corresponding to a given name, in the form used to construct Target strings (e....
Halide::Target::JIT
@ JIT
Definition: Target.h:83
halide_target_feature_d3d12compute
@ halide_target_feature_d3d12compute
Enable Direct3D 12 Compute runtime.
Definition: HalideRuntime.h:1374
Halide::Target::SanitizerCoverage
@ SanitizerCoverage
Definition: Target.h:157
Halide::Target::supports_type
bool supports_type(const Type &t) const
Does this target allow using a certain type.
Halide::Target::Feature
Feature
Optional features a target can have.
Definition: Target.h:82
halide_target_feature_no_runtime
@ halide_target_feature_no_runtime
Do not include a copy of the Halide runtime in any generated object file or assembly.
Definition: HalideRuntime.h:1346
halide_target_feature_cuda_capability32
@ halide_target_feature_cuda_capability32
Enable CUDA compute capability 3.2 (Tegra K1)
Definition: HalideRuntime.h:1328
Halide::Target::set_feature
void set_feature(Feature f, bool value=true)
halide_target_feature_profile_by_timer
@ halide_target_feature_profile_by_timer
Alternative to halide_target_feature_profile using timer interrupt for systems without threads or app...
Definition: HalideRuntime.h:1394
Halide::Target::ARMFp16
@ ARMFp16
Definition: Target.h:153
Halide::Target::to_string
std::string to_string() const
Convert the Target into a string form that can be reconstituted by merge_string(),...
halide_target_feature_vulkan_version13
@ halide_target_feature_vulkan_version13
Enable Vulkan v1.3 runtime target support.
Definition: HalideRuntime.h:1404
halide_target_feature_embed_bitcode
@ halide_target_feature_embed_bitcode
Emulate clang -fembed-bitcode flag.
Definition: HalideRuntime.h:1377
Halide::Target::TraceStores
@ TraceStores
Definition: Target.h:134
Halide::Target::AVX512_KNL
@ AVX512_KNL
Definition: Target.h:129
Halide::Target::VulkanV13
@ VulkanV13
Definition: Target.h:168
halide_target_feature_trace_stores
@ halide_target_feature_trace_stores
Trace all stores done by the pipeline. Equivalent to calling Func::trace_stores on every non-inlined ...
Definition: HalideRuntime.h:1365
Halide::Target::UserContext
@ UserContext
Definition: Target.h:113
Halide::get_target_from_environment
Target get_target_from_environment()
Return the target that Halide will use.
halide_target_feature_armv7s
@ halide_target_feature_armv7s
Generate code for ARMv7s. Only relevant for 32-bit ARM.
Definition: HalideRuntime.h:1320
halide_target_feature_msan
@ halide_target_feature_msan
Enable hooks for MSAN support.
Definition: HalideRuntime.h:1358
Halide::Target::has_gpu_feature
bool has_gpu_feature() const
Is a fully feature GPU compute runtime enabled? I.e.
Halide::Target::ProcessorGeneric
@ ProcessorGeneric
Do not tune for any specific CPU. In practice, this means that halide will decide the tune CPU based ...
Definition: Target.h:63
Halide::Target::NoAsserts
@ NoAsserts
Definition: Target.h:85
halide_target_feature_armv81a
@ halide_target_feature_armv81a
Enable ARMv8.1-a instructions.
Definition: HalideRuntime.h:1392
halide_target_feature_tsan
@ halide_target_feature_tsan
Enable hooks for TSAN support.
Definition: HalideRuntime.h:1372
Halide::Target::HVX_128
@ HVX_128
Definition: Target.h:120
Halide::Target::bits
int bits
The bit-width of the target machine.
Definition: Target.h:50
halide_target_feature_fma
@ halide_target_feature_fma
Enable x86 FMA instruction.
Definition: HalideRuntime.h:1316
Halide::Target::Vulkan
@ Vulkan
Definition: Target.h:160
halide_target_feature_hvx_v65
@ halide_target_feature_hvx_v65
Enable Hexagon v65 architecture.
Definition: HalideRuntime.h:1368
Halide::Target::SSE41
@ SSE41
Definition: Target.h:87
halide_target_feature_cl_doubles
@ halide_target_feature_cl_doubles
Enable double support on OpenCL targets.
Definition: HalideRuntime.h:1338
uint64_t
unsigned __INT64_TYPE__ uint64_t
Definition: runtime_internal.h:23
Halide::Target::TraceLoads
@ TraceLoads
Definition: Target.h:133
Halide::Target::BdVer4
@ BdVer4
Tune for AMD Steamroller CPU (AMD Family 15h (3nd-gen), launched 2014).
Definition: Target.h:71
Halide::Type
Types in the halide type system.
Definition: Type.h:276
Halide::Target::OSX
@ OSX
Definition: Target.h:27
Halide
This file defines the class FunctionDAG, which is our representation of a Halide pipeline,...
Definition: AbstractGenerator.h:19
Halide::Target::FMA
@ FMA
Definition: Target.h:90
Halide::Target::Metal
@ Metal
Definition: Target.h:116
halide_target_feature_openglcompute
@ halide_target_feature_openglcompute
Enable OpenGL Compute runtime. NOTE: This feature is deprecated and will be removed in Halide 17.
Definition: HalideRuntime.h:1341
Halide::Target::CUDACapability32
@ CUDACapability32
Definition: Target.h:99
Halide::Target::get_required_device_api
DeviceAPI get_required_device_api() const
If this Target (including all Features) requires a specific DeviceAPI, return it.
Halide::Target::VulkanInt8
@ VulkanInt8
Definition: Target.h:161
halide_target_feature_wasm_threads
@ halide_target_feature_wasm_threads
Enable use of threads in WebAssembly codegen. Requires the use of a wasm runtime that provides pthrea...
Definition: HalideRuntime.h:1382
halide_target_feature_spirv
@ halide_target_feature_spirv
Enable SPIR-V code generation support.
Definition: HalideRuntime.h:1395
Halide::Target::HVX
@ HVX
Definition: Target.h:121
Halide::Target::OS
OS
The operating system used by the target.
Definition: Target.h:23
Halide::Target::supports_device_api
bool supports_device_api(DeviceAPI api) const
Returns whether a particular device API can be used with this Target.
Halide::Target::WasmSignExt
@ WasmSignExt
Definition: Target.h:145
halide_target_feature_profile
@ halide_target_feature_profile
Launch a sampling profiler alongside the Halide pipeline that monitors and reports the runtime used b...
Definition: HalideRuntime.h:1345
Halide::Target::CUDACapability86
@ CUDACapability86
Definition: Target.h:106
Halide::Target::ZnVer3
@ ZnVer3
Tune for AMD Zen 2 CPU (AMD Family 17h, launched 2019).
Definition: Target.h:75
Halide::Target::OpenCL
@ OpenCL
Definition: Target.h:107
Halide::Target::Debug
@ Debug
Definition: Target.h:84
halide_target_feature_avx2
@ halide_target_feature_avx2
Use AVX 2 instructions. Only relevant on x86.
Definition: HalideRuntime.h:1315
halide_target_feature_avx512
@ halide_target_feature_avx512
Enable the base AVX512 subset supported by all AVX512 architectures. The specific feature sets are AV...
Definition: HalideRuntime.h:1359
Halide::Target::EnableLLVMLoopOpt
@ EnableLLVMLoopOpt
Definition: Target.h:143
halide_target_feature_semihosting
@ halide_target_feature_semihosting
Used together with Target::NoOS for the baremetal target built with semihosting library and run with ...
Definition: HalideRuntime.h:1405
Halide::Target::natural_vector_size
int natural_vector_size() const
Given a data type, return an estimate of the "natural" vector size for that data type when compiling ...
Definition: Target.h:307
halide_target_feature_end
@ halide_target_feature_end
A sentinel. Every target is considered to have this feature, and setting this feature does nothing.
Definition: HalideRuntime.h:1406
Halide::Target::K8
@ K8
Definition: Target.h:64
Halide::Target::RVV
@ RVV
Definition: Target.h:155
Halide::Target::FeatureEnd
@ FeatureEnd
Definition: Target.h:170
Halide::Target::F16C
@ F16C
Definition: Target.h:92
Halide::Target::BtVer1
@ BtVer1
Tune for AMD K10 "Barcelona" CPU (AMD Family 10h, launched 2007).
Definition: Target.h:67
Halide::Target::RISCV
@ RISCV
Definition: Target.h:46
Halide::Target::maximum_buffer_size
int64_t maximum_buffer_size() const
Return the maximum buffer size in bytes supported on this Target.
Definition: Target.h:319
halide_target_feature_avx512_skylake
@ halide_target_feature_avx512_skylake
Enable the AVX512 features supported by Skylake Xeon server processors. This adds AVX512-VL,...
Definition: HalideRuntime.h:1361
Halide::Target::Windows
@ Windows
Definition: Target.h:26
Halide::Target::FMA4
@ FMA4
Definition: Target.h:91
halide_target_feature_vulkan_int64
@ halide_target_feature_vulkan_int64
Enable Vulkan 64-bit integer support.
Definition: HalideRuntime.h:1399
Halide::Target::D3D12Compute
@ D3D12Compute
Definition: Target.h:137
Halide::Target::AVX512_Skylake
@ AVX512_Skylake
Definition: Target.h:130
halide_target_feature_strict_float
@ halide_target_feature_strict_float
Turn off all non-IEEE floating-point optimization. Currently applies only to LLVM targets.
Definition: HalideRuntime.h:1371
Halide::Target::WebAssemblyRuntime
@ WebAssemblyRuntime
Definition: Target.h:33
halide_target_feature_wasm_simd128
@ halide_target_feature_wasm_simd128
Enable +simd128 instructions for WebAssembly codegen.
Definition: HalideRuntime.h:1379
halide_target_feature_user_context
@ halide_target_feature_user_context
Generated code takes a user_context pointer as first argument.
Definition: HalideRuntime.h:1343
Halide::Target::operator==
bool operator==(const Target &other) const
Definition: Target.h:264
Halide::Target::ZnVer2
@ ZnVer2
Tune for AMD Zen CPU (AMD Family 17h, launched 2017).
Definition: Target.h:74
Halide::Target::TraceRealizations
@ TraceRealizations
Definition: Target.h:135
Halide::Target::ProfileByTimer
@ ProfileByTimer
Definition: Target.h:158
Halide::Target::CLHalf
@ CLHalf
Definition: Target.h:109
Halide::Target::os
enum Halide::Target::OS os
Halide::Target::WasmThreads
@ WasmThreads
Definition: Target.h:147
Halide::Target::X86
@ X86
Definition: Target.h:41
halide_target_feature_jit
@ halide_target_feature_jit
Generate code that will run immediately inside the calling process.
Definition: HalideRuntime.h:1308
halide_target_feature_arm_fp16
@ halide_target_feature_arm_fp16
Enable ARMv8.2-a half-precision floating point data processing.
Definition: HalideRuntime.h:1389
Halide::Target::CUDACapability35
@ CUDACapability35
Definition: Target.h:100
Halide::Target::K8_SSE3
@ K8_SSE3
Tune for AMD K8 Hammer CPU (AMD Family 0Fh, launched 2003).
Definition: Target.h:65
Halide::Target::VSX
@ VSX
Definition: Target.h:95
Halide::Target::feature_to_name
static std::string feature_to_name(Target::Feature feature)
Return the name corresponding to a given Feature, in the form used to construct Target strings (e....
Halide::Target::Semihosting
@ Semihosting
Definition: Target.h:169
halide_target_feature_no_asserts
@ halide_target_feature_no_asserts
Disable all runtime checks, for slightly tighter code.
Definition: HalideRuntime.h:1310
int64_t
signed __INT64_TYPE__ int64_t
Definition: runtime_internal.h:22
Halide::Target::NoRuntime
@ NoRuntime
Definition: Target.h:115
halide_target_feature_wasm_signext
@ halide_target_feature_wasm_signext
Enable +sign-ext instructions for WebAssembly codegen.
Definition: HalideRuntime.h:1380
halide_target_feature_no_neon
@ halide_target_feature_no_neon
Avoid using NEON instructions. Only relevant for 32-bit ARM.
Definition: HalideRuntime.h:1321
Halide::Target::CPlusPlusMangling
@ CPlusPlusMangling
Definition: Target.h:117
Halide::Target::VulkanV10
@ VulkanV10
Definition: Target.h:166
halide_target_feature_hvx_v66
@ halide_target_feature_hvx_v66
Enable Hexagon v66 architecture.
Definition: HalideRuntime.h:1369
Halide::Target::CLAtomics64
@ CLAtomics64
Definition: Target.h:110
Halide::Target::WebGPU
@ WebGPU
Definition: Target.h:149
Halide::Target::AMDFam10
@ AMDFam10
Tune for later versions of AMD K8 CPU, with SSE3 support.
Definition: Target.h:66
halide_target_feature_power_arch_2_07
@ halide_target_feature_power_arch_2_07
Use POWER ISA 2.07 new instructions. Only relevant on POWERPC.
Definition: HalideRuntime.h:1324
Type.h
halide_target_feature_large_buffers
@ halide_target_feature_large_buffers
Enable 64-bit buffer indexing to support buffers > 2GB. Ignored if bits != 64.
Definition: HalideRuntime.h:1352
halide_target_feature_opencl
@ halide_target_feature_opencl
Enable the OpenCL runtime.
Definition: HalideRuntime.h:1337
Halide::Target::VulkanInt16
@ VulkanInt16
Definition: Target.h:162
Halide::Target::Processor
Processor
The specific processor to be targeted, tuned for.
Definition: Target.h:61
halide_target_feature_enable_llvm_loop_opt
@ halide_target_feature_enable_llvm_loop_opt
Enable loop vectorization + unrolling in LLVM. Overrides halide_target_feature_disable_llvm_loop_opt....
Definition: HalideRuntime.h:1378
Halide::Target::validate_target_string
static bool validate_target_string(const std::string &s)
Check if a target string is valid.
halide_target_feature_cuda_capability61
@ halide_target_feature_cuda_capability61
Enable CUDA compute capability 6.1 (Pascal)
Definition: HalideRuntime.h:1331
halide_target_feature_trace_pipeline
@ halide_target_feature_trace_pipeline
Trace the pipeline.
Definition: HalideRuntime.h:1367
halide_target_feature_cuda_capability75
@ halide_target_feature_cuda_capability75
Enable CUDA compute capability 7.5 (Turing)
Definition: HalideRuntime.h:1333
Halide::Target::processor_tune
enum Halide::Target::Processor processor_tune
DeviceAPI.h
Halide::Target::POWERPC
@ POWERPC
Definition: Target.h:44
Halide::Target::CUDACapability50
@ CUDACapability50
Definition: Target.h:101
halide_target_feature_cuda_capability50
@ halide_target_feature_cuda_capability50
Enable CUDA compute capability 5.0 (Maxwell)
Definition: HalideRuntime.h:1330
halide_target_feature_trace_realizations
@ halide_target_feature_trace_realizations
Trace all realizations done by the pipeline. Equivalent to calling Func::trace_realizations on every ...
Definition: HalideRuntime.h:1366
Halide::Target::CUDACapability75
@ CUDACapability75
Definition: Target.h:104
Halide::Target::HVX_v65
@ HVX_v65
Definition: Target.h:123
halide_target_feature_hvx_128
@ halide_target_feature_hvx_128
Enable HVX 128 byte mode.
Definition: HalideRuntime.h:1354
Halide::Target::Fuchsia
@ Fuchsia
Definition: Target.h:32
Halide::Target::AVX512_Cannonlake
@ AVX512_Cannonlake
Definition: Target.h:131
Halide::Target::QuRT
@ QuRT
Definition: Target.h:30
Halide::Target::TracePipeline
@ TracePipeline
Definition: Target.h:136
Halide::Target::set_features
void set_features(const std::vector< Feature > &features_to_set, bool value=true)
Halide::Target::WasmBulkMemory
@ WasmBulkMemory
Definition: Target.h:148
halide_target_feature_cuda_capability86
@ halide_target_feature_cuda_capability86
Enable CUDA compute capability 8.6 (Ampere)
Definition: HalideRuntime.h:1335
halide_target_feature_vulkan_int8
@ halide_target_feature_vulkan_int8
Enable Vulkan 8-bit integer support.
Definition: HalideRuntime.h:1397
Halide::Target::AVX512_SapphireRapids
@ AVX512_SapphireRapids
Definition: Target.h:132
Halide::Target::WasmSimd128
@ WasmSimd128
Definition: Target.h:144
Halide::Target::POWER_ARCH_2_07
@ POWER_ARCH_2_07
Definition: Target.h:96
Halide::Internal::target_test
void target_test()
Halide::Target::IOS
@ IOS
Definition: Target.h:29
Halide::Target::NoOS
@ NoOS
Definition: Target.h:31
halide_target_feature_webgpu
@ halide_target_feature_webgpu
Enable the WebGPU runtime.
Definition: HalideRuntime.h:1384
halide_target_feature_cuda_capability70
@ halide_target_feature_cuda_capability70
Enable CUDA compute capability 7.0 (Volta)
Definition: HalideRuntime.h:1332
halide_target_feature_cuda_capability35
@ halide_target_feature_cuda_capability35
Enable CUDA compute capability 3.5 (Kepler)
Definition: HalideRuntime.h:1329
Halide::Target::supported
bool supported() const
Was libHalide compiled with support for this target?
Halide::Target::TSAN
@ TSAN
Definition: Target.h:139
halide_target_feature_cuda_capability30
@ halide_target_feature_cuda_capability30
Enable CUDA compute capability 3.0 (Kepler)
Definition: HalideRuntime.h:1327
halide_target_feature_vulkan_float16
@ halide_target_feature_vulkan_float16
Enable Vulkan 16-bit float support.
Definition: HalideRuntime.h:1400
halide_target_feature_cl_atomic64
@ halide_target_feature_cl_atomic64
Enable 64-bit atomics operations on OpenCL targets.
Definition: HalideRuntime.h:1339
halide_target_feature_debug
@ halide_target_feature_debug
Turn on debug info and output for runtime code.
Definition: HalideRuntime.h:1309
Halide::Target::CUDACapability70
@ CUDACapability70
Definition: Target.h:103
halide_target_feature_wasm_bulk_memory
@ halide_target_feature_wasm_bulk_memory
Enable +bulk-memory instructions for WebAssembly codegen.
Definition: HalideRuntime.h:1383
Halide::Target::CheckUnsafePromises
@ CheckUnsafePromises
Definition: Target.h:141
halide_target_feature_avx
@ halide_target_feature_avx
Use AVX 1 instructions. Only relevant on x86.
Definition: HalideRuntime.h:1314
HalideRuntime.h
Halide::Target::Arch
Arch
The architecture used by the target.
Definition: Target.h:39
Halide::Target::VulkanV12
@ VulkanV12
Definition: Target.h:167
halide_target_feature_soft_float_abi
@ halide_target_feature_soft_float_abi
Enable soft float ABI. This only enables the soft float ABI calling convention, which does not necess...
Definition: HalideRuntime.h:1357
Halide::Target::ARMv81a
@ ARMv81a
Definition: Target.h:156
Halide::Target::ASAN
@ ASAN
Definition: Target.h:140
Halide::Target::HVX_v62
@ HVX_v62
Definition: Target.h:122
Halide::Target::with_feature
Target with_feature(Feature f) const
Return a copy of the target with the given feature set.
halide_target_feature_cuda
@ halide_target_feature_cuda
Enable the CUDA runtime. Defaults to compute capability 2.0 (Fermi)
Definition: HalideRuntime.h:1326
Halide::Target::EGL
@ EGL
Definition: Target.h:112
halide_target_feature_fuzz_float_stores
@ halide_target_feature_fuzz_float_stores
On every floating point store, set the last bit of the mantissa to zero. Pipelines for which the outp...
Definition: HalideRuntime.h:1356
halide_target_feature_avx512_knl
@ halide_target_feature_avx512_knl
Enable the AVX512 features supported by Knight's Landing chips, such as the Xeon Phi x200....
Definition: HalideRuntime.h:1360
halide_target_feature_cuda_capability80
@ halide_target_feature_cuda_capability80
Enable CUDA compute capability 8.0 (Ampere)
Definition: HalideRuntime.h:1334
halide_target_feature_check_unsafe_promises
@ halide_target_feature_check_unsafe_promises
Insert assertions for promises.
Definition: HalideRuntime.h:1375
Halide::get_jit_target_from_environment
Target get_jit_target_from_environment()
Return the target that Halide will use for jit-compilation.
halide_target_feature_vulkan_version12
@ halide_target_feature_vulkan_version12
Enable Vulkan v1.2 runtime target support.
Definition: HalideRuntime.h:1403
Halide::Target::arch
enum Halide::Target::Arch arch
Halide::Target::get_runtime_compatible_target
bool get_runtime_compatible_target(const Target &other, Target &result)
Create a "greatest common denominator" runtime target that is compatible with both this target and ot...
Halide::Target::ArchUnknown
@ ArchUnknown
Definition: Target.h:40
Halide::Target::Hexagon
@ Hexagon
Definition: Target.h:43
halide_target_feature_vulkan_int16
@ halide_target_feature_vulkan_int16
Enable Vulkan 16-bit integer support.
Definition: HalideRuntime.h:1398
Halide::Target::BdVer2
@ BdVer2
Tune for AMD Bulldozer CPU (AMD Family 15h, launched 2011).
Definition: Target.h:69
Halide::Target::has_feature
bool has_feature(halide_target_feature_t f) const
Definition: Target.h:213
Halide::Target::EmbedBitcode
@ EmbedBitcode
Definition: Target.h:142
halide_target_feature_avx512_cannonlake
@ halide_target_feature_avx512_cannonlake
Enable the AVX512 features expected to be supported by future Cannonlake processors....
Definition: HalideRuntime.h:1362
halide_llvm_large_code_model
@ halide_llvm_large_code_model
Use the LLVM large code model to compile.
Definition: HalideRuntime.h:1390
halide_target_feature_egl
@ halide_target_feature_egl
Force use of EGL support.
Definition: HalideRuntime.h:1387
halide_target_feature_trace_loads
@ halide_target_feature_trace_loads
Trace all loads done by the pipeline. Equivalent to calling Func::trace_loads on every non-inlined Fu...
Definition: HalideRuntime.h:1364
Halide::Target::AVX2
@ AVX2
Definition: Target.h:89
Halide::Target::Target
Target(OS o, Arch a, int b, Processor pt, const std::vector< Feature > &initial_features=std::vector< Feature >(), int vb=0)
Definition: Target.h:173
Halide::Target::StrictFloat
@ StrictFloat
Definition: Target.h:138
halide_target_feature_c_plus_plus_mangling
@ halide_target_feature_c_plus_plus_mangling
Generate C++ mangled names for result function, et al.
Definition: HalideRuntime.h:1350
halide_target_feature_wasm_sat_float_to_int
@ halide_target_feature_wasm_sat_float_to_int
Enable saturating (nontrapping) float-to-int instructions for WebAssembly codegen.
Definition: HalideRuntime.h:1381
Halide::Target::get_cuda_capability_lower_bound
int get_cuda_capability_lower_bound() const
Get the minimum cuda capability found as an integer.
halide_target_feature_sve2
@ halide_target_feature_sve2
Enable ARM Scalable Vector Extensions v2.
Definition: HalideRuntime.h:1386
halide_target_feature_metal
@ halide_target_feature_metal
Enable the (Apple) Metal runtime.
Definition: HalideRuntime.h:1348
Halide::Target::ARMDotProd
@ ARMDotProd
Definition: Target.h:152
Halide::Target::HVX_v66
@ HVX_v66
Definition: Target.h:124
Halide::Target::ARMv7s
@ ARMv7s
Definition: Target.h:93
halide_target_feature_hexagon_dma
@ halide_target_feature_hexagon_dma
Enable Hexagon DMA buffers.
Definition: HalideRuntime.h:1376
Halide::Target::NoBoundsQuery
@ NoBoundsQuery
Definition: Target.h:86
halide_target_feature_vsx
@ halide_target_feature_vsx
Use VSX instructions. Only relevant on POWERPC.
Definition: HalideRuntime.h:1323
halide_target_feature_hvx_v62
@ halide_target_feature_hvx_v62
Enable Hexagon v62 architecture.
Definition: HalideRuntime.h:1355
Halide::Target::without_feature
Target without_feature(Feature f) const
Return a copy of the target with the given feature cleared.
halide_target_feature_fma4
@ halide_target_feature_fma4
Enable x86 (AMD) FMA4 instruction set.
Definition: HalideRuntime.h:1317
Halide::Target::ARM
@ ARM
Definition: Target.h:42
halide_target_feature_vulkan_float64
@ halide_target_feature_vulkan_float64
Enable Vulkan 64-bit float support.
Definition: HalideRuntime.h:1401
halide_target_feature_avx512_sapphirerapids
@ halide_target_feature_avx512_sapphirerapids
Enable the AVX512 features supported by Sapphire Rapids processors. This include all of the Cannonlak...
Definition: HalideRuntime.h:1363
Halide::Target::OSUnknown
@ OSUnknown
Definition: Target.h:24
Halide::Target::SoftFloatABI
@ SoftFloatABI
Definition: Target.h:126
Halide::Target
A struct representing a target machine and os to generate code for.
Definition: Target.h:19
Halide::Target::features_any_of
bool features_any_of(const std::vector< Feature > &test_features) const
Halide::Target::CUDACapability80
@ CUDACapability80
Definition: Target.h:105
Halide::Target::Target
Target(OS o, Arch a, int b, const std::vector< Feature > &initial_features=std::vector< Feature >())
Definition: Target.h:181
halide_target_feature_arm_dot_prod
@ halide_target_feature_arm_dot_prod
Enable ARMv8.2-a dotprod extension (i.e. udot and sdot instructions)
Definition: HalideRuntime.h:1388
Halide::Target::CUDACapability61
@ CUDACapability61
Definition: Target.h:102
Halide::Target::VulkanFloat16
@ VulkanFloat16
Definition: Target.h:164
Halide::Target::AVX512
@ AVX512
Definition: Target.h:128
Halide::Target::CUDA
@ CUDA
Definition: Target.h:97
halide_target_feature_rvv
@ halide_target_feature_rvv
Enable RISCV "V" Vector Extension.
Definition: HalideRuntime.h:1391
Halide::Target::Target
Target()=default
halide_target_feature_f16c
@ halide_target_feature_f16c
Enable x86 16-bit float support.
Definition: HalideRuntime.h:1318
Halide::Target::has_large_buffers
bool has_large_buffers() const
Return true iff 64 bits and has_feature(LargeBuffers).
Definition: Target.h:312
Halide::Target::LargeBuffers
@ LargeBuffers
Definition: Target.h:118
Halide::DeviceAPI
DeviceAPI
An enum describing a type of device API.
Definition: DeviceAPI.h:15
halide_target_feature_sanitizer_coverage
@ halide_target_feature_sanitizer_coverage
Enable hooks for SanitizerCoverage support.
Definition: HalideRuntime.h:1393
Halide::Target::SVE
@ SVE
Definition: Target.h:150
Halide::Target::OpenGLCompute
@ OpenGLCompute
Definition: Target.h:111