Routines specific to the Halide Cuda runtime. More...

#include "HalideRuntime.h"

Macros
#define	HALIDE_RUNTIME_CUDA

Typedefs
typedef int(*	halide_cuda_acquire_context_t) (void , void *, bool)

typedef int(*	halide_cuda_release_context_t) (void *)

typedef int(*	halide_cuda_get_stream_t) (void , void , void **)

Functions
const struct halide_device_interface_t *	halide_cuda_device_interface ()

int	halide_cuda_initialize_kernels (void user_context, void state_ptr, const char src, int size)
	These are forward declared here to allow clients to override the Halide Cuda runtime.

int	halide_cuda_run (void user_context, void state_ptr, const char entry_name, int blocksX, int blocksY, int blocksZ, int threadsX, int threadsY, int threadsZ, int shared_mem_bytes, size_t arg_sizes[], void args[], int8_t arg_is_buffer[])

void	halide_cuda_finalize_kernels (void user_context, void state_ptr)

int	halide_cuda_wrap_device_ptr (void user_context, struct halide_buffer_t buf, uint64_t device_ptr)
	Set the underlying cuda device poiner for a buffer.

int	halide_cuda_detach_device_ptr (void user_context, struct halide_buffer_t buf)
	Disconnect this halide_buffer_t from the device pointer it was previously wrapped around.

uintptr_t	halide_cuda_get_device_ptr (void user_context, struct halide_buffer_t buf)
	Return the underlying device pointer for a halide_buffer_t.

int	halide_cuda_release_unused_device_allocations (void *user_context)
	Release any currently-unused device allocations back to the cuda driver.

halide_cuda_acquire_context_t	halide_set_cuda_acquire_context (halide_cuda_acquire_context_t handler)
	Set custom methods to acquire and release cuda contexts and streams.

halide_cuda_release_context_t	halide_set_cuda_release_context (halide_cuda_release_context_t handler)

halide_cuda_get_stream_t	halide_set_cuda_get_stream (halide_cuda_get_stream_t handler)

Detailed Description

Routines specific to the Halide Cuda runtime.

Definition in file HalideRuntimeCuda.h.

Macro Definition Documentation

◆ HALIDE_RUNTIME_CUDA

#define HALIDE_RUNTIME_CUDA

Definition at line 19 of file HalideRuntimeCuda.h.

Typedef Documentation

◆ halide_cuda_acquire_context_t

typedef int(* halide_cuda_acquire_context_t) (void *, void **, bool)

Definition at line 70 of file HalideRuntimeCuda.h.

◆ halide_cuda_release_context_t

typedef int(* halide_cuda_release_context_t) (void *)

Definition at line 73 of file HalideRuntimeCuda.h.

◆ halide_cuda_get_stream_t

typedef int(* halide_cuda_get_stream_t) (void *, void *, void **)

Definition at line 74 of file HalideRuntimeCuda.h.

Function Documentation

◆ halide_cuda_device_interface()

const struct halide_device_interface_t * halide_cuda_device_interface ( )

extern

◆ halide_cuda_initialize_kernels()

int halide_cuda_initialize_kernels	(	void *	user_context,
		void **	state_ptr,
		const char *	src,
		int	size )

extern

These are forward declared here to allow clients to override the Halide Cuda runtime.

Do not call them.

◆ halide_cuda_run()

int halide_cuda_run	(	void *	user_context,
		void *	state_ptr,
		const char *	entry_name,
		int	blocksX,
		int	blocksY,
		int	blocksZ,
		int	threadsX,
		int	threadsY,
		int	threadsZ,
		int	shared_mem_bytes,
		size_t	arg_sizes[],
		void *	args[],
		int8_t	arg_is_buffer[] )

extern

◆ halide_cuda_finalize_kernels()

void halide_cuda_finalize_kernels	(	void *	user_context,
		void *	state_ptr )

extern

◆ halide_cuda_wrap_device_ptr()

int halide_cuda_wrap_device_ptr	(	void *	user_context,
		struct halide_buffer_t *	buf,
		uint64_t	device_ptr )

extern

Set the underlying cuda device poiner for a buffer.

The device pointer should be allocated using cuMemAlloc or similar and must have an extent large enough to cover that specified by the halide_buffer_t extent fields. The dev field of the halide_buffer_t must be NULL when this routine is called. This call can fail due to being passed an invalid device pointer. The device and host dirty bits are left unmodified.

◆ halide_cuda_detach_device_ptr()

int halide_cuda_detach_device_ptr	(	void *	user_context,
		struct halide_buffer_t *	buf )

extern

Disconnect this halide_buffer_t from the device pointer it was previously wrapped around.

Should only be called for a halide_buffer_t that halide_cuda_wrap_device_ptr was previously called on. The device field of the halide_buffer_t will be NULL on return.

◆ halide_cuda_get_device_ptr()

uintptr_t halide_cuda_get_device_ptr	(	void *	user_context,
		struct halide_buffer_t *	buf )

extern

Return the underlying device pointer for a halide_buffer_t.

This buffer must be valid on a Cuda device, or not have any associated device memory. If there is no device memory (dev field is NULL), this returns 0.

◆ halide_cuda_release_unused_device_allocations()

int halide_cuda_release_unused_device_allocations ( void * user_context )

extern

Release any currently-unused device allocations back to the cuda driver.

See halide_reuse_device_allocations.

◆ halide_set_cuda_acquire_context()

halide_cuda_acquire_context_t halide_set_cuda_acquire_context ( halide_cuda_acquire_context_t handler )

extern

Set custom methods to acquire and release cuda contexts and streams.

◆ halide_set_cuda_release_context()

halide_cuda_release_context_t halide_set_cuda_release_context ( halide_cuda_release_context_t handler )

extern

◆ halide_set_cuda_get_stream()

halide_cuda_get_stream_t halide_set_cuda_get_stream ( halide_cuda_get_stream_t handler )

extern

Macros

Typedefs

Functions

Detailed Description

Macro Definition Documentation

◆ HALIDE_RUNTIME_CUDA

Typedef Documentation

◆ halide_cuda_acquire_context_t

◆ halide_cuda_release_context_t

◆ halide_cuda_get_stream_t

Function Documentation

◆ halide_cuda_device_interface()

◆ halide_cuda_initialize_kernels()

◆ halide_cuda_run()

◆ halide_cuda_finalize_kernels()

◆ halide_cuda_wrap_device_ptr()

◆ halide_cuda_detach_device_ptr()

◆ halide_cuda_get_device_ptr()

◆ halide_cuda_release_unused_device_allocations()

◆ halide_set_cuda_acquire_context()

◆ halide_set_cuda_release_context()

◆ halide_set_cuda_get_stream()