Data Structures
struct	dim3

Macros
#define	__global__ __attribute__((global))

#define	__device__ __attribute__((device))

#define	__device_builtin__ __attribute__((device_builtin))

#define	__align__(N) __attribute__((aligned(N)))

#define	__inline__ __inline__ __attribute__((always_inline))

#define	max(a, b) ((a) > (b) ? (a) : (b))

#define	min(a, b) ((a) < (b) ? (a) : (b))

#define	abs(x) ((x) < 0 ? -(x) : (x))

#define	atomicAdd(a, b) (__atomic_fetch_add(a, b, __ATOMIC_SEQ_CST))

#define	GETCOMP(reg, comp)

#define	GET(name, reg)

#define	blockIdx (getBlockIdx())

#define	blockDim (getBlockDim())

#define	threadIdx (getThreadIdx())

#define	make_int2(a, b) ((int2){.x = a, .y = b})

#define	make_uchar2(a, b) ((uchar2){.x = a, .y = b})

#define	make_ushort2(a, b) ((ushort2){.x = a, .y = b})

#define	make_float2(a, b) ((float2){.x = a, .y = b})

#define	make_int4(a, b, c, d) ((int4){.x = a, .y = b, .z = c, .w = d})

#define	make_uchar4(a, b, c, d) ((uchar4){.x = a, .y = b, .z = c, .w = d})

#define	make_ushort4(a, b, c, d) ((ushort4){.x = a, .y = b, .z = c, .w = d})

#define	make_float4(a, b, c, d) ((float4){.x = a, .y = b, .z = c, .w = d})

#define	TEX2D(type, ret) static inline __device__ void conv(type* out, unsigned a, unsigned b, unsigned c, unsigned d) {*out = (ret);}

Typedefs
typedef __device_builtin__ unsigned long long	cudaTextureObject_t

Functions
struct __device_builtin__	__align__ (2) uchar2

struct __device_builtin__	__align__ (4) ushort2

struct __device_builtin__	__align__ (8) float2

struct __device_builtin__	__align__ (16) int4

template<typename T >
__device__ T	tex2D (cudaTextureObject_t texObject, float x, float y)

template<>
__device__ float4	tex2D< float4 > (cudaTextureObject_t texObject, float x, float y)

template<>
__device__ float	tex2D< float > (cudaTextureObject_t texObject, float x, float y)

template<>
__device__ float2	tex2D< float2 > (cudaTextureObject_t texObject, float x, float y)

static __device__ float	floorf (float a)

static __device__ float	floor (float a)

static __device__ double	floor (double a)

static __device__ float	ceilf (float a)

static __device__ float	ceil (float a)

static __device__ double	ceil (double a)

static __device__ float	truncf (float a)

static __device__ float	trunc (float a)

static __device__ double	trunc (double a)

static __device__ float	fabsf (float a)

static __device__ float	fabs (float a)

static __device__ double	fabs (double a)

static __device__ float	__sinf (float a)

static __device__ float	__cosf (float a)

Variables
	uchar2

	ushort2

	float2

	int2

	uchar4

	ushort4

	int4

	float4

Macro Definition Documentation

◆ global

#define __global__ __attribute__((global))

Definition at line 27 of file cuda_runtime.h.

◆ device

#define __device__ __attribute__((device))

Definition at line 28 of file cuda_runtime.h.

◆ __device_builtin__

#define __device_builtin__ __attribute__((device_builtin))

Definition at line 29 of file cuda_runtime.h.

◆ align

#define __align__ ( N ) __attribute__((aligned(N)))

Definition at line 30 of file cuda_runtime.h.

◆ inline

#define __inline__ __inline__ __attribute__((always_inline))

Definition at line 31 of file cuda_runtime.h.

◆ max

#define max	(	a,
		b
	)	((a) > (b) ? (a) : (b))

Definition at line 33 of file cuda_runtime.h.

◆ min

#define min	(	a,
		b
	)	((a) < (b) ? (a) : (b))

Definition at line 34 of file cuda_runtime.h.

◆ abs

#define abs ( x ) ((x) < 0 ? -(x) : (x))

Examples: encode_audio.c.

Definition at line 35 of file cuda_runtime.h.

◆ atomicAdd

#define atomicAdd	(	a,
		b
	)	(__atomic_fetch_add(a, b, __ATOMIC_SEQ_CST))

Definition at line 37 of file cuda_runtime.h.

◆ GETCOMP

#define GETCOMP	(	reg,
		comp
	)

Value:

asm("mov.u32 %0, %%" #reg "." #comp ";" : "=r"(tmp)); \

ret.comp = tmp;

Definition at line 90 of file cuda_runtime.h.

◆ GET

#define GET	(	name,
		reg
	)

Value:

    static inline __device__ uint3 name() {\
    uint3 ret; \
    unsigned tmp; \
    GETCOMP(reg, x) \
    GETCOMP(reg, y) \
    GETCOMP(reg, z) \
    return ret; \
}

Definition at line 94 of file cuda_runtime.h.

◆ blockIdx

#define blockIdx (getBlockIdx())

Definition at line 108 of file cuda_runtime.h.

◆ blockDim

#define blockDim (getBlockDim())

Definition at line 109 of file cuda_runtime.h.

◆ threadIdx

#define threadIdx (getThreadIdx())

Definition at line 110 of file cuda_runtime.h.

◆ make_int2

#define make_int2	(	a,
		b
	)	((int2){.x = a, .y = b})

Definition at line 113 of file cuda_runtime.h.

◆ make_uchar2

#define make_uchar2	(	a,
		b
	)	((uchar2){.x = a, .y = b})

Definition at line 114 of file cuda_runtime.h.

◆ make_ushort2

#define make_ushort2	(	a,
		b
	)	((ushort2){.x = a, .y = b})

Definition at line 115 of file cuda_runtime.h.

◆ make_float2

#define make_float2	(	a,
		b
	)	((float2){.x = a, .y = b})

Definition at line 116 of file cuda_runtime.h.

◆ make_int4

#define make_int4	(	a,
		b,
		c,
		d
	)	((int4){.x = a, .y = b, .z = c, .w = d})

Definition at line 117 of file cuda_runtime.h.

◆ make_uchar4

#define make_uchar4	(	a,
		b,
		c,
		d
	)	((uchar4){.x = a, .y = b, .z = c, .w = d})

Definition at line 118 of file cuda_runtime.h.

◆ make_ushort4

#define make_ushort4	(	a,
		b,
		c,
		d
	)	((ushort4){.x = a, .y = b, .z = c, .w = d})

Definition at line 119 of file cuda_runtime.h.

◆ make_float4

#define make_float4	(	a,
		b,
		c,
		d
	)	((float4){.x = a, .y = b, .z = c, .w = d})

Definition at line 120 of file cuda_runtime.h.

◆ TEX2D

#define TEX2D	(	type,
		ret
	)	static inline __device__ void conv(type* out, unsigned a, unsigned b, unsigned c, unsigned d) {*out = (ret);}

Definition at line 123 of file cuda_runtime.h.

Typedef Documentation

◆ cudaTextureObject_t

typedef __device_builtin__ unsigned long long cudaTextureObject_t

Definition at line 40 of file cuda_runtime.h.

Function Documentation

◆ align() [1/4]

struct __device_builtin__ __align__ ( 2 )

Definition at line 42 of file cuda_runtime.h.

◆ align() [2/4]

struct __device_builtin__ __align__ ( 4 )

Definition at line 47 of file cuda_runtime.h.

◆ align() [3/4]

struct __device_builtin__ __align__ ( 8 )

Definition at line 52 of file cuda_runtime.h.

◆ align() [4/4]

struct __device_builtin__ __align__ ( 16 )

Definition at line 79 of file cuda_runtime.h.

◆ tex2D()

template<typename T >

__device__ T tex2D	(	cudaTextureObject_t	texObject,
		float	x,
		float	y
	)

inline

Definition at line 137 of file cuda_runtime.h.

◆ tex2D< float4 >()

template<>

__device__ float4 tex2D< float4 >	(	cudaTextureObject_t	texObject,
		float	x,
		float	y
	)

inline

Definition at line 149 of file cuda_runtime.h.

Referenced by tex2D< float >(), and tex2D< float2 >().

◆ tex2D< float >()

template<>

__device__ float tex2D< float >	(	cudaTextureObject_t	texObject,
		float	x,
		float	y
	)

inline

Definition at line 159 of file cuda_runtime.h.

◆ tex2D< float2 >()

template<>

__device__ float2 tex2D< float2 >	(	cudaTextureObject_t	texObject,
		float	x,
		float	y
	)

inline

Definition at line 165 of file cuda_runtime.h.

◆ floorf()

static __device__ float floorf ( float a )

inlinestatic

◆ floor() [1/2]

static __device__ float floor ( float a )

inlinestatic

◆ floor() [2/2]

static __device__ double floor ( double a )

inlinestatic

Definition at line 174 of file cuda_runtime.h.

◆ ceilf()

static __device__ float ceilf ( float a )

inlinestatic

Definition at line 175 of file cuda_runtime.h.

Referenced by config_input(), cube1x6_to_xyz(), cube3x2_to_xyz(), cube6x1_to_xyz(), ff_opus_psy_init(), kaiser_params(), opus_encode_init(), select_frame(), set_special_band_scalefactors(), xyz_to_cube1x6(), xyz_to_cube3x2(), xyz_to_cube6x1(), and xyz_to_dfisheye().

◆ ceil() [1/2]

static __device__ float ceil ( float a )

inlinestatic

◆ ceil() [2/2]

static __device__ double ceil ( double a )

inlinestatic

Definition at line 177 of file cuda_runtime.h.

◆ truncf()

static __device__ float truncf ( float a )

inlinestatic

Definition at line 178 of file cuda_runtime.h.

Referenced by amrnb_decode_frame(), and amrwb_decode_frame().

◆ trunc() [1/2]

static __device__ float trunc ( float a )

inlinestatic

Definition at line 179 of file cuda_runtime.h.

Referenced by eval_expr(), and fwht_1d().

◆ trunc() [2/2]

static __device__ double trunc ( double a )

inlinestatic

Definition at line 180 of file cuda_runtime.h.

◆ fabsf()

static __device__ float fabsf ( float a )

inlinestatic

Definition at line 181 of file cuda_runtime.h.

Referenced by aac_encode_frame(), abs_pow34_v(), adaptive_gain_control(), amplify_frame(), calculate_cubic_bc_coeffs(), checkasm_check_synth_filter(), decode_spectrum_and_dequant(), elliott(), envelope(), equal(), ff_pnm_decode_header(), filter_2_1(), filter_5_0_side(), filter_5_1_back(), filter_5_1_side(), filter_frame(), filter_stereo(), filter_surround(), find_form_factor(), fir_to_phase(), float_near_abs_eps(), headphone_convolute(), headphone_fast_convolute(), IsAlmostEqual(), main(), octahedron_to_xyz(), quantize_and_encode_band_cost_template(), search_for_quantizers_anmr(), search_for_quantizers_twoloop(), set_params(), smooth(), sofalizer_convolute(), sofalizer_fast_convolute(), stereo_transform(), synthesis(), tetrahedron_to_xyz(), thresholding(), to_linear(), upmix_1_0(), upmix_3_0(), upmix_3_1(), upmix_4_0(), upmix_4_1(), upmix_5_0_back(), upmix_5_1_back(), upmix_5_1_back_2_1(), upmix_6_0(), upmix_6_1(), upmix_7_0(), upmix_7_1(), upmix_7_1_5_0_side(), upmix_7_1_5_1(), xyz_to_dfisheye(), xyz_to_flat(), and xyz_to_octahedron().

◆ fabs() [1/2]

static __device__ float fabs ( float a )

inlinestatic

Definition at line 182 of file cuda_runtime.h.

Referenced by aac_encode_frame(), av_d2q(), av_guess_frame_rate(), avformat_find_stream_info(), avresample_build_matrix(), bessel(), bitreduction(), build_filter(), butter_filter_stereo_samples(), calc_thr_3gpp(), check_diff(), check_external_clock_speed(), check_values(), compand_delay(), compand_nodelay(), compare(), compressor(), compute_acc_den(), compute_acc_num(), compute_peak(), compute_quant_matrix(), compute_target_delay(), config_filter(), config_input(), config_output(), config_props(), configure_input_video_filter(), configure_video_device(), cubic_interpolate_func(), D(), dct_error(), decfloat(), decode_lspf(), decompose_zp2biquads(), detect_clicks(), detect_clips(), detect_peak(), detect_scene_change(), double_near_abs_eps(), draw_response(), dump_fir(), encode_block(), evrc_decode_frame(), expand(), factor(), ff_inlink_evaluate_timeline_at_frame(), ff_lpc_calc_coefs(), ff_mdct15_init(), ff_mdct_init(), ff_pca(), ff_rfps_calculate(), filter_frame(), filter_slice(), filter_slice_grey_edge(), find_peak_magnitude(), fir_to_phase(), fixed_gain_smooth(), frame_erasure(), gate(), gen_mdct_exptab(), generate_kernel(), generate_window_func(), get_coeff(), get_floor_average(), get_rotation(), get_scene_score(), get_video_frame(), hypot(), init(), init_muxer(), init_pass2(), init_video_param(), inv_cdf(), lfo_advance(), M(), main(), mcompand_channel(), mov_read_tkhd(), optimize_colors(), parse_points(), parse_primary(), perform_compression(), points_not_collinear(), precalc_coefs(), print_stats(), quantize_lpc_coefs(), random_ts(), ready_residue(), residue_encode(), run_psnr(), set_constqp(), set_metadata(), set_vbr(), ssim_db(), swr_build_matrix(), swr_next_pts(), sync_clock_to_slave(), synchronize_audio(), test(), test_broadcast_input0(), test_broadcast_input1(), test_fcmul_add(), test_no_broadcast(), test_vector_dmul(), test_vector_dmul_scalar(), test_vector_fmul(), test_vector_fmul_scalar(), test_with_mode_constant(), test_with_mode_reflect(), test_with_mode_symmetric(), test_with_same(), test_with_same_dilate(), test_with_valid(), true_peak_limiter(), twinvq_mulawinv(), update_peak(), update_stat(), video_thread(), X264_init(), XAVS_init(), and yule_filter_stereo_samples().

◆ fabs() [2/2]

static __device__ double fabs ( double a )

inlinestatic

Definition at line 183 of file cuda_runtime.h.

◆ __sinf()

static __device__ float __sinf ( float a )

inlinestatic

Definition at line 185 of file cuda_runtime.h.

◆ __cosf()

static __device__ float __cosf ( float a )

inlinestatic

Definition at line 186 of file cuda_runtime.h.

Variable Documentation

◆ uchar2

uchar2

Definition at line 45 of file cuda_runtime.h.

◆ ushort2

ushort2

Definition at line 50 of file cuda_runtime.h.

◆ float2

float2

Definition at line 55 of file cuda_runtime.h.

◆ int2

int2

Definition at line 60 of file cuda_runtime.h.

◆ uchar4

uchar4

Definition at line 72 of file cuda_runtime.h.

◆ ushort4

ushort4

Definition at line 77 of file cuda_runtime.h.

◆ int4

int4

Definition at line 82 of file cuda_runtime.h.

◆ float4

float4

Definition at line 87 of file cuda_runtime.h.

Referenced by tex2D< float2 >(), and tex2D< float4 >().

Data Structures

Macros

Typedefs

Functions

Variables

Macro Definition Documentation

◆ __global__

◆ __device__

◆ __device_builtin__

◆ __align__

◆ __inline__

◆ max

◆ min

◆ abs

◆ atomicAdd

◆ GETCOMP

◆ GET

◆ blockIdx

◆ blockDim

◆ threadIdx

◆ make_int2

◆ make_uchar2

◆ make_ushort2

◆ make_float2

◆ make_int4

◆ make_uchar4

◆ make_ushort4

◆ make_float4

◆ TEX2D

Typedef Documentation

◆ cudaTextureObject_t

Function Documentation

◆ __align__() [1/4]

◆ __align__() [2/4]

◆ __align__() [3/4]

◆ __align__() [4/4]

◆ tex2D()

◆ tex2D< float4 >()

◆ tex2D< float >()

◆ tex2D< float2 >()

◆ floorf()

◆ floor() [1/2]

◆ floor() [2/2]

◆ ceilf()

◆ ceil() [1/2]

◆ ceil() [2/2]

◆ truncf()

◆ trunc() [1/2]

◆ trunc() [2/2]

◆ fabsf()

◆ fabs() [1/2]

◆ fabs() [2/2]

◆ __sinf()

◆ __cosf()

Variable Documentation

◆ uchar2

◆ ushort2

◆ float2

◆ int2

◆ uchar4

◆ ushort4

◆ int4

◆ float4

◆ global

◆ device

◆ align

◆ inline

◆ align() [1/4]

◆ align() [2/4]

◆ align() [3/4]

◆ align() [4/4]