Go to the documentation of this file.
50 #define DIV_UP(a, b) ( ((a) + (b) - 1) / (b) )
51 #define ALIGN_UP(a, b) (((a) + (b) - 1) & ~((b) - 1))
56 #define CHECK_CU(x) FF_CUDA_CHECK_DL(ctx, s->hwctx->internal->cuda_dl, x)
139 int in_sw, in_sh, out_sw, out_sh;
144 if (!
s->planes_out[0].width) {
145 s->planes_out[0].width =
s->planes_in[0].width;
146 s->planes_out[0].height =
s->planes_in[0].height;
150 s->planes_in[
i].width =
s->planes_in[0].width >> in_sw;
151 s->planes_in[
i].height =
s->planes_in[0].height >> in_sh;
152 s->planes_out[
i].width =
s->planes_out[0].width >> out_sw;
153 s->planes_out[
i].height =
s->planes_out[0].height >> out_sh;
175 s->frame->width =
s->planes_out[0].width;
176 s->frame->height =
s->planes_out[0].height;
179 s->frames_ctx = out_ref;
198 int out_width,
int out_height)
209 if (!
ctx->inputs[0]->hw_frames_ctx) {
228 if (in_width == out_width && in_height == out_height)
231 s->in_fmt = in_format;
232 s->out_fmt = out_format;
234 s->planes_in[0].width = in_width;
235 s->planes_in[0].height = in_height;
236 s->planes_out[0].width = out_width;
237 s->planes_out[0].height = out_height;
244 if (!
ctx->outputs[0]->hw_frames_ctx)
257 CUcontext
dummy, cuda_ctx = device_hwctx->cuda_ctx;
258 CudaFunctions *cu = device_hwctx->internal->cuda_dl;
262 extern char vf_scale_cuda_ptx[];
264 s->hwctx = device_hwctx;
265 s->cu_stream =
s->hwctx->stream;
271 ret =
CHECK_CU(cu->cuModuleLoadData(&
s->cu_module, vf_scale_cuda_ptx));
275 CHECK_CU(cu->cuModuleGetFunction(&
s->cu_func_uchar,
s->cu_module,
"Subsample_Bilinear_uchar"));
279 CHECK_CU(cu->cuModuleGetFunction(&
s->cu_func_uchar2,
s->cu_module,
"Subsample_Bilinear_uchar2"));
283 CHECK_CU(cu->cuModuleGetFunction(&
s->cu_func_uchar4,
s->cu_module,
"Subsample_Bilinear_uchar4"));
287 CHECK_CU(cu->cuModuleGetFunction(&
s->cu_func_ushort,
s->cu_module,
"Subsample_Bilinear_ushort"));
291 CHECK_CU(cu->cuModuleGetFunction(&
s->cu_func_ushort2,
s->cu_module,
"Subsample_Bilinear_ushort2"));
295 CHECK_CU(cu->cuModuleGetFunction(&
s->cu_func_ushort4,
s->cu_module,
"Subsample_Bilinear_ushort4"));
303 s->w_expr,
s->h_expr,
308 if (((int64_t)
h *
inlink->w) > INT_MAX ||
309 ((int64_t)
w *
inlink->h) > INT_MAX)
322 if (
inlink->sample_aspect_ratio.num) {
325 inlink->sample_aspect_ratio);
342 CudaFunctions *cu =
s->hwctx->internal->cuda_dl;
343 CUdeviceptr dst_devptr = (CUdeviceptr)dst_dptr;
345 void *args_uchar[] = { &tex, &dst_devptr, &dst_width, &dst_height, &
dst_pitch, &src_width, &src_height };
348 CUDA_TEXTURE_DESC tex_desc = {
349 .filterMode = CU_TR_FILTER_MODE_LINEAR,
350 .flags = CU_TRSF_READ_AS_INTEGER,
353 CUDA_RESOURCE_DESC res_desc = {
354 .resType = CU_RESOURCE_TYPE_PITCH2D,
355 .res.pitch2D.format = pixel_size == 1 ?
356 CU_AD_FORMAT_UNSIGNED_INT8 :
357 CU_AD_FORMAT_UNSIGNED_INT16,
358 .res.pitch2D.numChannels =
channels,
359 .res.pitch2D.width = src_width,
360 .res.pitch2D.height = src_height,
361 .res.pitch2D.pitchInBytes =
src_pitch * pixel_size,
362 .res.pitch2D.devPtr = (CUdeviceptr)src_dptr,
365 ret =
CHECK_CU(cu->cuTexObjectCreate(&tex, &res_desc, &tex_desc,
NULL));
375 CHECK_CU(cu->cuTexObjectDestroy(tex));
389 in->data[0],
in->width,
in->height,
in->linesize[0],
390 out->data[0],
out->width,
out->height,
out->linesize[0],
393 in->data[1],
in->width/2,
in->height/2,
in->linesize[0]/2,
394 out->data[1],
out->width/2,
out->height/2,
out->linesize[0]/2,
397 in->data[2],
in->width/2,
in->height/2,
in->linesize[0]/2,
398 out->data[2],
out->width/2,
out->height/2,
out->linesize[0]/2,
403 in->data[0],
in->width,
in->height,
in->linesize[0],
404 out->data[0],
out->width,
out->height,
out->linesize[0],
407 in->data[1],
in->width,
in->height,
in->linesize[0],
408 out->data[1],
out->width,
out->height,
out->linesize[0],
411 in->data[2],
in->width,
in->height,
in->linesize[0],
412 out->data[2],
out->width,
out->height,
out->linesize[0],
417 in->data[0],
in->width,
in->height,
in->linesize[0] / 2,
418 out->data[0],
out->width,
out->height,
out->linesize[0] / 2,
421 in->data[1],
in->width,
in->height,
in->linesize[1] / 2,
422 out->data[1],
out->width,
out->height,
out->linesize[1] / 2,
425 in->data[2],
in->width,
in->height,
in->linesize[2] / 2,
426 out->data[2],
out->width,
out->height,
out->linesize[2] / 2,
431 in->data[0],
in->width,
in->height,
in->linesize[0],
432 out->data[0],
out->width,
out->height,
out->linesize[0],
435 in->data[1],
in->width/2,
in->height/2,
in->linesize[1],
436 out->data[1],
out->width/2,
out->height/2,
out->linesize[1]/2,
441 in->data[0],
in->width,
in->height,
in->linesize[0]/2,
442 out->data[0],
out->width,
out->height,
out->linesize[0]/2,
445 in->data[1],
in->width / 2,
in->height / 2,
in->linesize[1]/2,
446 out->data[1],
out->width / 2,
out->height / 2,
out->linesize[1] / 4,
451 in->data[0],
in->width,
in->height,
in->linesize[0] / 2,
452 out->data[0],
out->width,
out->height,
out->linesize[0] / 2,
455 in->data[1],
in->width / 2,
in->height / 2,
in->linesize[1] / 2,
456 out->data[1],
out->width / 2,
out->height / 2,
out->linesize[1] / 4,
484 s->frame->width =
s->planes_out[0].width;
485 s->frame->height =
s->planes_out[0].height;
499 CudaFunctions *cu =
s->hwctx->internal->cuda_dl;
511 ret =
CHECK_CU(cu->cuCtxPushCurrent(
s->hwctx->cuda_ctx));
521 av_reduce(&
out->sample_aspect_ratio.num, &
out->sample_aspect_ratio.den,
522 (int64_t)
in->sample_aspect_ratio.num * outlink->
h *
link->w,
523 (int64_t)
in->sample_aspect_ratio.den * outlink->
w *
link->h,
534 #define OFFSET(x) offsetof(CUDAScaleContext, x)
535 #define FLAGS (AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_VIDEO_PARAM)
568 .
name =
"scale_cuda",
static const AVOption options[]
int(* func)(AVBPrint *dst, const char *in, const char *arg)
void * hwctx
The format-specific data, allocated and freed by libavutil along with this context.
@ AV_PIX_FMT_CUDA
HW acceleration through CUDA.
AVPixelFormat
Pixel format.
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
static av_cold int cudascale_init(AVFilterContext *ctx)
#define FF_FILTER_FLAG_HWFRAME_AWARE
The filter is aware of hardware frames, and any hardware frame context should not be automatically propagated through it.
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
uint8_t * data
The data buffer.
enum AVPixelFormat format
The pixel format identifying the underlying HW surface type.
The exact code depends on how similar the blocks are and how related they are to the and needs to apply these operations to the correct inlink or outlink if there are several Macros are available to factor that when no extra processing is inlink
static av_cold void cudascale_uninit(AVFilterContext *ctx)
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g. extended_data.
static int call_resize_kernel(AVFilterContext *ctx, CUfunction func, int channels, uint8_t *src_dptr, int src_width, int src_height, int src_pitch, uint8_t *dst_dptr, int dst_width, int dst_height, int dst_pitch, int pixel_size)
int av_hwframe_ctx_init(AVBufferRef *ref)
Finalize the context before use.
char * w_expr
width expression string
This structure describes decoded (raw) audio or video data.
AVBufferRef * av_hwframe_ctx_alloc(AVBufferRef *device_ref_in)
Allocate an AVHWFramesContext tied to a given device context.
#define AV_LOG_VERBOSE
Detailed information.
CUfunction cu_func_ushort4
const char * name
Filter name.
int width
The allocated dimensions of the frames in this pool.
A link between two filters.
static av_cold int init_stage(CUDAScaleContext *s, AVBufferRef *device_ctx)
static int scalecuda_resize(AVFilterContext *ctx, AVFrame *out, AVFrame *in)
int av_pix_fmt_get_chroma_sub_sample(enum AVPixelFormat pix_fmt, int *h_shift, int *v_shift)
Utility function to access log2_chroma_w log2_chroma_h from the pixel format AVPixFmtDescriptor.
int av_reduce(int *dst_num, int *dst_den, int64_t num, int64_t den, int64_t max)
Reduce a fraction.
A filter pad used for either input or output.
AVFrame * av_frame_alloc(void)
Allocate an AVFrame and set its fields to default values.
static const AVClass cudascale_class
static av_cold int cudascale_config_props(AVFilterLink *outlink)
AVCUDADeviceContext * hwctx
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
CUfunction cu_func_ushort
#define AV_PIX_FMT_YUV444P16
AVRational sample_aspect_ratio
agreed upon sample aspect ratio
static const AVFilterPad outputs[]
static enum AVPixelFormat pix_fmts[]
@ AV_PIX_FMT_YUV420P
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
static int format_is_supported(enum AVPixelFormat fmt)
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a link
#define LIBAVUTIL_VERSION_INT
Describe the class of an AVClass context structure.
enum AVPixelFormat sw_format
The pixel format identifying the actual data layout of the hardware frames.
int av_frame_copy_props(AVFrame *dst, const AVFrame *src)
Copy only "metadata" fields from src to dst.
void av_buffer_unref(AVBufferRef **buf)
Free a given reference and automatically free the buffer if there are no more references to it.
char * h_expr
height expression string
Rational number (pair of numerator and denominator).
AVBufferRef * device_ref
A reference to the parent AVHWDeviceContext.
AVFilterLink ** inputs
array of pointers to input links
const char * av_default_item_name(void *ptr)
Return the context name.
these buffered frames must be flushed immediately if a new input produces new the filter must not call request_frame to get more It must just process the frame or queue it The task of requesting more frames is left to the filter s request_frame method or the application If a filter has several inputs
static const AVFilterPad cudascale_inputs[]
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
struct CUDAScaleContext::@240 planes_out[3]
CUfunction cu_func_uchar2
static int cudascale_query_formats(AVFilterContext *ctx)
AVFilterContext * src
source filter
CUfunction cu_func_ushort2
BYTE int const BYTE int src_pitch
int ff_scale_eval_dimensions(void *log_ctx, const char *w_expr, const char *h_expr, AVFilterLink *inlink, AVFilterLink *outlink, int *ret_w, int *ret_h)
uint8_t pi<< 24) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_U8, uint8_t,(*(const uint8_t *) pi - 0x80) *(1.0f/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_U8, uint8_t,(*(const uint8_t *) pi - 0x80) *(1.0/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S16, int16_t,(*(const int16_t *) pi >> 8)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S16, int16_t, *(const int16_t *) pi *(1.0f/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S16, int16_t, *(const int16_t *) pi *(1.0/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S32, int32_t,(*(const int32_t *) pi >> 24)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S32, int32_t, *(const int32_t *) pi *(1.0f/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S32, int32_t, *(const int32_t *) pi *(1.0/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_FLT, float, av_clip_uint8(lrintf(*(const float *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_FLT, float, av_clip_int16(lrintf(*(const float *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_FLT, float, av_clipl_int32(llrintf(*(const float *) pi *(1U<< 31)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_DBL, double, av_clip_uint8(lrint(*(const double *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_DBL, double, av_clip_int16(lrint(*(const double *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_DBL, double, av_clipl_int32(llrint(*(const double *) pi *(1U<< 31)))) #define SET_CONV_FUNC_GROUP(ofmt, ifmt) static void set_generic_function(AudioConvert *ac) { } void ff_audio_convert_free(AudioConvert **ac) { if(! 
*ac) return;ff_dither_free(&(*ac) ->dc);av_freep(ac);} AudioConvert *ff_audio_convert_alloc(AVAudioResampleContext *avr, enum AVSampleFormat out_fmt, enum AVSampleFormat in_fmt, int channels, int sample_rate, int apply_map) { AudioConvert *ac;int in_planar, out_planar;ac=av_mallocz(sizeof(*ac));if(!ac) return NULL;ac->avr=avr;ac->out_fmt=out_fmt;ac->in_fmt=in_fmt;ac->channels=channels;ac->apply_map=apply_map;if(avr->dither_method !=AV_RESAMPLE_DITHER_NONE &&av_get_packed_sample_fmt(out_fmt)==AV_SAMPLE_FMT_S16 &&av_get_bytes_per_sample(in_fmt) > 2) { ac->dc=ff_dither_alloc(avr, out_fmt, in_fmt, channels, sample_rate, apply_map);if(!ac->dc) { av_free(ac);return NULL;} return ac;} in_planar=ff_sample_fmt_is_planar(in_fmt, channels);out_planar=ff_sample_fmt_is_planar(out_fmt, channels);if(in_planar==out_planar) { ac->func_type=CONV_FUNC_TYPE_FLAT;ac->planes=in_planar ? ac->channels :1;} else if(in_planar) ac->func_type=CONV_FUNC_TYPE_INTERLEAVE;else ac->func_type=CONV_FUNC_TYPE_DEINTERLEAVE;set_generic_function(ac);if(ARCH_AARCH64) ff_audio_convert_init_aarch64(ac);if(ARCH_ARM) ff_audio_convert_init_arm(ac);if(ARCH_X86) ff_audio_convert_init_x86(ac);return ac;} int ff_audio_convert(AudioConvert *ac, AudioData *out, AudioData *in) { int use_generic=1;int len=in->nb_samples;int p;if(ac->dc) { av_log(ac->avr, AV_LOG_TRACE, "%d samples - audio_convert: %s to %s (dithered)\n", len, av_get_sample_fmt_name(ac->in_fmt), av_get_sample_fmt_name(ac->out_fmt));return ff_convert_dither(ac-> in
static enum AVPixelFormat supported_formats[]
#define i(width, name, range_min, range_max)
int w
agreed upon image width
void av_frame_move_ref(AVFrame *dst, AVFrame *src)
Move everything contained in src to dst and reset src.
void av_frame_unref(AVFrame *frame)
Unreference all the buffers referenced by frame and reset the frame fields.
struct CUDAScaleContext::@240 planes_in[3]
const char * name
Pad name.
This struct describes a set or pool of "hardware" frames (i.e. those with data not located in normal system memory).
This struct is allocated as AVHWDeviceContext.hwctx.
@ AV_PIX_FMT_NV12
planar YUV 4:2:0, 12bpp, 1 plane for Y and 1 plane for the UV components, which are interleaved (first byte U and the following byte V)
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass...
AVHWDeviceContext * device_ctx
The parent AVHWDeviceContext.
@ AV_PIX_FMT_P016LE
like NV12, with 16bpp per component, little-endian
#define FF_ARRAY_ELEMS(a)
int h
agreed upon image height
CUfunction cu_func_uchar4
AVRational av_mul_q(AVRational b, AVRational c)
Multiply two rationals.
AVBufferRef * av_buffer_ref(AVBufferRef *buf)
Create a new reference to an AVBuffer.
@ AV_PIX_FMT_YUV444P
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
static const AVFilterPad cudascale_outputs[]
A reference to a data buffer.
@ AV_PIX_FMT_P010LE
like NV12, with 10bpp per component, data in the high bits, zeros in the low bits,...
static int cudascale_scale(AVFilterContext *ctx, AVFrame *out, AVFrame *in)
AVFilter ff_vf_scale_cuda
static int cudascale_filter_frame(AVFilterLink *link, AVFrame *in)
enum AVPixelFormat format
Output sw format.
enum AVPixelFormat in_fmt
static av_cold int init_processing_chain(AVFilterContext *ctx, int in_width, int in_height, int out_width, int out_height)
#define AVERROR_BUG
Internal bug, also see AVERROR_BUG2.
enum AVPixelFormat out_fmt
int av_hwframe_get_buffer(AVBufferRef *hwframe_ref, AVFrame *frame, int flags)
Allocate a new frame attached to the given AVHWFramesContext.
const char * av_get_pix_fmt_name(enum AVPixelFormat pix_fmt)
Return the short name for a pixel format, NULL in case pix_fmt is unknown.