FFmpeg
d3d12va_h264.c
Go to the documentation of this file.
1 /*
2  * Direct3D 12 h264 HW acceleration
3  *
4  * copyright (c) 2022-2023 Wu Jianhua <toqsxw@outlook.com>
5  *
6  * This file is part of FFmpeg.
7  *
8  * FFmpeg is free software; you can redistribute it and/or
9  * modify it under the terms of the GNU Lesser General Public
10  * License as published by the Free Software Foundation; either
11  * version 2.1 of the License, or (at your option) any later version.
12  *
13  * FFmpeg is distributed in the hope that it will be useful,
14  * but WITHOUT ANY WARRANTY; without even the implied warranty of
15  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16  * Lesser General Public License for more details.
17  *
18  * You should have received a copy of the GNU Lesser General Public
19  * License along with FFmpeg; if not, write to the Free Software
20  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21  */
22 
23 #include "config_components.h"
24 #include "libavutil/avassert.h"
25 #include "h264dec.h"
26 #include "h264data.h"
27 #include "h264_ps.h"
28 #include "mpegutils.h"
29 #include "dxva2_internal.h"
30 #include "d3d12va_decode.h"
32 #include <dxva.h>
33 
34 typedef struct H264DecodePictureContext {
35  DXVA_PicParams_H264 pp;
36  DXVA_Qmatrix_H264 qm;
37  unsigned slice_count;
38  DXVA_Slice_H264_Short slice_short[MAX_SLICES];
39  const uint8_t *bitstream;
40  unsigned bitstream_size;
42 
43 static void fill_slice_short(DXVA_Slice_H264_Short *slice,
44  unsigned position, unsigned size)
45 {
46  memset(slice, 0, sizeof(*slice));
47  slice->BSNALunitDataLocation = position;
48  slice->SliceBytesInBuffer = size;
49  slice->wBadSliceChopping = 0;
50 }
51 
53  av_unused const AVBufferRef *buffer_ref,
54  av_unused const uint8_t *buffer,
55  av_unused uint32_t size)
56 {
57  const H264Context *h = avctx->priv_data;
58  H264DecodePictureContext *ctx_pic = h->cur_pic_ptr->hwaccel_picture_private;
60 
61  if (!ctx)
62  return -1;
63 
64  av_assert0(ctx_pic);
65 
66  ctx->used_mask = 0;
67 
69 
71 
72  ctx_pic->slice_count = 0;
73  ctx_pic->bitstream_size = 0;
74  ctx_pic->bitstream = NULL;
75 
76  return 0;
77 }
78 
79 static int d3d12va_h264_decode_slice(AVCodecContext *avctx, const uint8_t *buffer, uint32_t size)
80 {
81  unsigned position;
82  const H264Context *h = avctx->priv_data;
83  const H264SliceContext *sl = &h->slice_ctx[0];
84  const H264Picture *current_picture = h->cur_pic_ptr;
85  H264DecodePictureContext *ctx_pic = current_picture->hwaccel_picture_private;
86 
87  if (ctx_pic->slice_count >= MAX_SLICES)
88  return AVERROR(ERANGE);
89 
90  if (!ctx_pic->bitstream)
91  ctx_pic->bitstream = buffer;
92  ctx_pic->bitstream_size += size;
93 
94  position = buffer - ctx_pic->bitstream;
95  fill_slice_short(&ctx_pic->slice_short[ctx_pic->slice_count], position, size);
96  ctx_pic->slice_count++;
97 
99  ctx_pic->pp.wBitFields &= ~(1 << 15); /* Set IntraPicFlag to 0 */
100 
101  return 0;
102 }
103 
104 #define START_CODE 65536
105 #define START_CODE_SIZE 3
106 static int update_input_arguments(AVCodecContext *avctx, D3D12_VIDEO_DECODE_INPUT_STREAM_ARGUMENTS *input_args, ID3D12Resource *buffer)
107 {
108  const H264Context *h = avctx->priv_data;
109  const H264Picture *current_picture = h->cur_pic_ptr;
110  H264DecodePictureContext *ctx_pic = current_picture->hwaccel_picture_private;
111 
112  int i;
113  uint8_t *mapped_data, *mapped_ptr;
114  DXVA_Slice_H264_Short *slice;
115  D3D12_VIDEO_DECODE_FRAME_ARGUMENT *args;
116 
117  if (FAILED(ID3D12Resource_Map(buffer, 0, NULL, (void **)&mapped_data))) {
118  av_log(avctx, AV_LOG_ERROR, "Failed to map D3D12 Buffer resource!\n");
119  return AVERROR(EINVAL);
120  }
121 
122  mapped_ptr = mapped_data;
123  for (i = 0; i < ctx_pic->slice_count; i++) {
124  UINT position, size;
125  slice = &ctx_pic->slice_short[i];
126 
127  position = slice->BSNALunitDataLocation;
128  size = slice->SliceBytesInBuffer;
129 
130  slice->SliceBytesInBuffer += START_CODE_SIZE;
131  slice->BSNALunitDataLocation = mapped_ptr - mapped_data;
132 
133  *(uint32_t *)mapped_ptr = START_CODE;
134  mapped_ptr += START_CODE_SIZE;
135 
136  memcpy(mapped_ptr, &ctx_pic->bitstream[position], size);
137  mapped_ptr += size;
138  }
139 
140  ID3D12Resource_Unmap(buffer, 0, NULL);
141 
142  input_args->CompressedBitstream = (D3D12_VIDEO_DECODE_COMPRESSED_BITSTREAM){
143  .pBuffer = buffer,
144  .Offset = 0,
145  .Size = mapped_ptr - mapped_data,
146  };
147 
148  args = &input_args->FrameArguments[input_args->NumFrameArguments++];
149  args->Type = D3D12_VIDEO_DECODE_ARGUMENT_TYPE_SLICE_CONTROL;
150  args->Size = sizeof(DXVA_Slice_H264_Short) * ctx_pic->slice_count;
151  args->pData = ctx_pic->slice_short;
152 
153  return 0;
154 }
155 
157 {
158  H264Context *h = avctx->priv_data;
159  H264DecodePictureContext *ctx_pic = h->cur_pic_ptr->hwaccel_picture_private;
160  H264SliceContext *sl = &h->slice_ctx[0];
161 
162  int ret;
163 
164  if (ctx_pic->slice_count <= 0 || ctx_pic->bitstream_size <= 0)
165  return -1;
166 
167  ret = ff_d3d12va_common_end_frame(avctx, h->cur_pic_ptr->f,
168  &ctx_pic->pp, sizeof(ctx_pic->pp),
169  &ctx_pic->qm, sizeof(ctx_pic->qm),
171  if (!ret)
172  ff_h264_draw_horiz_band(h, sl, 0, h->avctx->height);
173 
174  return ret;
175 }
176 
178 {
180  DXVA_PicParams_H264 pp;
181 
182  ctx->cfg.DecodeProfile = D3D12_VIDEO_DECODE_PROFILE_H264;
183 
184  ctx->max_num_ref = FF_ARRAY_ELEMS(pp.RefFrameList) + 1;
185 
186  return ff_d3d12va_decode_init(avctx);
187 }
188 
189 #if CONFIG_H264_D3D12VA_HWACCEL
191  .p.name = "h264_d3d12va",
192  .p.type = AVMEDIA_TYPE_VIDEO,
193  .p.id = AV_CODEC_ID_H264,
194  .p.pix_fmt = AV_PIX_FMT_D3D12,
195  .init = d3d12va_h264_decode_init,
196  .uninit = ff_d3d12va_decode_uninit,
197  .start_frame = d3d12va_h264_start_frame,
198  .decode_slice = d3d12va_h264_decode_slice,
199  .end_frame = d3d12va_h264_end_frame,
200  .frame_params = ff_d3d12va_common_frame_params,
201  .frame_priv_data_size = sizeof(H264DecodePictureContext),
202  .priv_data_size = sizeof(D3D12VADecodeContext),
203 };
204 #endif
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
av_unused
#define av_unused
Definition: attributes.h:131
FFHWAccel::p
AVHWAccel p
The public AVHWAccel.
Definition: hwaccel_internal.h:38
ff_dxva2_h264_fill_scaling_lists
void ff_dxva2_h264_fill_scaling_lists(const AVCodecContext *avctx, AVDXVAContext *ctx, DXVA_Qmatrix_H264 *qm)
Definition: dxva2_h264.c:168
mpegutils.h
H264SliceContext
Definition: h264dec.h:180
FFHWAccel
Definition: hwaccel_internal.h:34
d3d12va_h264_end_frame
static int d3d12va_h264_end_frame(AVCodecContext *avctx)
Definition: d3d12va_h264.c:156
MAX_SLICES
#define MAX_SLICES
Definition: d3d12va_hevc.c:33
avassert.h
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:209
FF_ARRAY_ELEMS
#define FF_ARRAY_ELEMS(a)
Definition: sinewin_tablegen.c:29
av_cold
#define av_cold
Definition: attributes.h:90
av_assert0
#define av_assert0(cond)
assert() equivalent, that is always enabled.
Definition: avassert.h:40
h264data.h
ctx
AVFormatContext * ctx
Definition: movenc.c:49
ff_d3d12va_common_frame_params
int ff_d3d12va_common_frame_params(AVCodecContext *avctx, AVBufferRef *hw_frames_ctx)
d3d12va common frame params
Definition: d3d12va_decode.c:271
H264SliceContext::slice_type
int slice_type
Definition: h264dec.h:186
AV_CODEC_ID_H264
@ AV_CODEC_ID_H264
Definition: codec_id.h:79
ff_h264_draw_horiz_band
void ff_h264_draw_horiz_band(const H264Context *h, H264SliceContext *sl, int y, int height)
Definition: h264dec.c:103
dxva2_internal.h
fill_slice_short
static void fill_slice_short(DXVA_Slice_H264_Short *slice, unsigned position, unsigned size)
Definition: d3d12va_h264.c:43
NULL
#define NULL
Definition: coverity.c:32
AV_PICTURE_TYPE_SI
@ AV_PICTURE_TYPE_SI
Switching Intra.
Definition: avutil.h:283
AV_PICTURE_TYPE_I
@ AV_PICTURE_TYPE_I
Intra.
Definition: avutil.h:279
ff_d3d12va_common_end_frame
int ff_d3d12va_common_end_frame(AVCodecContext *avctx, AVFrame *frame, const void *pp, unsigned pp_size, const void *qm, unsigned qm_size, int(*update_input_arguments)(AVCodecContext *, D3D12_VIDEO_DECODE_INPUT_STREAM_ARGUMENTS *, ID3D12Resource *))
d3d12va common end frame
Definition: d3d12va_decode.c:434
AV_PIX_FMT_D3D12
@ AV_PIX_FMT_D3D12
Hardware surfaces for Direct3D 12.
Definition: pixfmt.h:440
D3D12VA_DECODE_CONTEXT
#define D3D12VA_DECODE_CONTEXT(avctx)
Definition: d3d12va_decode.h:128
h264_ps.h
START_CODE_SIZE
#define START_CODE_SIZE
Definition: d3d12va_h264.c:105
size
int size
Definition: twinvq_data.h:10344
AVDXVAContext
Definition: dxva2_internal.h:74
ff_h264_d3d12va_hwaccel
const struct FFHWAccel ff_h264_d3d12va_hwaccel
ff_dxva2_h264_fill_picture_parameters
void ff_dxva2_h264_fill_picture_parameters(const AVCodecContext *avctx, AVDXVAContext *ctx, DXVA_PicParams_H264 *pp)
Definition: dxva2_h264.c:51
AVHWAccel::name
const char * name
Name of the hardware accelerated codec.
Definition: avcodec.h:1948
h264dec.h
H264DecodePictureContext::bitstream_size
unsigned bitstream_size
Definition: d3d12va_h264.c:40
H264Context
H264Context.
Definition: h264dec.h:340
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:256
ff_d3d12va_decode_init
av_cold int ff_d3d12va_decode_init(AVCodecContext *avctx)
init D3D12VADecodeContext
Definition: d3d12va_decode.c:283
H264DecodePictureContext::slice_count
unsigned slice_count
Definition: d3d12va_h264.c:37
H264DecodePictureContext::slice_short
DXVA_Slice_H264_Short slice_short[MAX_SLICES]
Definition: d3d12va_h264.c:38
d3d12va_h264_decode_slice
static int d3d12va_h264_decode_slice(AVCodecContext *avctx, const uint8_t *buffer, uint32_t size)
Definition: d3d12va_h264.c:79
ret
ret
Definition: filter_design.txt:187
AVCodecContext
main external API structure.
Definition: avcodec.h:431
buffer
the frame and frame reference mechanism is intended to as much as expensive copies of that data while still allowing the filters to produce correct results The data is stored in buffers represented by AVFrame structures Several references can point to the same frame buffer
Definition: filter_design.txt:49
H264Picture
Definition: h264dec.h:114
d3d12va_h264_start_frame
static int d3d12va_h264_start_frame(AVCodecContext *avctx, av_unused const AVBufferRef *buffer_ref, av_unused const uint8_t *buffer, av_unused uint32_t size)
Definition: d3d12va_h264.c:52
H264DecodePictureContext::qm
DXVA_Qmatrix_H264 qm
Definition: d3d12va_h264.c:36
H264DecodePictureContext::bitstream
const uint8_t * bitstream
Definition: d3d12va_h264.c:39
START_CODE
#define START_CODE
Definition: d3d12va_h264.c:104
AVMEDIA_TYPE_VIDEO
@ AVMEDIA_TYPE_VIDEO
Definition: avutil.h:201
AVBufferRef
A reference to a data buffer.
Definition: buffer.h:82
d3d12va_h264_decode_init
static av_cold int d3d12va_h264_decode_init(AVCodecContext *avctx)
Definition: d3d12va_h264.c:177
H264Picture::hwaccel_picture_private
void * hwaccel_picture_private
RefStruct reference for hardware accelerator private data.
Definition: h264dec.h:130
D3D12VADecodeContext
This structure is used to provide the necessary configurations and data to the FFmpeg Direct3D 12 HWA...
Definition: d3d12va_decode.h:37
update_input_arguments
static int update_input_arguments(AVCodecContext *avctx, D3D12_VIDEO_DECODE_INPUT_STREAM_ARGUMENTS *input_args, ID3D12Resource *buffer)
Definition: d3d12va_h264.c:106
AVCodecContext::priv_data
void * priv_data
Definition: avcodec.h:458
ff_d3d12va_decode_uninit
av_cold int ff_d3d12va_decode_uninit(AVCodecContext *avctx)
uninit D3D12VADecodeContext
Definition: d3d12va_decode.c:373
H264DecodePictureContext::pp
DXVA_PicParams_H264 pp
Definition: d3d12va_h264.c:35
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:27
h
h
Definition: vp9dsp_template.c:2070
hwcontext_d3d12va_internal.h
H264DecodePictureContext
Definition: d3d12va_h264.c:34
d3d12va_decode.h