FFmpeg
d3d12va_av1.c
Go to the documentation of this file.
1 /*
2  * Direct3D 12 AV1 HW acceleration
3  *
4  * copyright (c) 2022-2023 Wu Jianhua <toqsxw@outlook.com>
5  *
6  * This file is part of FFmpeg.
7  *
8  * FFmpeg is free software; you can redistribute it and/or
9  * modify it under the terms of the GNU Lesser General Public
10  * License as published by the Free Software Foundation; either
11  * version 2.1 of the License, or (at your option) any later version.
12  *
13  * FFmpeg is distributed in the hope that it will be useful,
14  * but WITHOUT ANY WARRANTY; without even the implied warranty of
15  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16  * Lesser General Public License for more details.
17  *
18  * You should have received a copy of the GNU Lesser General Public
19  * License along with FFmpeg; if not, write to the Free Software
20  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21  */
22 
23 #include "config_components.h"
24 #include "libavutil/avassert.h"
26 #include "libavutil/mem.h"
27 #include "av1dec.h"
28 #include "dxva2_internal.h"
29 #include "d3d12va_decode.h"
30 
31 #define MAX_TILES 256
32 
33 typedef struct D3D12AV1DecodeContext {
35  uint8_t *bitstream_buffer;
37 
38 #define D3D12_AV1_DECODE_CONTEXT(avctx) ((D3D12AV1DecodeContext *)D3D12VA_DECODE_CONTEXT(avctx))
39 
40 typedef struct AV1DecodePictureContext {
41  DXVA_PicParams_AV1 pp;
42  unsigned tile_count;
43  DXVA_Tile_AV1 tiles[MAX_TILES];
44  uint8_t *bitstream;
45  unsigned bitstream_size;
47 
48 static int d3d12va_av1_start_frame(AVCodecContext *avctx, av_unused const uint8_t *buffer, av_unused uint32_t size)
49 {
50  const AV1DecContext *h = avctx->priv_data;
51  AV1DecodePictureContext *ctx_pic = h->cur_frame.hwaccel_picture_private;
53  if (!ctx)
54  return -1;
55 
56  av_assert0(ctx_pic);
57 
58  ctx->used_mask = 0;
59 
60  if (ff_dxva2_av1_fill_picture_parameters(avctx, (AVDXVAContext *)ctx, &ctx_pic->pp) < 0)
61  return -1;
62 
63  ctx_pic->bitstream = NULL;
64  ctx_pic->bitstream_size = 0;
65  ctx_pic->tile_count = 0;
66 
67  return 0;
68 }
69 
71  const uint8_t *buffer,
72  uint32_t size)
73 {
74  const AV1DecContext *h = avctx->priv_data;
75  const AV1RawFrameHeader *frame_header = h->raw_frame_header;
76  AV1DecodePictureContext *ctx_pic = h->cur_frame.hwaccel_picture_private;
77  int offset = 0;
78  uint32_t tg_start, tg_end;
79 
80  ctx_pic->tile_count = frame_header->tile_cols * frame_header->tile_rows;
81 
82  if (ctx_pic->tile_count > MAX_TILES)
83  return AVERROR(ENOSYS);
84 
85  if (ctx_pic->tile_count == h->tg_end - h->tg_start + 1) {
86  tg_start = 0;
87  tg_end = ctx_pic->tile_count - 1;
88  ctx_pic->bitstream = (uint8_t *)buffer;
89  ctx_pic->bitstream_size = size;
90  } else {
91  ctx_pic->bitstream = D3D12_AV1_DECODE_CONTEXT(avctx)->bitstream_buffer;
92  memcpy(ctx_pic->bitstream + ctx_pic->bitstream_size, buffer, size);
93  tg_start = h->tg_start;
94  tg_end = h->tg_end;
95  offset = ctx_pic->bitstream_size;
96  ctx_pic->bitstream_size += size;
97  }
98 
99  for (uint32_t tile_num = tg_start; tile_num <= tg_end; tile_num++) {
100  ctx_pic->tiles[tile_num].DataOffset = offset + h->tile_group_info[tile_num].tile_offset;
101  ctx_pic->tiles[tile_num].DataSize = h->tile_group_info[tile_num].tile_size;
102  ctx_pic->tiles[tile_num].row = h->tile_group_info[tile_num].tile_row;
103  ctx_pic->tiles[tile_num].column = h->tile_group_info[tile_num].tile_column;
104  ctx_pic->tiles[tile_num].anchor_frame = 0xFF;
105  }
106 
107  return 0;
108 }
109 
110 static int update_input_arguments(AVCodecContext *avctx, D3D12_VIDEO_DECODE_INPUT_STREAM_ARGUMENTS *input_args, ID3D12Resource *buffer)
111 {
112  const AV1DecContext *h = avctx->priv_data;
113  AV1DecodePictureContext *ctx_pic = h->cur_frame.hwaccel_picture_private;
114  void *mapped_data;
115 
116  D3D12_VIDEO_DECODE_FRAME_ARGUMENT *args = &input_args->FrameArguments[input_args->NumFrameArguments++];
117  args->Type = D3D12_VIDEO_DECODE_ARGUMENT_TYPE_SLICE_CONTROL;
118  args->Size = sizeof(DXVA_Tile_AV1) * ctx_pic->tile_count;
119  args->pData = ctx_pic->tiles;
120 
121  input_args->CompressedBitstream = (D3D12_VIDEO_DECODE_COMPRESSED_BITSTREAM){
122  .pBuffer = buffer,
123  .Offset = 0,
124  .Size = ctx_pic->bitstream_size,
125  };
126 
127  if (FAILED(ID3D12Resource_Map(buffer, 0, NULL, &mapped_data))) {
128  av_log(avctx, AV_LOG_ERROR, "Failed to map D3D12 Buffer resource!\n");
129  return AVERROR(EINVAL);
130  }
131 
132  memcpy(mapped_data, ctx_pic->bitstream, ctx_pic->bitstream_size);
133 
134  ID3D12Resource_Unmap(buffer, 0, NULL);
135 
136  return 0;
137 }
138 
140 {
141  int ret;
142  const AV1DecContext *h = avctx->priv_data;
143  AV1DecodePictureContext *ctx_pic = h->cur_frame.hwaccel_picture_private;
144 
145  if (ctx_pic->tiles <= 0 || ctx_pic->bitstream_size <= 0)
146  return -1;
147 
148  ret = ff_d3d12va_common_end_frame(avctx, h->cur_frame.f, &ctx_pic->pp, sizeof(ctx_pic->pp),
150 
151  return ret;
152 }
153 
155 {
158  DXVA_PicParams_AV1 pp;
159 
160  int ret;
161 
162  if (avctx->profile != AV_PROFILE_AV1_MAIN)
163  return AVERROR(EINVAL);
164 
165  ctx->cfg.DecodeProfile = D3D12_VIDEO_DECODE_PROFILE_AV1_PROFILE0;
166 
167  ctx->max_num_ref = FF_ARRAY_ELEMS(pp.RefFrameMapTextureIndex) + 1;
168 
169  ret = ff_d3d12va_decode_init(avctx);
170  if (ret < 0)
171  return ret;
172 
173  if (!av1_ctx->bitstream_buffer) {
175  if (!av1_ctx->bitstream_buffer)
176  return AVERROR(ENOMEM);
177  }
178 
179  return 0;
180 }
181 
183 {
185 
186  if (ctx->bitstream_buffer)
187  av_freep(&ctx->bitstream_buffer);
188 
189  return ff_d3d12va_decode_uninit(avctx);
190 }
191 
#if CONFIG_AV1_D3D12VA_HWACCEL
/* Hardware accelerator descriptor wiring the AV1 decoder to the D3D12VA
 * callbacks defined in this file. */
const FFHWAccel ff_av1_d3d12va_hwaccel = {
    .p.name               = "av1_d3d12va",
    .p.type               = AVMEDIA_TYPE_VIDEO,
    .p.id                 = AV_CODEC_ID_AV1,
    .p.pix_fmt            = AV_PIX_FMT_D3D12,
    .init                 = d3d12va_av1_decode_init,
    .uninit               = d3d12va_av1_decode_uninit,
    .start_frame          = d3d12va_av1_start_frame,
    .decode_slice         = d3d12va_av1_decode_slice,
    .end_frame            = d3d12va_av1_end_frame,
    .frame_params         = ff_d3d12va_common_frame_params,
    .frame_priv_data_size = sizeof(AV1DecodePictureContext),
    .priv_data_size       = sizeof(D3D12AV1DecodeContext),
};
#endif
D3D12AV1DecodeContext::ctx
D3D12VADecodeContext ctx
Definition: d3d12va_av1.c:34
AV1DecodePictureContext
Definition: d3d12va_av1.c:40
d3d12va_av1_end_frame
static int d3d12va_av1_end_frame(AVCodecContext *avctx)
Definition: d3d12va_av1.c:139
AVERROR
Filter: the word “frame” indicates either a video frame or a group of audio samples, as stored in an AVFrame structure. Format: for each input and each output, the list of supported formats. For video that means pixel format. For audio that means channel layout and sample format; they are references to shared objects. When the negotiation mechanism computes the intersection of the formats supported at each end of a link, all references to both lists are replaced with a reference to the intersection. And when a single format is eventually chosen for a link amongst the remaining ones, all references to the list are updated. That means that if a filter requires that its input and output have the same format amongst a supported list, all it has to do is use a reference to the same list of formats. query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references, ownership and permissions.
ff_av1_d3d12va_hwaccel
const struct FFHWAccel ff_av1_d3d12va_hwaccel
MAX_TILES
#define MAX_TILES
Definition: d3d12va_av1.c:31
av_unused
#define av_unused
Definition: attributes.h:131
FFHWAccel::p
AVHWAccel p
The public AVHWAccel.
Definition: hwaccel_internal.h:38
AV1DecodePictureContext::tiles
DXVA_Tile_AV1 tiles[MAX_TILES]
Definition: d3d12va_av1.c:43
ff_d3d12va_decode_uninit
int ff_d3d12va_decode_uninit(AVCodecContext *avctx)
uninit D3D12VADecodeContext
Definition: d3d12va_decode.c:373
D3D12AV1DecodeContext
Definition: d3d12va_av1.c:33
av_malloc
#define av_malloc(s)
Definition: tableprint_vlc.h:30
FFHWAccel
Definition: hwaccel_internal.h:34
AV1DecodePictureContext::bitstream_size
unsigned bitstream_size
Definition: d3d12va_av1.c:45
avassert.h
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:180
FF_ARRAY_ELEMS
#define FF_ARRAY_ELEMS(a)
Definition: sinewin_tablegen.c:29
av_assert0
#define av_assert0(cond)
assert() equivalent, that is always enabled.
Definition: avassert.h:40
ctx
AVFormatContext * ctx
Definition: movenc.c:49
AV1DecodePictureContext::bitstream
uint8_t * bitstream
Definition: d3d12va_av1.c:44
ff_d3d12va_common_frame_params
int ff_d3d12va_common_frame_params(AVCodecContext *avctx, AVBufferRef *hw_frames_ctx)
d3d12va common frame params
Definition: d3d12va_decode.c:271
av1dec.h
dxva2_internal.h
NULL
#define NULL
Definition: coverity.c:32
AV_CODEC_ID_AV1
@ AV_CODEC_ID_AV1
Definition: codec_id.h:280
AV1RawFrameHeader
Definition: cbs_av1.h:165
d3d12va_av1_start_frame
static int d3d12va_av1_start_frame(AVCodecContext *avctx, av_unused const uint8_t *buffer, av_unused uint32_t size)
Definition: d3d12va_av1.c:48
ff_d3d12va_common_end_frame
int ff_d3d12va_common_end_frame(AVCodecContext *avctx, AVFrame *frame, const void *pp, unsigned pp_size, const void *qm, unsigned qm_size, int(*update_input_arguments)(AVCodecContext *, D3D12_VIDEO_DECODE_INPUT_STREAM_ARGUMENTS *, ID3D12Resource *))
d3d12va common end frame
Definition: d3d12va_decode.c:434
AV_PIX_FMT_D3D12
@ AV_PIX_FMT_D3D12
Hardware surfaces for Direct3D 12.
Definition: pixfmt.h:440
D3D12VA_DECODE_CONTEXT
#define D3D12VA_DECODE_CONTEXT(avctx)
Definition: d3d12va_decode.h:128
AV1DecodePictureContext::pp
DXVA_PicParams_AV1 pp
Definition: d3d12va_av1.c:41
d3d12va_av1_decode_slice
static int d3d12va_av1_decode_slice(AVCodecContext *avctx, const uint8_t *buffer, uint32_t size)
Definition: d3d12va_av1.c:70
size
int size
Definition: twinvq_data.h:10344
AV1DecContext
Definition: av1dec.h:85
AVDXVAContext
Definition: dxva2_internal.h:74
ff_d3d12va_get_suitable_max_bitstream_size
int ff_d3d12va_get_suitable_max_bitstream_size(AVCodecContext *avctx)
Get a suitable maximum bitstream size.
Definition: d3d12va_decode.c:44
offset
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf offset
Definition: writing_filters.txt:86
AVHWAccel::name
const char * name
Name of the hardware accelerated codec.
Definition: avcodec.h:2095
D3D12_AV1_DECODE_CONTEXT
#define D3D12_AV1_DECODE_CONTEXT(avctx)
Definition: d3d12va_av1.c:38
ret
ret
Definition: filter_design.txt:187
AV1DecodePictureContext::tile_count
unsigned tile_count
Definition: d3d12va_av1.c:42
AVCodecContext
main external API structure.
Definition: avcodec.h:445
frame_header
Definition: truemotion1.c:88
D3D12AV1DecodeContext::bitstream_buffer
uint8_t * bitstream_buffer
Definition: d3d12va_av1.c:35
buffer
The frame and frame reference mechanism is intended to avoid, as much as possible, expensive copies of that data while still allowing the filters to produce correct results. The data is stored in buffers represented by AVFrame structures. Several references can point to the same frame buffer.
Definition: filter_design.txt:49
AVCodecContext::profile
int profile
profile
Definition: avcodec.h:1640
d3d12va_av1_decode_init
static int d3d12va_av1_decode_init(AVCodecContext *avctx)
Definition: d3d12va_av1.c:154
ff_dxva2_av1_fill_picture_parameters
int ff_dxva2_av1_fill_picture_parameters(const AVCodecContext *avctx, AVDXVAContext *ctx, DXVA_PicParams_AV1 *pp)
Definition: dxva2_av1.c:60
AVMEDIA_TYPE_VIDEO
@ AVMEDIA_TYPE_VIDEO
Definition: avutil.h:201
mem.h
D3D12VADecodeContext
This structure is used to provide the necessary configurations and data to the FFmpeg Direct3D 12 HWA...
Definition: d3d12va_decode.h:37
AVCodecContext::priv_data
void * priv_data
Definition: avcodec.h:472
av_freep
#define av_freep(p)
Definition: tableprint_vlc.h:34
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:27
d3d12va_av1_decode_uninit
static int d3d12va_av1_decode_uninit(AVCodecContext *avctx)
Definition: d3d12va_av1.c:182
h
h
Definition: vp9dsp_template.c:2038
update_input_arguments
static int update_input_arguments(AVCodecContext *avctx, D3D12_VIDEO_DECODE_INPUT_STREAM_ARGUMENTS *input_args, ID3D12Resource *buffer)
Definition: d3d12va_av1.c:110
hwcontext_d3d12va_internal.h
AV_PROFILE_AV1_MAIN
#define AV_PROFILE_AV1_MAIN
Definition: defs.h:168
ff_d3d12va_decode_init
int ff_d3d12va_decode_init(AVCodecContext *avctx)
init D3D12VADecodeContext
Definition: d3d12va_decode.c:283
d3d12va_decode.h