FFmpeg
d3d12va_encode.c
Go to the documentation of this file.
1 /*
2  * Direct3D 12 HW acceleration video encoder
3  *
4  * Copyright (c) 2024 Intel Corporation
5  *
6  * This file is part of FFmpeg.
7  *
8  * FFmpeg is free software; you can redistribute it and/or
9  * modify it under the terms of the GNU Lesser General Public
10  * License as published by the Free Software Foundation; either
11  * version 2.1 of the License, or (at your option) any later version.
12  *
13  * FFmpeg is distributed in the hope that it will be useful,
14  * but WITHOUT ANY WARRANTY; without even the implied warranty of
15  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16  * Lesser General Public License for more details.
17  *
18  * You should have received a copy of the GNU Lesser General Public
19  * License along with FFmpeg; if not, write to the Free Software
20  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21  */
22 
23 #include "libavutil/avassert.h"
24 #include "libavutil/common.h"
25 #include "libavutil/internal.h"
26 #include "libavutil/log.h"
27 #include "libavutil/mem.h"
28 #include "libavutil/pixdesc.h"
31 
32 #include "avcodec.h"
33 #include "d3d12va_encode.h"
34 #include "encode.h"
35 
37  HW_CONFIG_ENCODER_FRAMES(D3D12, D3D12VA),
38  NULL,
39 };
40 
42 {
/*
 * Wait on the CPU until psync_ctx->fence has reached psync_ctx->fence_value.
 * Returns 0 when the fence was already complete or after the wait returned,
 * and AVERROR(EINVAL) if the completion event could not be registered.
 */
43  uint64_t completion = ID3D12Fence_GetCompletedValue(psync_ctx->fence);
44  if (completion < psync_ctx->fence_value) {
/* Not reached yet: ask the fence to signal the event at fence_value. */
45  if (FAILED(ID3D12Fence_SetEventOnCompletion(psync_ctx->fence, psync_ctx->fence_value, psync_ctx->event)))
46  return AVERROR(EINVAL);
47 
/* Wait without a timeout; the wait result itself is not inspected. */
48  WaitForSingleObjectEx(psync_ctx->event, INFINITE, FALSE);
49  }
50 
51  return 0;
52 }
53 
55 {
/*
 * Signal ctx->sync_ctx.fence on the command queue with the next fence value
 * and then block in d3d12va_fence_completion() until that value is reached.
 * NOTE(review): DX_CHECK is defined elsewhere; it presumably jumps to the
 * fail label when the wrapped call fails - confirm against its definition.
 */
57 
58  DX_CHECK(ID3D12CommandQueue_Signal(ctx->command_queue, ctx->sync_ctx.fence, ++ctx->sync_ctx.fence_value));
59  return d3d12va_fence_completion(&ctx->sync_ctx);
60 
61 fail:
62  return AVERROR(EINVAL);
63 }
64 
/* Element type stored in ctx->allocator_queue: an allocator plus the fence
 * value that gates its reuse. */
65 typedef struct CommandAllocator {
/* Allocator that was handed back after a submission. */
66  ID3D12CommandAllocator *command_allocator;
/* Encoder fence value that must be completed before the allocator is reused. */
67  uint64_t fence_value;
69 
/*
 * Obtain a command allocator for recording a new encode command list.
 *
 * The entry at the front of ctx->allocator_queue is reused when the encoder
 * fence has already reached the value stored with it; otherwise a new
 * allocator of type D3D12_COMMAND_LIST_TYPE_VIDEO_ENCODE is created.
 *
 * ppAllocator receives the allocator. Returns 0 on success and
 * AVERROR(EINVAL) if creating a new allocator fails.
 */
70 static int d3d12va_get_valid_command_allocator(AVCodecContext *avctx, ID3D12CommandAllocator **ppAllocator)
71 {
72  HRESULT hr;
74  CommandAllocator allocator;
75 
/* Only look at the front entry; it is removed from the queue once chosen. */
76  if (av_fifo_peek(ctx->allocator_queue, &allocator, 1, 0) >= 0) {
77  uint64_t completion = ID3D12Fence_GetCompletedValue(ctx->sync_ctx.fence);
78  if (completion >= allocator.fence_value) {
79  *ppAllocator = allocator.command_allocator;
80  av_fifo_read(ctx->allocator_queue, &allocator, 1);
81  return 0;
82  }
83  }
84 
/* Queue empty or front entry still in flight: create a fresh allocator. */
85  hr = ID3D12Device_CreateCommandAllocator(ctx->hwctx->device, D3D12_COMMAND_LIST_TYPE_VIDEO_ENCODE,
86  &IID_ID3D12CommandAllocator, (void **)ppAllocator);
87  if (FAILED(hr)) {
88  av_log(avctx, AV_LOG_ERROR, "Failed to create a new command allocator!\n");
89  return AVERROR(EINVAL);
90  }
91 
92  return 0;
93 }
94 
/*
 * Hand a command allocator back to ctx->allocator_queue together with the
 * fence value that must complete before it may be reused.
 * Always returns 0.
 */
95 static int d3d12va_discard_command_allocator(AVCodecContext *avctx, ID3D12CommandAllocator *pAllocator, uint64_t fence_value)
96 {
98 
99  CommandAllocator allocator = {
100  .command_allocator = pAllocator,
101  .fence_value = fence_value,
102  };
103 
/* NOTE(review): the result of av_fifo_write() is not checked; if the write
 * can fail here the allocator would be lost - confirm the queue's sizing. */
104  av_fifo_write(ctx->allocator_queue, &allocator, 1);
105 
106  return 0;
107 }
108 
111 {
/*
 * Block until the GPU work issued for pic has finished.
 *
 * The picture must already have been issued (asserted). A picture that was
 * waited for before returns immediately. On success the input image is
 * freed and the picture is marked encode_complete.
 * Returns 0 on success, AVERROR(EINVAL) if the fence event cannot be set.
 */
113  FFHWBaseEncodePicture *base_pic = &pic->base;
114  uint64_t completion;
115 
116  av_assert0(base_pic->encode_issued);
117 
118  if (base_pic->encode_complete) {
119  // Already waited for this picture.
120  return 0;
121  }
122 
/* pic->fence_value is the encoder fence value recorded for this picture. */
123  completion = ID3D12Fence_GetCompletedValue(ctx->sync_ctx.fence);
124  if (completion < pic->fence_value) {
125  if (FAILED(ID3D12Fence_SetEventOnCompletion(ctx->sync_ctx.fence, pic->fence_value,
126  ctx->sync_ctx.event)))
127  return AVERROR(EINVAL);
128 
129  WaitForSingleObjectEx(ctx->sync_ctx.event, INFINITE, FALSE);
130  }
131 
132  av_log(avctx, AV_LOG_DEBUG, "Sync to pic %"PRId64"/%"PRId64" "
133  "(input surface %p).\n", base_pic->display_order,
134  base_pic->encode_order, pic->input_surface->texture);
135 
/* The input frame is no longer needed once the wait is over. */
136  av_frame_free(&base_pic->input_image);
137 
138  base_pic->encode_complete = 1;
139  return 0;
140 }
141 
144 {
/*
 * Create the two per-picture metadata buffers:
 *  - pic->encoded_metadata: default-heap buffer of
 *    ctx->req.MaxEncoderOutputMetadataBufferSize bytes;
 *  - pic->resolved_metadata: buffer using the heap properties reported for
 *    D3D12_HEAP_TYPE_READBACK, sized for one output metadata header plus one
 *    subregion metadata entry.
 * Returns 0 on success, AVERROR_UNKNOWN if either resource creation fails.
 */
146  int width = sizeof(D3D12_VIDEO_ENCODER_OUTPUT_METADATA) + sizeof(D3D12_VIDEO_ENCODER_FRAME_SUBREGION_METADATA);
147  D3D12_HEAP_PROPERTIES encoded_meta_props = { .Type = D3D12_HEAP_TYPE_DEFAULT }, resolved_meta_props;
148  D3D12_HEAP_TYPE resolved_heap_type = D3D12_HEAP_TYPE_READBACK;
149  HRESULT hr;
150 
151  D3D12_RESOURCE_DESC meta_desc = {
152  .Dimension = D3D12_RESOURCE_DIMENSION_BUFFER,
153  .Alignment = 0,
154  .Width = ctx->req.MaxEncoderOutputMetadataBufferSize,
155  .Height = 1,
156  .DepthOrArraySize = 1,
157  .MipLevels = 1,
158  .Format = DXGI_FORMAT_UNKNOWN,
159  .SampleDesc = { .Count = 1, .Quality = 0 },
160  .Layout = D3D12_TEXTURE_LAYOUT_ROW_MAJOR,
161  .Flags = D3D12_RESOURCE_FLAG_NONE,
162  };
163 
164  hr = ID3D12Device_CreateCommittedResource(ctx->hwctx->device, &encoded_meta_props, D3D12_HEAP_FLAG_NONE,
165  &meta_desc, D3D12_RESOURCE_STATE_COMMON, NULL,
166  &IID_ID3D12Resource, (void **)&pic->encoded_metadata);
167  if (FAILED(hr)) {
168  av_log(avctx, AV_LOG_ERROR, "Failed to create metadata buffer.\n");
169  return AVERROR_UNKNOWN;
170  }
171 
172  ctx->hwctx->device->lpVtbl->GetCustomHeapProperties(ctx->hwctx->device, &resolved_meta_props, 0, resolved_heap_type);
173 
/* Same descriptor is reused for the second buffer; only the width changes. */
174  meta_desc.Width = width;
175 
176  hr = ID3D12Device_CreateCommittedResource(ctx->hwctx->device, &resolved_meta_props, D3D12_HEAP_FLAG_NONE,
177  &meta_desc, D3D12_RESOURCE_STATE_COMMON, NULL,
178  &IID_ID3D12Resource, (void **)&pic->resolved_metadata);
179 
/* NOTE(review): pic->encoded_metadata is not released on this path; the
 * caller presumably cleans it up - confirm. */
180  if (FAILED(hr)) {
181  av_log(avctx, AV_LOG_ERROR, "Failed to create output metadata buffer.\n");
182  return AVERROR_UNKNOWN;
183  }
184 
185  return 0;
186 }
187 
189  const FFHWBaseEncodePicture *base_pic)
190 {
/*
 * Record and submit the GPU commands that encode one picture.
 *
 * In order: allocate the reconstructed surface, output buffer and metadata
 * buffers; let the codec fill its picture parameters; for IDR pictures write
 * the sequence header at the start of the output buffer; collect the
 * reference textures; record barriers, EncodeFrame and
 * ResolveEncoderOutputMetadata into the command list; submit it and signal
 * both the input surface fence and the encoder fence. The encoder fence
 * value is stored in pic->fence_value.
 *
 * Returns 0 on success or a negative AVERROR code; on failure the fail label
 * releases what was acquired here.
 */
191  FFHWBaseEncodeContext *base_ctx = avctx->priv_data;
193  AVD3D12VAFramesContext *frames_hwctx = base_ctx->input_frames->hwctx;
194  D3D12VAEncodePicture *pic = (D3D12VAEncodePicture *)base_pic;
195  int err, i, j;
196  HRESULT hr;
198  void *ptr;
199  size_t bit_len;
200  ID3D12CommandAllocator *command_allocator = NULL;
201  ID3D12VideoEncodeCommandList2 *cmd_list = ctx->command_list;
202  D3D12_RESOURCE_BARRIER barriers[32] = { 0 };
203  D3D12_VIDEO_ENCODE_REFERENCE_FRAMES d3d12_refs = { 0 };
204 
205  D3D12_VIDEO_ENCODER_ENCODEFRAME_INPUT_ARGUMENTS input_args = {
206  .SequenceControlDesc = {
207  .Flags = D3D12_VIDEO_ENCODER_SEQUENCE_CONTROL_FLAG_NONE,
208  .IntraRefreshConfig = { 0 },
209  .RateControl = ctx->rc,
210  .PictureTargetResolution = ctx->resolution,
211  .SelectedLayoutMode = D3D12_VIDEO_ENCODER_FRAME_SUBREGION_LAYOUT_MODE_FULL_FRAME,
212  .FrameSubregionsLayoutData = { 0 },
213  .CodecGopSequence = ctx->gop,
214  },
215  .pInputFrame = pic->input_surface->texture,
216  .InputFrameSubresource = 0,
217  };
218 
219  D3D12_VIDEO_ENCODER_ENCODEFRAME_OUTPUT_ARGUMENTS output_args = { 0 };
220 
221  D3D12_VIDEO_ENCODER_RESOLVE_METADATA_INPUT_ARGUMENTS input_metadata = {
222  .EncoderCodec = ctx->codec->d3d12_codec,
223  .EncoderProfile = ctx->profile->d3d12_profile,
224  .EncoderInputFormat = frames_hwctx->format,
225  .EncodedPictureEffectiveResolution = ctx->resolution,
226  };
227 
228  D3D12_VIDEO_ENCODER_RESOLVE_METADATA_OUTPUT_ARGUMENTS output_metadata = { 0 };
229 
230  memset(data, 0, sizeof(data));
231 
232  av_log(avctx, AV_LOG_DEBUG, "Issuing encode for pic %"PRId64"/%"PRId64" "
233  "as type %s.\n", base_pic->display_order, base_pic->encode_order,
235  if (base_pic->nb_refs[0] == 0 && base_pic->nb_refs[1] == 0) {
236  av_log(avctx, AV_LOG_DEBUG, "No reference pictures.\n");
237  } else {
238  av_log(avctx, AV_LOG_DEBUG, "L0 refers to");
239  for (i = 0; i < base_pic->nb_refs[0]; i++) {
240  av_log(avctx, AV_LOG_DEBUG, " %"PRId64"/%"PRId64,
241  base_pic->refs[0][i]->display_order, base_pic->refs[0][i]->encode_order);
242  }
243  av_log(avctx, AV_LOG_DEBUG, ".\n");
244 
245  if (base_pic->nb_refs[1]) {
246  av_log(avctx, AV_LOG_DEBUG, "L1 refers to");
247  for (i = 0; i < base_pic->nb_refs[1]; i++) {
248  av_log(avctx, AV_LOG_DEBUG, " %"PRId64"/%"PRId64,
249  base_pic->refs[1][i]->display_order, base_pic->refs[1][i]->encode_order);
250  }
251  av_log(avctx, AV_LOG_DEBUG, ".\n");
252  }
253  }
254 
/* A picture is issued once, and only after all of its references. */
255  av_assert0(!base_pic->encode_issued);
256  for (i = 0; i < base_pic->nb_refs[0]; i++) {
257  av_assert0(base_pic->refs[0][i]);
258  av_assert0(base_pic->refs[0][i]->encode_issued);
259  }
260  for (i = 0; i < base_pic->nb_refs[1]; i++) {
261  av_assert0(base_pic->refs[1][i]);
262  av_assert0(base_pic->refs[1][i]->encode_issued);
263  }
264 
265  av_log(avctx, AV_LOG_DEBUG, "Input surface is %p.\n", pic->input_surface->texture);
266 
/* NOTE(review): any error from av_hwframe_get_buffer() is replaced by
 * ENOMEM below, so the original cause is not reported. */
267  err = av_hwframe_get_buffer(base_ctx->recon_frames_ref, base_pic->recon_image, 0);
268  if (err < 0) {
269  err = AVERROR(ENOMEM);
270  goto fail;
271  }
272 
273  pic->recon_surface = (AVD3D12VAFrame *)base_pic->recon_image->data[0];
274  av_log(avctx, AV_LOG_DEBUG, "Recon surface is %p.\n",
275  pic->recon_surface->texture);
276 
277  pic->output_buffer_ref = av_buffer_pool_get(ctx->output_buffer_pool);
278  if (!pic->output_buffer_ref) {
279  err = AVERROR(ENOMEM);
280  goto fail;
281  }
282  pic->output_buffer = (ID3D12Resource *)pic->output_buffer_ref->data;
283  av_log(avctx, AV_LOG_DEBUG, "Output buffer is %p.\n",
284  pic->output_buffer);
285 
286  err = d3d12va_encode_create_metadata_buffers(avctx, pic);
287  if (err < 0)
288  goto fail;
289 
290  if (ctx->codec->init_picture_params) {
291  err = ctx->codec->init_picture_params(avctx, pic);
292  if (err < 0) {
293  av_log(avctx, AV_LOG_ERROR, "Failed to initialise picture "
294  "parameters: %d.\n", err);
295  goto fail;
296  }
297  }
298 
/* IDR pictures carry the sequence header in front of the frame data. */
299  if (base_pic->type == FF_HW_PICTURE_TYPE_IDR) {
300  if (ctx->codec->write_sequence_header) {
301  bit_len = 8 * sizeof(data);
302  err = ctx->codec->write_sequence_header(avctx, data, &bit_len);
303  if (err < 0) {
304  av_log(avctx, AV_LOG_ERROR, "Failed to write per-sequence "
305  "header: %d.\n", err);
306  goto fail;
307  }
308  }
309 
/* NOTE(review): bit_len is only assigned inside the branch above; when the
 * codec has no write_sequence_header callback it is read uninitialised. */
310  pic->header_size = (int)bit_len / 8;
/* Round the header size up to the bitstream buffer access alignment. */
311  pic->header_size = pic->header_size % ctx->req.CompressedBitstreamBufferAccessAlignment ?
312  FFALIGN(pic->header_size, ctx->req.CompressedBitstreamBufferAccessAlignment) :
313  pic->header_size;
314 
315  hr = ID3D12Resource_Map(pic->output_buffer, 0, NULL, (void **)&ptr);
316  if (FAILED(hr)) {
317  err = AVERROR_UNKNOWN;
318  goto fail;
319  }
320 
/* NOTE(review): the aligned header_size is used as the copy length from
 * data; confirm it cannot exceed sizeof(data). */
321  memcpy(ptr, data, pic->header_size);
322  ID3D12Resource_Unmap(pic->output_buffer, 0, NULL);
323  }
324 
/* Gather the reconstructed textures of all L0 then L1 references. */
325  d3d12_refs.NumTexture2Ds = base_pic->nb_refs[0] + base_pic->nb_refs[1];
326  if (d3d12_refs.NumTexture2Ds) {
327  d3d12_refs.ppTexture2Ds = av_calloc(d3d12_refs.NumTexture2Ds,
328  sizeof(*d3d12_refs.ppTexture2Ds));
329  if (!d3d12_refs.ppTexture2Ds) {
330  err = AVERROR(ENOMEM);
331  goto fail;
332  }
333 
334  i = 0;
335  for (j = 0; j < base_pic->nb_refs[0]; j++)
336  d3d12_refs.ppTexture2Ds[i++] = ((D3D12VAEncodePicture *)base_pic->refs[0][j])->recon_surface->texture;
337  for (j = 0; j < base_pic->nb_refs[1]; j++)
338  d3d12_refs.ppTexture2Ds[i++] = ((D3D12VAEncodePicture *)base_pic->refs[1][j])->recon_surface->texture;
339  }
340 
341  input_args.PictureControlDesc.IntraRefreshFrameIndex = 0;
342  if (base_pic->is_reference)
343  input_args.PictureControlDesc.Flags |= D3D12_VIDEO_ENCODER_PICTURE_CONTROL_FLAG_USED_AS_REFERENCE_PICTURE;
344 
345  input_args.PictureControlDesc.PictureControlCodecData = pic->pic_ctl;
346  input_args.PictureControlDesc.ReferenceFrames = d3d12_refs;
347  input_args.CurrentFrameBitstreamMetadataSize = pic->header_size;
348 
/* Frame data is written after the header bytes already in the buffer. */
349  output_args.Bitstream.pBuffer = pic->output_buffer;
350  output_args.Bitstream.FrameStartOffset = pic->header_size;
351  output_args.ReconstructedPicture.pReconstructedPicture = pic->recon_surface->texture;
352  output_args.ReconstructedPicture.ReconstructedPictureSubresource = 0;
353  output_args.EncoderOutputMetadata.pBuffer = pic->encoded_metadata;
354  output_args.EncoderOutputMetadata.Offset = 0;
355 
356  input_metadata.HWLayoutMetadata.pBuffer = pic->encoded_metadata;
357  input_metadata.HWLayoutMetadata.Offset = 0;
358 
359  output_metadata.ResolvedLayoutMetadata.pBuffer = pic->resolved_metadata;
360  output_metadata.ResolvedLayoutMetadata.Offset = 0;
361 
/* Reset an allocator and the command list before recording. */
362  err = d3d12va_get_valid_command_allocator(avctx, &command_allocator);
363  if (err < 0)
364  goto fail;
365 
366  hr = ID3D12CommandAllocator_Reset(command_allocator);
367  if (FAILED(hr)) {
368  err = AVERROR_UNKNOWN;
369  goto fail;
370  }
371 
372  hr = ID3D12VideoEncodeCommandList2_Reset(cmd_list, command_allocator);
373  if (FAILED(hr)) {
374  err = AVERROR_UNKNOWN;
375  goto fail;
376  }
377 
378 #define TRANSITION_BARRIER(res, before, after) \
379  (D3D12_RESOURCE_BARRIER) { \
380  .Type = D3D12_RESOURCE_BARRIER_TYPE_TRANSITION, \
381  .Flags = D3D12_RESOURCE_BARRIER_FLAG_NONE, \
382  .Transition = { \
383  .pResource = res, \
384  .Subresource = D3D12_RESOURCE_BARRIER_ALL_SUBRESOURCES, \
385  .StateBefore = before, \
386  .StateAfter = after, \
387  }, \
388  }
389 
/* Move every resource from COMMON into the state the encode needs. */
390  barriers[0] = TRANSITION_BARRIER(pic->input_surface->texture,
391  D3D12_RESOURCE_STATE_COMMON,
392  D3D12_RESOURCE_STATE_VIDEO_ENCODE_READ);
393  barriers[1] = TRANSITION_BARRIER(pic->output_buffer,
394  D3D12_RESOURCE_STATE_COMMON,
395  D3D12_RESOURCE_STATE_VIDEO_ENCODE_WRITE);
396  barriers[2] = TRANSITION_BARRIER(pic->recon_surface->texture,
397  D3D12_RESOURCE_STATE_COMMON,
398  D3D12_RESOURCE_STATE_VIDEO_ENCODE_WRITE);
399  barriers[3] = TRANSITION_BARRIER(pic->encoded_metadata,
400  D3D12_RESOURCE_STATE_COMMON,
401  D3D12_RESOURCE_STATE_VIDEO_ENCODE_WRITE);
402  barriers[4] = TRANSITION_BARRIER(pic->resolved_metadata,
403  D3D12_RESOURCE_STATE_COMMON,
404  D3D12_RESOURCE_STATE_VIDEO_ENCODE_WRITE);
405 
406  ID3D12VideoEncodeCommandList2_ResourceBarrier(cmd_list, 5, barriers);
407 
/* NOTE(review): refs_barriers has 3 entries but is indexed up to
 * NumTexture2Ds (nb_refs[0] + nb_refs[1]); confirm that sum is capped at 3,
 * otherwise this writes past the array. Same applies to the second use below. */
408  if (d3d12_refs.NumTexture2Ds) {
409  D3D12_RESOURCE_BARRIER refs_barriers[3];
410 
411  for (i = 0; i < d3d12_refs.NumTexture2Ds; i++)
412  refs_barriers[i] = TRANSITION_BARRIER(d3d12_refs.ppTexture2Ds[i],
413  D3D12_RESOURCE_STATE_COMMON,
414  D3D12_RESOURCE_STATE_VIDEO_ENCODE_READ);
415 
416  ID3D12VideoEncodeCommandList2_ResourceBarrier(cmd_list, d3d12_refs.NumTexture2Ds,
417  refs_barriers);
418  }
419 
420  ID3D12VideoEncodeCommandList2_EncodeFrame(cmd_list, ctx->encoder, ctx->encoder_heap,
421  &input_args, &output_args);
422 
/* The raw metadata is read by the resolve step, so flip it to READ first. */
423  barriers[3] = TRANSITION_BARRIER(pic->encoded_metadata,
424  D3D12_RESOURCE_STATE_VIDEO_ENCODE_WRITE,
425  D3D12_RESOURCE_STATE_VIDEO_ENCODE_READ);
426 
427  ID3D12VideoEncodeCommandList2_ResourceBarrier(cmd_list, 1, &barriers[3]);
428 
429  ID3D12VideoEncodeCommandList2_ResolveEncoderOutputMetadata(cmd_list, &input_metadata, &output_metadata);
430 
431  if (d3d12_refs.NumTexture2Ds) {
432  D3D12_RESOURCE_BARRIER refs_barriers[3];
433 
434  for (i = 0; i < d3d12_refs.NumTexture2Ds; i++)
435  refs_barriers[i] = TRANSITION_BARRIER(d3d12_refs.ppTexture2Ds[i],
436  D3D12_RESOURCE_STATE_VIDEO_ENCODE_READ,
437  D3D12_RESOURCE_STATE_COMMON);
438 
439  ID3D12VideoEncodeCommandList2_ResourceBarrier(cmd_list, d3d12_refs.NumTexture2Ds,
440  refs_barriers);
441  }
442 
/* Return every resource to COMMON before the list is closed. */
443  barriers[0] = TRANSITION_BARRIER(pic->input_surface->texture,
444  D3D12_RESOURCE_STATE_VIDEO_ENCODE_READ,
445  D3D12_RESOURCE_STATE_COMMON);
446  barriers[1] = TRANSITION_BARRIER(pic->output_buffer,
447  D3D12_RESOURCE_STATE_VIDEO_ENCODE_WRITE,
448  D3D12_RESOURCE_STATE_COMMON);
449  barriers[2] = TRANSITION_BARRIER(pic->recon_surface->texture,
450  D3D12_RESOURCE_STATE_VIDEO_ENCODE_WRITE,
451  D3D12_RESOURCE_STATE_COMMON);
452  barriers[3] = TRANSITION_BARRIER(pic->encoded_metadata,
453  D3D12_RESOURCE_STATE_VIDEO_ENCODE_READ,
454  D3D12_RESOURCE_STATE_COMMON);
455  barriers[4] = TRANSITION_BARRIER(pic->resolved_metadata,
456  D3D12_RESOURCE_STATE_VIDEO_ENCODE_WRITE,
457  D3D12_RESOURCE_STATE_COMMON);
458 
459  ID3D12VideoEncodeCommandList2_ResourceBarrier(cmd_list, 5, barriers);
460 
461  hr = ID3D12VideoEncodeCommandList2_Close(cmd_list);
462  if (FAILED(hr)) {
463  err = AVERROR_UNKNOWN;
464  goto fail;
465  }
466 
467  hr = ID3D12CommandQueue_Wait(ctx->command_queue, pic->input_surface->sync_ctx.fence,
469  if (FAILED(hr)) {
470  err = AVERROR_UNKNOWN;
471  goto fail;
472  }
473 
474  ID3D12CommandQueue_ExecuteCommandLists(ctx->command_queue, 1, (ID3D12CommandList **)&ctx->command_list);
475 
476  hr = ID3D12CommandQueue_Signal(ctx->command_queue, pic->input_surface->sync_ctx.fence,
478  if (FAILED(hr)) {
479  err = AVERROR_UNKNOWN;
480  goto fail;
481  }
482 
/* The encoder's own fence marks completion of this picture. */
483  hr = ID3D12CommandQueue_Signal(ctx->command_queue, ctx->sync_ctx.fence, ++ctx->sync_ctx.fence_value);
484  if (FAILED(hr)) {
485  err = AVERROR_UNKNOWN;
486  goto fail;
487  }
488 
/* Queue the allocator for reuse once this fence value has completed. */
489  err = d3d12va_discard_command_allocator(avctx, command_allocator, ctx->sync_ctx.fence_value);
490  if (err < 0)
491  goto fail;
492 
493  pic->fence_value = ctx->sync_ctx.fence_value;
494 
495  if (d3d12_refs.ppTexture2Ds)
496  av_freep(&d3d12_refs.ppTexture2Ds);
497 
498  return 0;
499 
/* Error path: give back the allocator and drop per-picture resources. */
500 fail:
501  if (command_allocator)
502  d3d12va_discard_command_allocator(avctx, command_allocator, ctx->sync_ctx.fence_value);
503 
504  if (d3d12_refs.ppTexture2Ds)
505  av_freep(&d3d12_refs.ppTexture2Ds);
506 
507  if (ctx->codec->free_picture_params)
508  ctx->codec->free_picture_params(pic);
509 
511  pic->output_buffer = NULL;
514  return err;
515 }
516 
519 {
/*
 * Drop the output of a picture whose result is not going to be read.
 * Waits for the picture first, then clears its output buffer pointer when an
 * output buffer reference is still held. Always returns 0; the result of the
 * wait is not checked.
 */
520  FFHWBaseEncodePicture *base_pic = &pic->base;
521  d3d12va_encode_wait(avctx, pic);
522 
523  if (pic->output_buffer_ref) {
524  av_log(avctx, AV_LOG_DEBUG, "Discard output for pic "
525  "%"PRId64"/%"PRId64".\n",
526  base_pic->display_order, base_pic->encode_order);
527 
529  pic->output_buffer = NULL;
530  }
531 
534 
535  return 0;
536 }
537 
539 {
/*
 * Free the rate-control configuration attached to ctx->rc.
 * The configuration pointers share one union, so the member matching
 * ctx->rc.Mode is the one released (and set to NULL by av_freep).
 * Always returns 0.
 */
541 
542  switch (ctx->rc.Mode)
543  {
544  case D3D12_VIDEO_ENCODER_RATE_CONTROL_MODE_CQP:
545  av_freep(&ctx->rc.ConfigParams.pConfiguration_CQP);
546  break;
547  case D3D12_VIDEO_ENCODER_RATE_CONTROL_MODE_CBR:
548  av_freep(&ctx->rc.ConfigParams.pConfiguration_CBR);
549  break;
550  case D3D12_VIDEO_ENCODER_RATE_CONTROL_MODE_VBR:
551  av_freep(&ctx->rc.ConfigParams.pConfiguration_VBR);
552  break;
553  case D3D12_VIDEO_ENCODER_RATE_CONTROL_MODE_QVBR:
554  av_freep(&ctx->rc.ConfigParams.pConfiguration_QVBR);
555  break;
556  default:
557  break;
558  }
559 
560  return 0;
561 }
562 
564  const AVFrame *frame)
565 {
/*
 * Allocate a zeroed encode picture for the given input frame.
 * Codec-private data of ctx->codec->picture_priv_data_size bytes is attached
 * when that size is positive, and frame->data[0] is taken as the input
 * surface. Returns the embedded base picture, or NULL if an allocation fails.
 */
568 
569  pic = av_mallocz(sizeof(*pic));
570  if (!pic)
571  return NULL;
572 
573  if (ctx->codec->picture_priv_data_size > 0) {
574  pic->base.priv_data = av_mallocz(ctx->codec->picture_priv_data_size);
575  if (!pic->base.priv_data) {
/* Undo the picture allocation so nothing leaks on failure. */
576  av_freep(&pic);
577  return NULL;
578  }
579  }
580 
581  pic->input_surface = (AVD3D12VAFrame *)frame->data[0];
582 
583  return &pic->base;
584 }
585 
587  FFHWBaseEncodePicture *base_pic)
588 {
/*
 * Destroy an encode picture.
 * A picture that was already issued is discarded first (which waits for it),
 * then the codec's picture parameters, the base picture state and the
 * picture itself are freed. Always returns 0.
 */
590  D3D12VAEncodePicture *pic = (D3D12VAEncodePicture *)base_pic;
591 
592  if (base_pic->encode_issued)
593  d3d12va_encode_discard(avctx, pic);
594 
595  if (ctx->codec->free_picture_params)
596  ctx->codec->free_picture_params(pic);
597 
598  ff_hw_base_encode_free(base_pic);
599 
600  av_free(pic);
601 
602  return 0;
603 }
604 
606  D3D12VAEncodePicture *pic, size_t *size)
607 {
608  D3D12_VIDEO_ENCODER_OUTPUT_METADATA *meta = NULL;
609  uint8_t *data;
610  HRESULT hr;
611  int err;
612 
613  hr = ID3D12Resource_Map(pic->resolved_metadata, 0, NULL, (void **)&data);
614  if (FAILED(hr)) {
615  err = AVERROR_UNKNOWN;
616  return err;
617  }
618 
619  meta = (D3D12_VIDEO_ENCODER_OUTPUT_METADATA *)data;
620 
621  if (meta->EncodeErrorFlags != D3D12_VIDEO_ENCODER_ENCODE_ERROR_FLAG_NO_ERROR) {
622  av_log(avctx, AV_LOG_ERROR, "Encode failed %"PRIu64"\n", meta->EncodeErrorFlags);
623  err = AVERROR(EINVAL);
624  return err;
625  }
626 
627  if (meta->EncodedBitstreamWrittenBytesCount == 0) {
628  av_log(avctx, AV_LOG_ERROR, "No bytes were written to encoded bitstream\n");
629  err = AVERROR(EINVAL);
630  return err;
631  }
632 
633  *size = meta->EncodedBitstreamWrittenBytesCount;
634 
635  ID3D12Resource_Unmap(pic->resolved_metadata, 0, NULL);
636 
637  return 0;
638 }
639 
642 {
643  int err;
644  uint8_t *ptr, *mapped_data;
645  size_t total_size = 0;
646  HRESULT hr;
647 
648  err = d3d12va_encode_get_buffer_size(avctx, pic, &total_size);
649  if (err < 0)
650  goto end;
651 
652  total_size += pic->header_size;
653  av_log(avctx, AV_LOG_DEBUG, "Output buffer size %"PRId64"\n", total_size);
654 
655  hr = ID3D12Resource_Map(pic->output_buffer, 0, NULL, (void **)&mapped_data);
656  if (FAILED(hr)) {
657  err = AVERROR_UNKNOWN;
658  goto end;
659  }
660 
661  err = ff_get_encode_buffer(avctx, pkt, total_size, 0);
662  if (err < 0)
663  goto end;
664  ptr = pkt->data;
665 
666  memcpy(ptr, mapped_data, total_size);
667 
668  ID3D12Resource_Unmap(pic->output_buffer, 0, NULL);
669 
670 end:
672  pic->output_buffer = NULL;
673  return err;
674 }
675 
677  const FFHWBaseEncodePicture *base_pic, AVPacket *pkt)
678 {
/*
 * Produce the output packet for a picture: wait for its encode to finish,
 * then copy the coded data into pkt.
 * Returns 0 on success or the negative error code of the failing step.
 */
679  FFHWBaseEncodeContext *base_ctx = avctx->priv_data;
680  D3D12VAEncodePicture *pic = (D3D12VAEncodePicture *)base_pic;
681  AVPacket *pkt_ptr = pkt;
682  int err;
683 
684  err = d3d12va_encode_wait(avctx, pic);
685  if (err < 0)
686  return err;
687 
688  err = d3d12va_encode_get_coded_data(avctx, pic, pkt);
689  if (err < 0)
690  return err;
691 
692  av_log(avctx, AV_LOG_DEBUG, "Output read for pic %"PRId64"/%"PRId64".\n",
693  base_pic->display_order, base_pic->encode_order);
694 
696  pkt_ptr, 0);
697 
698  return 0;
699 }
700 
702 {
/*
 * Choose the encoding profile that matches the input pixel format.
 *
 * All components of the input format must share one bit depth. The first
 * entry of ctx->codec->profiles whose depth, component count and chroma
 * subsampling match, and which agrees with avctx->profile when the user set
 * one, is stored in ctx->profile and written back to avctx->profile.
 *
 * Returns 0 on success, AVERROR(EINVAL) for an unusable pixel format and
 * AVERROR(ENOSYS) when no profile matches.
 */
703  FFHWBaseEncodeContext *base_ctx = avctx->priv_data;
706  const AVPixFmtDescriptor *desc;
707  int i, depth;
708 
710  if (!desc) {
711  av_log(avctx, AV_LOG_ERROR, "Invalid input pixfmt (%d).\n",
712  base_ctx->input_frames->sw_format);
713  return AVERROR(EINVAL);
714  }
715 
/* Reject formats whose components have differing bit depths. */
716  depth = desc->comp[0].depth;
717  for (i = 1; i < desc->nb_components; i++) {
718  if (desc->comp[i].depth != depth) {
719  av_log(avctx, AV_LOG_ERROR, "Invalid input pixfmt (%s).\n",
720  desc->name);
721  return AVERROR(EINVAL);
722  }
723  }
724  av_log(avctx, AV_LOG_VERBOSE, "Input surface format is %s.\n",
725  desc->name);
726 
/* The profile list is terminated by an AV_PROFILE_UNKNOWN entry. */
727  av_assert0(ctx->codec->profiles);
728  for (i = 0; (ctx->codec->profiles[i].av_profile !=
729  AV_PROFILE_UNKNOWN); i++) {
730  profile = &ctx->codec->profiles[i];
731  if (depth != profile->depth ||
732  desc->nb_components != profile->nb_components)
733  continue;
/* Chroma subsampling only matters when there is more than one component. */
734  if (desc->nb_components > 1 &&
735  (desc->log2_chroma_w != profile->log2_chroma_w ||
736  desc->log2_chroma_h != profile->log2_chroma_h))
737  continue;
/* An explicitly requested profile must match exactly. */
738  if (avctx->profile != profile->av_profile &&
739  avctx->profile != AV_PROFILE_UNKNOWN)
740  continue;
741 
742  ctx->profile = profile;
743  break;
744  }
745  if (!ctx->profile) {
746  av_log(avctx, AV_LOG_ERROR, "No usable encoding profile found.\n");
747  return AVERROR(ENOSYS);
748  }
749 
750  avctx->profile = profile->av_profile;
751  return 0;
752 }
753 
755  // Bitrate Quality
756  // | Maxrate | HRD/VBV
/* Rows are looked up by RC mode index; the four flag columns state which
 * settings a mode uses, followed by the matching D3D12 mode value.
 * The first row is zeroed and has no D3D12 mode. */
757  { 0 }, // | | | |
758  { RC_MODE_CQP, "CQP", 0, 0, 1, 0, D3D12_VIDEO_ENCODER_RATE_CONTROL_MODE_CQP },
759  { RC_MODE_CBR, "CBR", 1, 0, 0, 1, D3D12_VIDEO_ENCODER_RATE_CONTROL_MODE_CBR },
760  { RC_MODE_VBR, "VBR", 1, 1, 0, 1, D3D12_VIDEO_ENCODER_RATE_CONTROL_MODE_VBR },
761  { RC_MODE_QVBR, "QVBR", 1, 1, 1, 1, D3D12_VIDEO_ENCODER_RATE_CONTROL_MODE_QVBR },
762 };
763 
765 {
/*
 * Ask the driver whether it supports the given rate-control mode for the
 * current codec.
 * Returns the driver's IsSupported answer; returns 0 when the table entry
 * has no D3D12 mode or when the feature query itself fails.
 */
766  HRESULT hr;
768  D3D12_FEATURE_DATA_VIDEO_ENCODER_RATE_CONTROL_MODE d3d12_rc_mode = {
769  .Codec = ctx->codec->d3d12_codec,
770  };
771 
772  if (!rc_mode->d3d12_mode)
773  return 0;
774 
775  d3d12_rc_mode.IsSupported = 0;
776  d3d12_rc_mode.RateControlMode = rc_mode->d3d12_mode;
777 
778  hr = ID3D12VideoDevice3_CheckFeatureSupport(ctx->video_device3,
779  D3D12_FEATURE_VIDEO_ENCODER_RATE_CONTROL_MODE,
780  &d3d12_rc_mode, sizeof(d3d12_rc_mode));
781  if (FAILED(hr)) {
/* A failed query is logged and reported as "not supported". */
782  av_log(avctx, AV_LOG_ERROR, "Failed to check rate control support.\n");
783  return 0;
784  }
785 
786  return d3d12_rc_mode.IsSupported;
787 }
788 
790 {
/*
 * Select a rate-control mode and fill ctx->rc accordingly.
 *
 * A mode is chosen following the priority list below, each candidate being
 * checked against the driver. The bitrate, quality and HRD buffer values
 * are then derived from the avctx options according to what the chosen mode
 * uses, validated, logged, and written into a newly allocated per-mode
 * configuration structure (CQP is configured later by the codec).
 *
 * Returns 0 on success, AVERROR(EINVAL) for unsupported or inconsistent
 * settings and AVERROR(ENOMEM) if the configuration cannot be allocated.
 */
792  int64_t rc_target_bitrate;
793  int64_t rc_peak_bitrate;
794  int rc_quality;
795  int64_t hrd_buffer_size;
796  int64_t hrd_initial_buffer_fullness;
797  int fr_num, fr_den;
799 
800  // Rate control mode selection:
801  // * If the user has set a mode explicitly with the rc_mode option,
802  // use it and fail if it is not available.
803  // * If an explicit QP option has been set, use CQP.
804  // * If the codec is CQ-only, use CQP.
805  // * If the QSCALE avcodec option is set, use CQP.
806  // * If bitrate and quality are both set, try QVBR.
807  // * If quality is set, try CQP.
808  // * If bitrate and maxrate are set and have the same value, try CBR.
809  // * If a bitrate is set, try VBR, then CBR.
810  // * If no bitrate is set, try CQP.
811 
/* TRY_RC_MODE jumps to rc_mode_found on success; when "fail" is set an
 * unsupported mode returns an error instead of trying the next one. */
812 #define TRY_RC_MODE(mode, fail) do { \
813  rc_mode = &d3d12va_encode_rc_modes[mode]; \
814  if (!(rc_mode->d3d12_mode && check_rate_control_support(avctx, rc_mode))) { \
815  if (fail) { \
816  av_log(avctx, AV_LOG_ERROR, "Driver does not support %s " \
817  "RC mode.\n", rc_mode->name); \
818  return AVERROR(EINVAL); \
819  } \
820  av_log(avctx, AV_LOG_DEBUG, "Driver does not support %s " \
821  "RC mode.\n", rc_mode->name); \
822  rc_mode = NULL; \
823  } else { \
824  goto rc_mode_found; \
825  } \
826  } while (0)
827 
828  if (ctx->explicit_rc_mode)
829  TRY_RC_MODE(ctx->explicit_rc_mode, 1);
830 
831  if (ctx->explicit_qp)
833 
836 
837  if (avctx->flags & AV_CODEC_FLAG_QSCALE)
839 
840  if (avctx->bit_rate > 0 && avctx->global_quality > 0)
842 
843  if (avctx->global_quality > 0) {
845  }
846 
847  if (avctx->bit_rate > 0 && avctx->rc_max_rate == avctx->bit_rate)
849 
850  if (avctx->bit_rate > 0) {
853  } else {
855  }
856 
857  av_log(avctx, AV_LOG_ERROR, "Driver does not support any "
858  "RC mode compatible with selected options.\n");
859  return AVERROR(EINVAL);
860 
861 rc_mode_found:
/* Target and peak bitrate, only for modes that use a bitrate. */
862  if (rc_mode->bitrate) {
863  if (avctx->bit_rate <= 0) {
864  av_log(avctx, AV_LOG_ERROR, "Bitrate must be set for %s "
865  "RC mode.\n", rc_mode->name);
866  return AVERROR(EINVAL);
867  }
868 
869  if (rc_mode->maxrate) {
870  if (avctx->rc_max_rate > 0) {
871  if (avctx->rc_max_rate < avctx->bit_rate) {
872  av_log(avctx, AV_LOG_ERROR, "Invalid bitrate settings: "
873  "bitrate (%"PRId64") must not be greater than "
874  "maxrate (%"PRId64").\n", avctx->bit_rate,
875  avctx->rc_max_rate);
876  return AVERROR(EINVAL);
877  }
878  rc_target_bitrate = avctx->bit_rate;
879  rc_peak_bitrate = avctx->rc_max_rate;
880  } else {
881  // We only have a target bitrate, but this mode requires
882  // that a maximum rate be supplied as well. Since the
883  // user does not want this to be a constraint, arbitrarily
884  // pick a maximum rate of double the target rate.
885  rc_target_bitrate = avctx->bit_rate;
886  rc_peak_bitrate = 2 * avctx->bit_rate;
887  }
888  } else {
889  if (avctx->rc_max_rate > avctx->bit_rate) {
890  av_log(avctx, AV_LOG_WARNING, "Max bitrate is ignored "
891  "in %s RC mode.\n", rc_mode->name);
892  }
893  rc_target_bitrate = avctx->bit_rate;
894  rc_peak_bitrate = 0;
895  }
896  } else {
897  rc_target_bitrate = 0;
898  rc_peak_bitrate = 0;
899  }
900 
/* Quality: explicit QP first, then global_quality, then the codec default. */
901  if (rc_mode->quality) {
902  if (ctx->explicit_qp) {
903  rc_quality = ctx->explicit_qp;
904  } else if (avctx->global_quality > 0) {
905  if (avctx->flags & AV_CODEC_FLAG_QSCALE)
906  rc_quality = avctx->global_quality / FF_QP2LAMBDA;
907  else
908  rc_quality = avctx->global_quality;
909  } else {
910  rc_quality = ctx->codec->default_quality;
911  av_log(avctx, AV_LOG_WARNING, "No quality level set; "
912  "using default (%d).\n", rc_quality);
913  }
914  } else {
915  rc_quality = 0;
916  }
917 
/* HRD buffer: size falls back to maxrate, then bitrate; the initial
 * fullness defaults to three quarters of the buffer size. */
918  if (rc_mode->hrd) {
919  if (avctx->rc_buffer_size)
920  hrd_buffer_size = avctx->rc_buffer_size;
921  else if (avctx->rc_max_rate > 0)
922  hrd_buffer_size = avctx->rc_max_rate;
923  else
924  hrd_buffer_size = avctx->bit_rate;
925  if (avctx->rc_initial_buffer_occupancy) {
926  if (avctx->rc_initial_buffer_occupancy > hrd_buffer_size) {
927  av_log(avctx, AV_LOG_ERROR, "Invalid RC buffer settings: "
928  "must have initial buffer size (%d) <= "
929  "buffer size (%"PRId64").\n",
930  avctx->rc_initial_buffer_occupancy, hrd_buffer_size);
931  return AVERROR(EINVAL);
932  }
933  hrd_initial_buffer_fullness = avctx->rc_initial_buffer_occupancy;
934  } else {
935  hrd_initial_buffer_fullness = hrd_buffer_size * 3 / 4;
936  }
937  } else {
938  if (avctx->rc_buffer_size || avctx->rc_initial_buffer_occupancy) {
939  av_log(avctx, AV_LOG_WARNING, "Buffering settings are ignored "
940  "in %s RC mode.\n", rc_mode->name);
941  }
942 
943  hrd_buffer_size = 0;
944  hrd_initial_buffer_fullness = 0;
945  }
946 
/* NOTE(review): rc_peak_bitrate is not part of this range check although it
 * is stored into PeakBitRate below - confirm whether that is intended. */
947  if (rc_target_bitrate > UINT32_MAX ||
948  hrd_buffer_size > UINT32_MAX ||
949  hrd_initial_buffer_fullness > UINT32_MAX) {
950  av_log(avctx, AV_LOG_ERROR, "RC parameters of 2^32 or "
951  "greater are not supported by D3D12.\n");
952  return AVERROR(EINVAL);
953  }
954 
955  ctx->rc_quality = rc_quality;
956 
957  av_log(avctx, AV_LOG_VERBOSE, "RC mode: %s.\n", rc_mode->name);
958 
959  if (rc_mode->quality)
960  av_log(avctx, AV_LOG_VERBOSE, "RC quality: %d.\n", rc_quality);
961 
962  if (rc_mode->hrd) {
963  av_log(avctx, AV_LOG_VERBOSE, "RC buffer: %"PRId64" bits, "
964  "initial fullness %"PRId64" bits.\n",
965  hrd_buffer_size, hrd_initial_buffer_fullness);
966  }
967 
/* Frame rate comes from avctx->framerate when set, else from the inverse of
 * the time base; both terms are reduced to at most 65535. */
968  if (avctx->framerate.num > 0 && avctx->framerate.den > 0)
969  av_reduce(&fr_num, &fr_den,
970  avctx->framerate.num, avctx->framerate.den, 65535);
971  else
972  av_reduce(&fr_num, &fr_den,
973  avctx->time_base.den, avctx->time_base.num, 65535);
974 
975  av_log(avctx, AV_LOG_VERBOSE, "RC framerate: %d/%d (%.2f fps).\n",
976  fr_num, fr_den, (double)fr_num / fr_den);
977 
978  ctx->rc.Flags = D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_NONE;
979  ctx->rc.TargetFrameRate.Numerator = fr_num;
980  ctx->rc.TargetFrameRate.Denominator = fr_den;
981  ctx->rc.Mode = rc_mode->d3d12_mode;
982 
/* NOTE(review): the cases below place a declaration directly after a case
 * label, which is only valid C from C23 on; older compilers need a block or
 * an empty statement there. */
983  switch (rc_mode->mode) {
984  case RC_MODE_CQP:
985  // cqp ConfigParams will be updated in ctx->codec->configure.
986  break;
987 
988  case RC_MODE_CBR:
989  D3D12_VIDEO_ENCODER_RATE_CONTROL_CBR *cbr_ctl;
990 
991  ctx->rc.ConfigParams.DataSize = sizeof(D3D12_VIDEO_ENCODER_RATE_CONTROL_CBR);
992  cbr_ctl = av_mallocz(ctx->rc.ConfigParams.DataSize);
993  if (!cbr_ctl)
994  return AVERROR(ENOMEM);
995 
996  cbr_ctl->TargetBitRate = rc_target_bitrate;
997  cbr_ctl->VBVCapacity = hrd_buffer_size;
998  cbr_ctl->InitialVBVFullness = hrd_initial_buffer_fullness;
999  ctx->rc.Flags |= D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_VBV_SIZES;
1000 
/* A QP range is only passed on when the user set qmin or qmax. */
1001  if (avctx->qmin > 0 || avctx->qmax > 0) {
1002  cbr_ctl->MinQP = avctx->qmin;
1003  cbr_ctl->MaxQP = avctx->qmax;
1004  ctx->rc.Flags |= D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_QP_RANGE;
1005  }
1006 
1007  ctx->rc.ConfigParams.pConfiguration_CBR = cbr_ctl;
1008  break;
1009 
1010  case RC_MODE_VBR:
1011  D3D12_VIDEO_ENCODER_RATE_CONTROL_VBR *vbr_ctl;
1012 
1013  ctx->rc.ConfigParams.DataSize = sizeof(D3D12_VIDEO_ENCODER_RATE_CONTROL_VBR);
1014  vbr_ctl = av_mallocz(ctx->rc.ConfigParams.DataSize);
1015  if (!vbr_ctl)
1016  return AVERROR(ENOMEM);
1017 
1018  vbr_ctl->TargetAvgBitRate = rc_target_bitrate;
1019  vbr_ctl->PeakBitRate = rc_peak_bitrate;
1020  vbr_ctl->VBVCapacity = hrd_buffer_size;
1021  vbr_ctl->InitialVBVFullness = hrd_initial_buffer_fullness;
1022  ctx->rc.Flags |= D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_VBV_SIZES;
1023 
1024  if (avctx->qmin > 0 || avctx->qmax > 0) {
1025  vbr_ctl->MinQP = avctx->qmin;
1026  vbr_ctl->MaxQP = avctx->qmax;
1027  ctx->rc.Flags |= D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_QP_RANGE;
1028  }
1029 
1030  ctx->rc.ConfigParams.pConfiguration_VBR = vbr_ctl;
1031  break;
1032 
1033  case RC_MODE_QVBR:
1034  D3D12_VIDEO_ENCODER_RATE_CONTROL_QVBR *qvbr_ctl;
1035 
1036  ctx->rc.ConfigParams.DataSize = sizeof(D3D12_VIDEO_ENCODER_RATE_CONTROL_QVBR);
1037  qvbr_ctl = av_mallocz(ctx->rc.ConfigParams.DataSize);
1038  if (!qvbr_ctl)
1039  return AVERROR(ENOMEM);
1040 
1041  qvbr_ctl->TargetAvgBitRate = rc_target_bitrate;
1042  qvbr_ctl->PeakBitRate = rc_peak_bitrate;
1043  qvbr_ctl->ConstantQualityTarget = rc_quality;
1044 
1045  if (avctx->qmin > 0 || avctx->qmax > 0) {
1046  qvbr_ctl->MinQP = avctx->qmin;
1047  qvbr_ctl->MaxQP = avctx->qmax;
1048  ctx->rc.Flags |= D3D12_VIDEO_ENCODER_RATE_CONTROL_FLAG_ENABLE_QP_RANGE;
1049  }
1050 
1051  ctx->rc.ConfigParams.pConfiguration_QVBR = qvbr_ctl;
1052  break;
1053 
1054  default:
1055  break;
1056  }
1057  return 0;
1058 }
1059 
/*
 * Query the driver's picture-control capabilities for the selected codec and
 * profile, derive the L0/L1 reference counts from them, and pass those to
 * ff_hw_base_init_gop_structure().
 *
 * Returns 0 on success, AVERROR(EINVAL) if the capability query fails, or the
 * negative error returned by ff_hw_base_init_gop_structure().
 *
 * NOTE(review): `ctx` is declared on a line that is not shown in this
 * listing; presumably it is the D3D12VA encoder context obtained from
 * avctx->priv_data -- confirm against the full file.
 */
1061 {
1062  FFHWBaseEncodeContext *base_ctx = avctx->priv_data;
1064  uint32_t ref_l0, ref_l1;
1065  int err;
1066  HRESULT hr;
1067  D3D12_FEATURE_DATA_VIDEO_ENCODER_CODEC_PICTURE_CONTROL_SUPPORT support;
      /* Codec-specific result storage; support.PictureSupport is pointed at
       * the member matching the active codec below. */
1068  union {
1069  D3D12_VIDEO_ENCODER_CODEC_PICTURE_CONTROL_SUPPORT_H264 h264;
1070  D3D12_VIDEO_ENCODER_CODEC_PICTURE_CONTROL_SUPPORT_HEVC hevc;
1071  } codec_support;
1072 
1073  support.NodeIndex = 0;
1074  support.Codec = ctx->codec->d3d12_codec;
1075  support.Profile = ctx->profile->d3d12_profile;
1076 
1077  switch (ctx->codec->d3d12_codec) {
1078  case D3D12_VIDEO_ENCODER_CODEC_H264:
1079  support.PictureSupport.DataSize = sizeof(codec_support.h264);
1080  support.PictureSupport.pH264Support = &codec_support.h264;
1081  break;
1082 
1083  case D3D12_VIDEO_ENCODER_CODEC_HEVC:
1084  support.PictureSupport.DataSize = sizeof(codec_support.hevc);
1085  support.PictureSupport.pHEVCSupport = &codec_support.hevc;
1086  break;
1087 
1088  default:
      /* Only H.264 and HEVC are handled; any other codec aborts here. */
1089  av_assert0(0);
1090  }
1091 
1092  hr = ID3D12VideoDevice3_CheckFeatureSupport(ctx->video_device3, D3D12_FEATURE_VIDEO_ENCODER_CODEC_PICTURE_CONTROL_SUPPORT,
1093  &support, sizeof(support));
1094  if (FAILED(hr))
1095  return AVERROR(EINVAL);
1096 
1097  if (support.IsSupported) {
1098  switch (ctx->codec->d3d12_codec) {
1099  case D3D12_VIDEO_ENCODER_CODEC_H264:
      /* L0 count is the smaller of the P-frame L0 limit and the B-frame
       * L1 limit; L1 count is the B-frame L1 limit. */
1100  ref_l0 = FFMIN(support.PictureSupport.pH264Support->MaxL0ReferencesForP,
1101  support.PictureSupport.pH264Support->MaxL1ReferencesForB);
1102  ref_l1 = support.PictureSupport.pH264Support->MaxL1ReferencesForB;
1103  break;
1104 
1105  case D3D12_VIDEO_ENCODER_CODEC_HEVC:
      /* Same derivation as the H.264 case, from the HEVC capability struct. */
1106  ref_l0 = FFMIN(support.PictureSupport.pHEVCSupport->MaxL0ReferencesForP,
1107  support.PictureSupport.pHEVCSupport->MaxL1ReferencesForB);
1108  ref_l1 = support.PictureSupport.pHEVCSupport->MaxL1ReferencesForB;
1109  break;
1110 
1111  default:
1112  av_assert0(0);
1113  }
1114  } else {
      /* Query succeeded but reported no support: no references in either list. */
1115  ref_l0 = ref_l1 = 0;
1116  }
1117 
      /* NOTE(review): ctx->bi_not_empty is set outside this listing; presumably
       * it marks drivers that need a non-empty L1 list -- confirm. */
1118  if (ref_l0 > 0 && ref_l1 > 0 && ctx->bi_not_empty) {
1119  base_ctx->p_to_gpb = 1;
1120  av_log(avctx, AV_LOG_VERBOSE, "Driver does not support P-frames, "
1121  "replacing them with B-frames.\n");
1122  }
1123 
      /* The final argument (prediction_pre_only) is passed as 0. */
1124  err = ff_hw_base_init_gop_structure(base_ctx, avctx, ref_l0, ref_l1, ctx->codec->flags, 0);
1125  if (err < 0)
1126  return err;
1127 
1128  return 0;
1129 }
1130 
/*
 * Create the ID3D12VideoEncoder for the configured codec, profile, input
 * format and codec configuration, and store it in ctx->encoder.
 *
 * Returns 0 on success; logs an error and returns AVERROR(EINVAL) if
 * CreateVideoEncoder fails.
 *
 * NOTE(review): `ctx` is declared on a line that is not shown in this
 * listing -- confirm its declaration against the full file.
 */
1132 {
1133  FFHWBaseEncodeContext *base_ctx = avctx->priv_data;
1135  AVD3D12VAFramesContext *frames_hwctx = base_ctx->input_frames->hwctx;
1136  HRESULT hr;
1137 
      /* The input format is taken from the input frames context. */
1138  D3D12_VIDEO_ENCODER_DESC desc = {
1139  .NodeMask = 0,
1140  .Flags = D3D12_VIDEO_ENCODER_FLAG_NONE,
1141  .EncodeCodec = ctx->codec->d3d12_codec,
1142  .EncodeProfile = ctx->profile->d3d12_profile,
1143  .InputFormat = frames_hwctx->format,
1144  .CodecConfiguration = ctx->codec_conf,
1145  .MaxMotionEstimationPrecision = D3D12_VIDEO_ENCODER_MOTION_ESTIMATION_PRECISION_MODE_MAXIMUM,
1146  };
1147 
1148  hr = ID3D12VideoDevice3_CreateVideoEncoder(ctx->video_device3, &desc, &IID_ID3D12VideoEncoder,
1149  (void **)&ctx->encoder);
1150  if (FAILED(hr)) {
1151  av_log(avctx, AV_LOG_ERROR, "Failed to create encoder.\n");
1152  return AVERROR(EINVAL);
1153  }
1154 
1155  return 0;
1156 }
1157 
/*
 * Create the ID3D12VideoEncoderHeap for the configured codec, profile and
 * level with a single-entry resolution list (ctx->resolution), and store it
 * in ctx->encoder_heap.
 *
 * Returns 0 on success; logs an error and returns AVERROR(EINVAL) if
 * CreateVideoEncoderHeap fails.
 *
 * NOTE(review): `ctx` is declared on a line that is not shown in this
 * listing -- confirm its declaration against the full file.
 */
1159 {
1161  HRESULT hr;
1162 
1163  D3D12_VIDEO_ENCODER_HEAP_DESC desc = {
1164  .NodeMask = 0,
1165  .Flags = D3D12_VIDEO_ENCODER_FLAG_NONE,
1166  .EncodeCodec = ctx->codec->d3d12_codec,
1167  .EncodeProfile = ctx->profile->d3d12_profile,
1168  .EncodeLevel = ctx->level,
      /* Exactly one resolution is registered with the heap. */
1169  .ResolutionsListCount = 1,
1170  .pResolutionList = &ctx->resolution,
1171  };
1172 
1173  hr = ID3D12VideoDevice3_CreateVideoEncoderHeap(ctx->video_device3, &desc,
1174  &IID_ID3D12VideoEncoderHeap, (void **)&ctx->encoder_heap);
1175  if (FAILED(hr)) {
1176  av_log(avctx, AV_LOG_ERROR, "Failed to create encoder heap.\n");
1177  return AVERROR(EINVAL);
1178  }
1179 
1180  return 0;
1181 }
1182 
/*
 * Release the D3D12 resource carried in a buffer's data pointer.
 *
 * `data` is not a byte array here: it is reinterpreted as an
 * ID3D12Resource pointer and released. `opaque` is unused.
 * The signature matches the free callback accepted by av_buffer_create().
 */
1183 static void d3d12va_encode_free_buffer(void *opaque, uint8_t *data)
1184 {
1185  ID3D12Resource *pResource;
1186 
1187  pResource = (ID3D12Resource *)data;
1188  D3D12_OBJECT_RELEASE(pResource);
1189 }
1190 
/*
 * Allocate one output buffer: a committed D3D12 buffer resource on a
 * READBACK heap, wrapped in an AVBufferRef whose data pointer is the
 * ID3D12Resource pointer itself.
 *
 * `opaque` is the AVCodecContext. The `size` parameter is not referenced in
 * the lines shown; the resource width is computed from the surface size.
 *
 * Returns the new AVBufferRef, or NULL if resource creation (logged) or
 * av_buffer_create() fails.
 *
 * NOTE(review): `ctx` is declared on a line that is not shown in this
 * listing -- confirm its declaration against the full file.
 */
1192 {
1193  AVCodecContext *avctx = opaque;
1194  FFHWBaseEncodeContext *base_ctx = avctx->priv_data;
1196  ID3D12Resource *pResource = NULL;
1197  HRESULT hr;
1198  AVBufferRef *ref;
1199  D3D12_HEAP_PROPERTIES heap_props;
1200  D3D12_HEAP_TYPE heap_type = D3D12_HEAP_TYPE_READBACK;
1201 
1202  D3D12_RESOURCE_DESC desc = {
1203  .Dimension = D3D12_RESOURCE_DIMENSION_BUFFER,
1204  .Alignment = 0,
      /* 3 * surface_width * surface_height plus 64 KiB, rounded up to
       * D3D12_TEXTURE_DATA_PLACEMENT_ALIGNMENT. */
1205  .Width = FFALIGN(3 * base_ctx->surface_width * base_ctx->surface_height + (1 << 16),
1206  D3D12_TEXTURE_DATA_PLACEMENT_ALIGNMENT),
1207  .Height = 1,
1208  .DepthOrArraySize = 1,
1209  .MipLevels = 1,
1210  .Format = DXGI_FORMAT_UNKNOWN,
1211  .SampleDesc = { .Count = 1, .Quality = 0 },
1212  .Layout = D3D12_TEXTURE_LAYOUT_ROW_MAJOR,
1213  .Flags = D3D12_RESOURCE_FLAG_NONE,
1214  };
1215 
      /* Fill heap_props for the READBACK heap type (node mask 0). */
1216  ctx->hwctx->device->lpVtbl->GetCustomHeapProperties(ctx->hwctx->device, &heap_props, 0, heap_type);
1217 
1218  hr = ID3D12Device_CreateCommittedResource(ctx->hwctx->device, &heap_props, D3D12_HEAP_FLAG_NONE,
1219  &desc, D3D12_RESOURCE_STATE_COMMON, NULL, &IID_ID3D12Resource,
1220  (void **)&pResource);
1221 
1222  if (FAILED(hr)) {
1223  av_log(avctx, AV_LOG_ERROR, "Failed to create d3d12 buffer.\n");
1224  return NULL;
1225  }
1226 
      /* The resource pointer is stored as the buffer's data pointer.
       * NOTE(review): the free-callback argument line of this call is not
       * shown in this listing. */
1227  ref = av_buffer_create((uint8_t *)(uintptr_t)pResource,
1228  sizeof(pResource),
1230  avctx, AV_BUFFER_FLAG_READONLY);
1231  if (!ref) {
      /* Wrapping failed, so the resource is released here. */
1232  D3D12_OBJECT_RELEASE(pResource);
1233  return NULL;
1234  }
1235 
1236  return ref;
1237 }
1238 
/*
 * Check the encoder resource requirements for the configured codec, profile,
 * input format and target resolution, then create the output buffer pool.
 *
 * Returns 0 on success, AVERROR(EINVAL) if the query fails or reports the
 * configuration as unsupported (both logged), or AVERROR(ENOMEM) if the
 * buffer pool cannot be created.
 *
 * NOTE(review): `ctx` is declared on a line that is not shown in this
 * listing -- confirm its declaration against the full file.
 */
1240 {
1241  FFHWBaseEncodeContext *base_ctx = avctx->priv_data;
1243  AVD3D12VAFramesContext *frames_ctx = base_ctx->input_frames->hwctx;
1244  HRESULT hr;
1245 
      /* The request is kept in ctx->req, so the driver's answer remains
       * available in the context after this function returns. */
1246  ctx->req.NodeIndex = 0;
1247  ctx->req.Codec = ctx->codec->d3d12_codec;
1248  ctx->req.Profile = ctx->profile->d3d12_profile;
1249  ctx->req.InputFormat = frames_ctx->format;
1250  ctx->req.PictureTargetResolution = ctx->resolution;
1251 
1252  hr = ID3D12VideoDevice3_CheckFeatureSupport(ctx->video_device3,
1253  D3D12_FEATURE_VIDEO_ENCODER_RESOURCE_REQUIREMENTS,
1254  &ctx->req, sizeof(ctx->req));
1255  if (FAILED(hr)) {
1256  av_log(avctx, AV_LOG_ERROR, "Failed to check encoder resource requirements support.\n");
1257  return AVERROR(EINVAL);
1258  }
1259 
1260  if (!ctx->req.IsSupported) {
1261  av_log(avctx, AV_LOG_ERROR, "Encoder resource requirements unsupported.\n");
1262  return AVERROR(EINVAL);
1263  }
1264 
      /* Pool elements are sized as one ID3D12Resource pointer.
       * NOTE(review): the remaining arguments of this call (allocator and
       * pool_free callbacks) are on a line not shown in this listing. */
1265  ctx->output_buffer_pool = av_buffer_pool_init2(sizeof(ID3D12Resource *), avctx,
1267  if (!ctx->output_buffer_pool)
1268  return AVERROR(ENOMEM);
1269 
1270  return 0;
1271 }
1272 
/*
 * Create the synchronisation and command objects used for encoding: the
 * fence and its event, a VIDEO_ENCODE command queue and a command list.
 * The freshly created command list is closed and executed once, the GPU is
 * waited on via d3d12va_sync_with_gpu(), and the command allocator is then
 * handed to d3d12va_discard_command_allocator() with the current fence value.
 *
 * Returns 0 on success, AVERROR(ENOMEM) if ctx->allocator_queue is NULL,
 * AVERROR_UNKNOWN if a D3D12/Win32 object cannot be created, or the negative
 * error from one of the helper calls. On failure the local command allocator
 * is released; objects already stored in ctx are left in place.
 *
 * NOTE(review): `ctx` is declared on a line that is not shown in this
 * listing -- confirm its declaration against the full file.
 */
1274 {
1276  ID3D12CommandAllocator *command_allocator = NULL;
1277  int err;
1278  HRESULT hr;
1279 
1280  D3D12_COMMAND_QUEUE_DESC queue_desc = {
1281  .Type = D3D12_COMMAND_LIST_TYPE_VIDEO_ENCODE,
1282  .Priority = 0,
1283  .Flags = D3D12_COMMAND_QUEUE_FLAG_NONE,
1284  .NodeMask = 0,
1285  };
1286 
      /* NOTE(review): the statement that assigns ctx->allocator_queue is on
       * lines not shown in this listing. */
1289  if (!ctx->allocator_queue)
1290  return AVERROR(ENOMEM);
1291 
1292  hr = ID3D12Device_CreateFence(ctx->hwctx->device, 0, D3D12_FENCE_FLAG_NONE,
1293  &IID_ID3D12Fence, (void **)&ctx->sync_ctx.fence);
1294  if (FAILED(hr)) {
1295  av_log(avctx, AV_LOG_ERROR, "Failed to create fence(%lx)\n", (long)hr);
1296  err = AVERROR_UNKNOWN;
1297  goto fail;
1298  }
1299 
1300  ctx->sync_ctx.event = CreateEvent(NULL, FALSE, FALSE, NULL);
1301  if (!ctx->sync_ctx.event) {
      /* err must be set before jumping to fail; it was previously left
       * unassigned on this path, so an indeterminate value was returned.
       * AVERROR_UNKNOWN matches the other object-creation failures here. */
      err = AVERROR_UNKNOWN;
1302  goto fail;
      }
1303 
1304  err = d3d12va_get_valid_command_allocator(avctx, &command_allocator);
1305  if (err < 0)
1306  goto fail;
1307 
1308  hr = ID3D12Device_CreateCommandQueue(ctx->hwctx->device, &queue_desc,
1309  &IID_ID3D12CommandQueue, (void **)&ctx->command_queue);
1310  if (FAILED(hr)) {
1311  av_log(avctx, AV_LOG_ERROR, "Failed to create command queue(%lx)\n", (long)hr);
1312  err = AVERROR_UNKNOWN;
1313  goto fail;
1314  }
1315 
1316  hr = ID3D12Device_CreateCommandList(ctx->hwctx->device, 0, queue_desc.Type,
1317  command_allocator, NULL, &IID_ID3D12CommandList,
1318  (void **)&ctx->command_list);
1319  if (FAILED(hr)) {
1320  av_log(avctx, AV_LOG_ERROR, "Failed to create command list(%lx)\n", (long)hr);
1321  err = AVERROR_UNKNOWN;
1322  goto fail;
1323  }
1324 
      /* Close the new command list, with nothing recorded into it here,
       * before submitting it. */
1325  hr = ID3D12VideoEncodeCommandList2_Close(ctx->command_list);
1326  if (FAILED(hr)) {
1327  av_log(avctx, AV_LOG_ERROR, "Failed to close the command list(%lx)\n", (long)hr);
1328  err = AVERROR_UNKNOWN;
1329  goto fail;
1330  }
1331 
1332  ID3D12CommandQueue_ExecuteCommandLists(ctx->command_queue, 1, (ID3D12CommandList **)&ctx->command_list);
1333 
1334  err = d3d12va_sync_with_gpu(avctx);
1335  if (err < 0)
1336  goto fail;
1337 
      /* Hand the allocator over together with the fence value reached above. */
1338  err = d3d12va_discard_command_allocator(avctx, command_allocator, ctx->sync_ctx.fence_value);
1339  if (err < 0)
1340  goto fail;
1341 
1342  return 0;
1343 
1344 fail:
1345  D3D12_OBJECT_RELEASE(command_allocator);
1346  return err;
1347 }
1348 
/*
 * Allocate and initialise the hardware frames context used for
 * reconstructed pictures, storing it in base_ctx->recon_frames_ref /
 * base_ctx->recon_frames.
 *
 * Returns 0 on success, the error from ff_hw_base_get_recon_format() or
 * av_hwframe_ctx_init() (the latter logged), or AVERROR(ENOMEM) if the
 * frames context cannot be allocated.
 */
1350 {
1351  FFHWBaseEncodeContext *base_ctx = avctx->priv_data;
1352  AVD3D12VAFramesContext *hwctx;
1353  enum AVPixelFormat recon_format;
1354  int err;
1355 
      /* No hwconfig is supplied (NULL) when asking for the recon format. */
1356  err = ff_hw_base_get_recon_format(base_ctx, NULL, &recon_format);
1357  if (err < 0)
1358  return err;
1359 
1360  base_ctx->recon_frames_ref = av_hwframe_ctx_alloc(base_ctx->device_ref);
1361  if (!base_ctx->recon_frames_ref)
1362  return AVERROR(ENOMEM);
1363 
1364  base_ctx->recon_frames = (AVHWFramesContext *)base_ctx->recon_frames_ref->data;
1365  hwctx = (AVD3D12VAFramesContext *)base_ctx->recon_frames->hwctx;
1366 
      /* D3D12 surfaces with the chosen software format at the encoder's
       * surface dimensions. */
1367  base_ctx->recon_frames->format = AV_PIX_FMT_D3D12;
1368  base_ctx->recon_frames->sw_format = recon_format;
1369  base_ctx->recon_frames->width = base_ctx->surface_width;
1370  base_ctx->recon_frames->height = base_ctx->surface_height;
1371 
      /* Resource flags requested for every frame in this context. */
1372  hwctx->flags = D3D12_RESOURCE_FLAG_VIDEO_ENCODE_REFERENCE_ONLY |
1373  D3D12_RESOURCE_FLAG_DENY_SHADER_RESOURCE;
1374 
1375  err = av_hwframe_ctx_init(base_ctx->recon_frames_ref);
1376  if (err < 0) {
1377  av_log(avctx, AV_LOG_ERROR, "Failed to initialise reconstructed "
1378  "frame context: %d.\n", err);
1379  return err;
1380  }
1381 
1382  return 0;
1383 }
1384 
1387 
/* Picture operation callbacks; this table is installed as base_ctx->op
 * during encoder init.
 * NOTE(review): the opening line of this initializer and its first member
 * are not shown in this listing. */
1388  .issue = &d3d12va_encode_issue,
1389 
1390  .output = &d3d12va_encode_output,
1391 
1392  .free = &d3d12va_encode_free,
1393 };
1394 
/*
 * Thin wrapper: forwards to ff_hw_base_encode_receive_packet(), passing
 * avctx->priv_data as the base encode context, and returns its result.
 */
1396 {
1397  return ff_hw_base_encode_receive_packet(avctx->priv_data, avctx, pkt);
1398 }
1399 
/*
 * Initialise the D3D12VA encoder.
 *
 * Steps visible here, in order: base encode init, acquisition of the
 * ID3D12Device3 / ID3D12VideoDevice3 interfaces, a check that the device
 * supports video encoding, profile and rate-control setup, optional
 * codec-specific capability query, GOP structure setup, optional codec
 * configure / sequence-parameter / level callbacks, creation of the encoder
 * and encoder heap, and allocation of the async encode FIFO.
 *
 * Returns 0 on success or a negative AVERROR code. No cleanup is performed
 * here on failure.
 *
 * NOTE(review): `ctx` is declared on a line that is not shown in this
 * listing -- confirm its declaration against the full file.
 */
1401 {
1402  FFHWBaseEncodeContext *base_ctx = avctx->priv_data;
1404  D3D12_FEATURE_DATA_VIDEO_FEATURE_AREA_SUPPORT support = { 0 };
1405  int err;
1406  HRESULT hr;
1407 
1408  err = ff_hw_base_encode_init(avctx, base_ctx);
1409  if (err < 0)
1410  goto fail;
1411 
1412  base_ctx->op = &d3d12va_type;
1413 
1414  ctx->hwctx = base_ctx->device->hwctx;
1415 
      /* The encode resolution is taken from the input frames context. */
1416  ctx->resolution.Width = base_ctx->input_frames->width;
1417  ctx->resolution.Height = base_ctx->input_frames->height;
1418 
1419  hr = ID3D12Device_QueryInterface(ctx->hwctx->device, &IID_ID3D12Device3, (void **)&ctx->device3);
1420  if (FAILED(hr)) {
1421  av_log(avctx, AV_LOG_ERROR, "ID3D12Device3 interface is not supported.\n");
1422  err = AVERROR_UNKNOWN;
1423  goto fail;
1424  }
1425 
1426  hr = ID3D12Device3_QueryInterface(ctx->device3, &IID_ID3D12VideoDevice3, (void **)&ctx->video_device3);
1427  if (FAILED(hr)) {
1428  av_log(avctx, AV_LOG_ERROR, "ID3D12VideoDevice3 interface is not supported.\n");
1429  err = AVERROR_UNKNOWN;
1430  goto fail;
1431  }
1432 
      /* Reject the device if the query fails OR if it succeeds but reports
       * no encode support. The previous '&&' only rejected when the query
       * itself failed, so a device reporting VideoEncodeSupport == 0 was
       * accepted. */
1433  if (FAILED(ID3D12VideoDevice3_CheckFeatureSupport(ctx->video_device3, D3D12_FEATURE_VIDEO_FEATURE_AREA_SUPPORT,
1434  &support, sizeof(support))) || !support.VideoEncodeSupport) {
1435  av_log(avctx, AV_LOG_ERROR, "D3D12 video device has no video encoder support.\n");
1436  err = AVERROR(EINVAL);
1437  goto fail;
1438  }
1439 
1440  err = d3d12va_encode_set_profile(avctx);
1441  if (err < 0)
1442  goto fail;
1443 
1444  err = d3d12va_encode_init_rate_control(avctx);
1445  if (err < 0)
1446  goto fail;
1447 
1448  if (ctx->codec->get_encoder_caps) {
1449  err = ctx->codec->get_encoder_caps(avctx);
1450  if (err < 0)
1451  goto fail;
1452  }
1453 
1454  err = d3d12va_encode_init_gop_structure(avctx);
1455  if (err < 0)
1456  goto fail;
1457 
      /* Slice requests are only warned about, not rejected, when the codec
       * lacks slice control. */
1458  if (!(ctx->codec->flags & FF_HW_FLAG_SLICE_CONTROL) && avctx->slices > 0) {
1459  av_log(avctx, AV_LOG_WARNING, "Multiple slices were requested "
1460  "but this codec does not support controlling slices.\n");
1461  }
1462 
      /* NOTE(review): the call that assigns err before each of the next
       * three checks is on a line not shown in this listing. */
1464  if (err < 0)
1465  goto fail;
1466 
1468  if (err < 0)
1469  goto fail;
1470 
1472  if (err < 0)
1473  goto fail;
1474 
1475  if (ctx->codec->configure) {
1476  err = ctx->codec->configure(avctx);
1477  if (err < 0)
1478  goto fail;
1479  }
1480 
1481  if (ctx->codec->init_sequence_params) {
1482  err = ctx->codec->init_sequence_params(avctx);
1483  if (err < 0) {
1484  av_log(avctx, AV_LOG_ERROR, "Codec sequence initialisation "
1485  "failed: %d.\n", err);
1486  goto fail;
1487  }
1488  }
1489 
1490  if (ctx->codec->set_level) {
1491  err = ctx->codec->set_level(avctx);
1492  if (err < 0)
1493  goto fail;
1494  }
1495 
1496  base_ctx->output_delay = base_ctx->b_per_p;
1497  base_ctx->decode_delay = base_ctx->max_b_depth;
1498 
1499  err = d3d12va_create_encoder(avctx);
1500  if (err < 0)
1501  goto fail;
1502 
1503  err = d3d12va_create_encoder_heap(avctx);
1504  if (err < 0)
1505  goto fail;
1506 
      /* The FIFO holds async_depth picture pointers. */
1507  base_ctx->async_encode = 1;
1508  base_ctx->encode_fifo = av_fifo_alloc2(base_ctx->async_depth,
1509  sizeof(D3D12VAEncodePicture *), 0);
1510  if (!base_ctx->encode_fifo)
1511  return AVERROR(ENOMEM);
1512 
1513  return 0;
1514 
1515 fail:
1516  return err;
1517 }
1518 
/*
 * Tear down the encoder: free every picture still linked from
 * base_ctx->pic_start, uninit the output buffer pool, release the command
 * list and queue, drain and free the allocator queue, release the fence and
 * event, release the encoder heap, encoder and device interfaces, then close
 * the base encode context.
 *
 * Always returns 0. Returns immediately, without any cleanup, when
 * base_ctx->frame is NULL.
 *
 * NOTE(review): `ctx` is declared on a line that is not shown in this
 * listing -- confirm its declaration against the full file.
 */
1520 {
1521  int num_allocator = 0;
1522  FFHWBaseEncodeContext *base_ctx = avctx->priv_data;
1524  FFHWBaseEncodePicture *pic, *next;
1525  CommandAllocator allocator;
1526 
      /* NOTE(review): presumably a NULL frame means init did not get far
       * enough to allocate anything -- confirm. */
1527  if (!base_ctx->frame)
1528  return 0;
1529 
      /* Save the next pointer before freeing the current picture. */
1530  for (pic = base_ctx->pic_start; pic; pic = next) {
1531  next = pic->next;
1532  d3d12va_encode_free(avctx, pic);
1533  }
1534 
      /* NOTE(review): one statement here (upstream line 1535) is not shown
       * in this listing. */
1536 
1537  av_buffer_pool_uninit(&ctx->output_buffer_pool);
1538 
1539  D3D12_OBJECT_RELEASE(ctx->command_list);
1540  D3D12_OBJECT_RELEASE(ctx->command_queue);
1541 
1542  if (ctx->allocator_queue) {
      /* Drain the queue, counting each entry read.
       * NOTE(review): one statement in the loop body (upstream line 1545)
       * is not shown in this listing. */
1543  while (av_fifo_read(ctx->allocator_queue, &allocator, 1) >= 0) {
1544  num_allocator++;
1546  }
1547 
1548  av_log(avctx, AV_LOG_VERBOSE, "Total number of command allocators reused: %d\n", num_allocator);
1549  }
1550 
1551  av_fifo_freep2(&ctx->allocator_queue);
1552 
1553  D3D12_OBJECT_RELEASE(ctx->sync_ctx.fence);
1554  if (ctx->sync_ctx.event)
1555  CloseHandle(ctx->sync_ctx.event);
1556 
1557  D3D12_OBJECT_RELEASE(ctx->encoder_heap);
1558  D3D12_OBJECT_RELEASE(ctx->encoder);
1559  D3D12_OBJECT_RELEASE(ctx->video_device3);
1560  D3D12_OBJECT_RELEASE(ctx->device3);
1561 
1562  ff_hw_base_encode_close(base_ctx);
1563 
1564  return 0;
1565 }
FFHWBaseEncodeContext::output_delay
int64_t output_delay
Definition: hw_base_encode.h:164
AVHWDeviceContext::hwctx
void * hwctx
The format-specific data, allocated and freed by libavutil along with this context.
Definition: hwcontext.h:85
RC_MODE_QVBR
@ RC_MODE_QVBR
Definition: d3d12va_encode.h:98
d3d12va_encode_output
static int d3d12va_encode_output(AVCodecContext *avctx, const FFHWBaseEncodePicture *base_pic, AVPacket *pkt)
Definition: d3d12va_encode.c:676
AV_LOG_WARNING
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:186
AVPixelFormat
AVPixelFormat
Pixel format.
Definition: pixfmt.h:71
FFHWBaseEncodeContext::recon_frames_ref
AVBufferRef * recon_frames_ref
Definition: hw_base_encode.h:151
FFHWBaseEncodePicture::next
struct FFHWBaseEncodePicture * next
Definition: hw_base_encode.h:61
d3d12va_encode_set_profile
static int d3d12va_encode_set_profile(AVCodecContext *avctx)
Definition: d3d12va_encode.c:701
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
FFHWEncodePictureOperation::alloc
FFHWBaseEncodePicture *(* alloc)(AVCodecContext *avctx, const AVFrame *frame)
Definition: hw_base_encode.h:108
av_pix_fmt_desc_get
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
Definition: pixdesc.c:2965
AVBufferRef::data
uint8_t * data
The data buffer.
Definition: buffer.h:90
AVHWFramesContext::format
enum AVPixelFormat format
The pixel format identifying the underlying HW surface type.
Definition: hwcontext.h:197
AV_CODEC_FLAG_QSCALE
#define AV_CODEC_FLAG_QSCALE
Use fixed qscale.
Definition: avcodec.h:224
d3d12va_encode_create_recon_frames
static int d3d12va_encode_create_recon_frames(AVCodecContext *avctx)
Definition: d3d12va_encode.c:1349
av_frame_free
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g.
Definition: frame.c:160
av_fifo_peek
int av_fifo_peek(const AVFifo *f, void *buf, size_t nb_elems, size_t offset)
Read data from a FIFO without modifying FIFO state.
Definition: fifo.c:255
av_hwframe_ctx_init
int av_hwframe_ctx_init(AVBufferRef *ref)
Finalize the context before use.
Definition: hwcontext.c:322
FF_HW_FLAG_SLICE_CONTROL
@ FF_HW_FLAG_SLICE_CONTROL
Definition: hw_base_encode.h:46
AVFrame
This structure describes decoded (raw) audio or video data.
Definition: frame.h:374
pixdesc.h
D3D12VAEncodePicture::input_surface
AVD3D12VAFrame * input_surface
Definition: d3d12va_encode.h:47
av_hwframe_ctx_alloc
AVBufferRef * av_hwframe_ctx_alloc(AVBufferRef *device_ref_in)
Allocate an AVHWFramesContext tied to a given device context.
Definition: hwcontext.c:248
AVPacket::data
uint8_t * data
Definition: packet.h:520
d3d12va_encode_discard
static int d3d12va_encode_discard(AVCodecContext *avctx, D3D12VAEncodePicture *pic)
Definition: d3d12va_encode.c:517
ff_hw_base_encode_init
int ff_hw_base_encode_init(AVCodecContext *avctx, FFHWBaseEncodeContext *ctx)
Definition: hw_base_encode.c:752
encode.h
d3d12va_encode.h
d3d12va_encode_get_coded_data
static int d3d12va_encode_get_coded_data(AVCodecContext *avctx, D3D12VAEncodePicture *pic, AVPacket *pkt)
Definition: d3d12va_encode.c:640
data
const char data[16]
Definition: mxf.c:148
FFHWBaseEncodePicture::recon_image
AVFrame * recon_image
Definition: hw_base_encode.h:78
AV_LOG_VERBOSE
#define AV_LOG_VERBOSE
Detailed information.
Definition: log.h:196
AVERROR_UNKNOWN
#define AVERROR_UNKNOWN
Unknown error, typically from an external library.
Definition: error.h:73
AVHWFramesContext::width
int width
The allocated dimensions of the frames in this pool.
Definition: hwcontext.h:217
AVCodecContext::qmax
int qmax
maximum quantizer
Definition: avcodec.h:1263
AVFrame::data
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
Definition: frame.h:395
D3D12VAEncodePicture::resolved_metadata
ID3D12Resource * resolved_metadata
Definition: d3d12va_encode.h:54
FFHWBaseEncodeContext
Definition: hw_base_encode.h:117
AVCodecContext::framerate
AVRational framerate
Definition: avcodec.h:560
ff_d3d12va_encode_hw_configs
const AVCodecHWConfigInternal *const ff_d3d12va_encode_hw_configs[]
Definition: d3d12va_encode.c:36
D3D12VAEncodePicture::output_buffer_ref
AVBufferRef * output_buffer_ref
Definition: d3d12va_encode.h:50
d3d12va_sync_with_gpu
static int d3d12va_sync_with_gpu(AVCodecContext *avctx)
Definition: d3d12va_encode.c:54
FFHWBaseEncodePicture::type
int type
Definition: hw_base_encode.h:72
ff_hw_base_encode_close
int ff_hw_base_encode_close(FFHWBaseEncodeContext *ctx)
Definition: hw_base_encode.c:785
FFHWBaseEncodePicture::is_reference
int is_reference
Definition: hw_base_encode.h:83
fail
#define fail()
Definition: checkasm.h:186
av_fifo_write
int av_fifo_write(AVFifo *f, const void *buf, size_t nb_elems)
Write data into a FIFO.
Definition: fifo.c:188
D3D12VAEncodePicture::output_buffer
ID3D12Resource * output_buffer
Definition: d3d12va_encode.h:51
CommandAllocator::command_allocator
ID3D12CommandAllocator * command_allocator
Definition: d3d12va_encode.c:66
D3D12VAEncodePicture::recon_surface
AVD3D12VAFrame * recon_surface
Definition: d3d12va_encode.h:48
av_buffer_pool_init2
AVBufferPool * av_buffer_pool_init2(size_t size, void *opaque, AVBufferRef *(*alloc)(void *opaque, size_t size), void(*pool_free)(void *opaque))
Allocate and initialize a buffer pool with a more complex allocator.
Definition: buffer.c:259
AVCodecContext::flags
int flags
AV_CODEC_FLAG_*.
Definition: avcodec.h:502
FFHWBaseEncodePicture::input_image
AVFrame * input_image
Definition: hw_base_encode.h:77
CommandAllocator::fence_value
uint64_t fence_value
Definition: d3d12va_encode.c:67
ff_hw_base_init_gop_structure
int ff_hw_base_init_gop_structure(FFHWBaseEncodeContext *ctx, AVCodecContext *avctx, uint32_t ref_l0, uint32_t ref_l1, int flags, int prediction_pre_only)
Definition: hw_base_encode.c:630
d3d12va_encode_alloc
static FFHWBaseEncodePicture * d3d12va_encode_alloc(AVCodecContext *avctx, const AVFrame *frame)
Definition: d3d12va_encode.c:563
av_reduce
int av_reduce(int *dst_num, int *dst_den, int64_t num, int64_t den, int64_t max)
Reduce a fraction.
Definition: rational.c:35
AVRational::num
int num
Numerator.
Definition: rational.h:59
FFHWBaseEncodeContext::device
AVHWDeviceContext * device
Definition: hw_base_encode.h:144
avassert.h
d3d12va_encode_rc_modes
static const D3D12VAEncodeRCMode d3d12va_encode_rc_modes[]
Definition: d3d12va_encode.c:754
check_rate_control_support
static int check_rate_control_support(AVCodecContext *avctx, const D3D12VAEncodeRCMode *rc_mode)
Definition: d3d12va_encode.c:764
ff_hw_base_get_recon_format
int ff_hw_base_get_recon_format(FFHWBaseEncodeContext *ctx, const void *hwconfig, enum AVPixelFormat *fmt)
Definition: hw_base_encode.c:683
d3d12va_encode_get_buffer_size
static int d3d12va_encode_get_buffer_size(AVCodecContext *avctx, D3D12VAEncodePicture *pic, size_t *size)
Definition: d3d12va_encode.c:605
pkt
AVPacket * pkt
Definition: movenc.c:60
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:180
d3d12va_encode_issue
static int d3d12va_encode_issue(AVCodecContext *avctx, const FFHWBaseEncodePicture *base_pic)
Definition: d3d12va_encode.c:188
AV_PROFILE_UNKNOWN
#define AV_PROFILE_UNKNOWN
Definition: defs.h:65
av_fifo_read
int av_fifo_read(AVFifo *f, void *buf, size_t nb_elems)
Read data from a FIFO.
Definition: fifo.c:240
AVCodecContext::rc_initial_buffer_occupancy
int rc_initial_buffer_occupancy
Number of bits which should be loaded into the rc buffer before decoding starts.
Definition: avcodec.h:1320
AVHWFramesContext::height
int height
Definition: hwcontext.h:217
av_buffer_pool_get
AVBufferRef * av_buffer_pool_get(AVBufferPool *pool)
Allocate a new AVBuffer, reusing an old buffer from the pool when available.
Definition: buffer.c:384
width
#define width
AVCodecContext::global_quality
int global_quality
Global quality for codecs which cannot change it per frame.
Definition: avcodec.h:1239
D3D12_OBJECT_RELEASE
#define D3D12_OBJECT_RELEASE(pInterface)
A release macro used by D3D12 objects highly frequently.
Definition: hwcontext_d3d12va_internal.h:51
D3D12VAEncodePicture::header_size
int header_size
Definition: d3d12va_encode.h:45
AV_BUFFER_FLAG_READONLY
#define AV_BUFFER_FLAG_READONLY
Always treat the buffer as read-only, even when it has only one reference.
Definition: buffer.h:114
AVFormatContext::flags
int flags
Flags modifying the (de)muxer behaviour.
Definition: avformat.h:1406
RC_MODE_CQP
@ RC_MODE_CQP
Definition: d3d12va_encode.h:95
FFHWBaseEncodeContext::max_b_depth
int max_b_depth
Definition: hw_base_encode.h:183
FFHWBaseEncodeContext::async_encode
int async_encode
Definition: hw_base_encode.h:207
AVD3D12VAFrame::sync_ctx
AVD3D12VASyncContext sync_ctx
The sync context for the texture.
Definition: hwcontext_d3d12va.h:119
av_assert0
#define av_assert0(cond)
assert() equivalent, that is always enabled.
Definition: avassert.h:40
d3d12va_create_encoder_heap
static int d3d12va_create_encoder_heap(AVCodecContext *avctx)
Definition: d3d12va_encode.c:1158
FF_HW_FLAG_CONSTANT_QUALITY_ONLY
@ FF_HW_FLAG_CONSTANT_QUALITY_ONLY
Definition: hw_base_encode.h:48
FFHWBaseEncodePicture::priv_data
void * priv_data
Definition: hw_base_encode.h:80
AV_LOG_DEBUG
#define AV_LOG_DEBUG
Stuff which is only useful for libav* developers.
Definition: log.h:201
ctx
AVFormatContext * ctx
Definition: movenc.c:49
d3d12va_encode_wait
static int d3d12va_encode_wait(AVCodecContext *avctx, D3D12VAEncodePicture *pic)
Definition: d3d12va_encode.c:109
D3D12VAEncodePicture::pic_ctl
D3D12_VIDEO_ENCODER_PICTURE_CONTROL_CODEC_DATA pic_ctl
Definition: d3d12va_encode.h:56
AVD3D12VASyncContext
This struct is used to sync d3d12 execution.
Definition: hwcontext_d3d12va.h:84
FF_HW_PICTURE_TYPE_IDR
@ FF_HW_PICTURE_TYPE_IDR
Definition: hw_base_encode.h:38
AVCodecContext::rc_max_rate
int64_t rc_max_rate
maximum bitrate
Definition: avcodec.h:1292
AVD3D12VASyncContext::fence
ID3D12Fence * fence
D3D12 fence object.
Definition: hwcontext_d3d12va.h:88
D3D12VAEncodeRCMode
Definition: d3d12va_encode.h:103
FFHWBaseEncodeContext::pic_start
FFHWBaseEncodePicture * pic_start
Definition: hw_base_encode.h:155
FFHWBaseEncodeContext::b_per_p
int b_per_p
Definition: hw_base_encode.h:184
AVCodecContext::rc_buffer_size
int rc_buffer_size
decoder bitstream buffer size
Definition: avcodec.h:1277
d3d12va_discard_command_allocator
static int d3d12va_discard_command_allocator(AVCodecContext *avctx, ID3D12CommandAllocator *pAllocator, uint64_t fence_value)
Definition: d3d12va_encode.c:95
D3D12VAEncodePicture::fence_value
int fence_value
Definition: d3d12va_encode.h:58
NULL
#define NULL
Definition: coverity.c:32
AVHWFramesContext::sw_format
enum AVPixelFormat sw_format
The pixel format identifying the actual data layout of the hardware frames.
Definition: hwcontext.h:210
av_buffer_unref
void av_buffer_unref(AVBufferRef **buf)
Free a given reference and automatically free the buffer if there are no more references to it.
Definition: buffer.c:139
AVCodecContext::bit_rate
int64_t bit_rate
the average bitrate
Definition: avcodec.h:495
av_buffer_pool_uninit
void av_buffer_pool_uninit(AVBufferPool **ppool)
Mark the pool as being available for freeing.
Definition: buffer.c:322
FFHWEncodePictureOperation
Definition: hw_base_encode.h:105
AVD3D12VAFramesContext
This struct is allocated as AVHWFramesContext.hwctx.
Definition: hwcontext_d3d12va.h:126
AV_PIX_FMT_D3D12
@ AV_PIX_FMT_D3D12
Hardware surfaces for Direct3D 12.
Definition: pixfmt.h:440
AVD3D12VAFrame::texture
ID3D12Resource * texture
The texture in which the frame is located.
Definition: hwcontext_d3d12va.h:112
hwcontext_d3d12va.h
av_buffer_create
AVBufferRef * av_buffer_create(uint8_t *data, size_t size, void(*free)(void *opaque, uint8_t *data), void *opaque, int flags)
Create an AVBuffer from an existing array.
Definition: buffer.c:55
AVD3D12VAFramesContext::flags
D3D12_RESOURCE_FLAGS flags
Options for working with resources.
Definition: hwcontext_d3d12va.h:139
MAX_PARAM_BUFFER_SIZE
@ MAX_PARAM_BUFFER_SIZE
Definition: vaapi_encode.h:47
AVCodecContext::time_base
AVRational time_base
This is the fundamental unit of time (in seconds) in terms of which frame timestamps are represented.
Definition: avcodec.h:544
ff_hw_base_encode_set_output_property
int ff_hw_base_encode_set_output_property(FFHWBaseEncodeContext *ctx, AVCodecContext *avctx, FFHWBaseEncodePicture *pic, AVPacket *pkt, int flag_no_delay)
Definition: hw_base_encode.c:486
d3d12va_encode_free_buffer
static void d3d12va_encode_free_buffer(void *opaque, uint8_t *data)
Definition: d3d12va_encode.c:1183
d3d12va_encode_create_metadata_buffers
static int d3d12va_encode_create_metadata_buffers(AVCodecContext *avctx, D3D12VAEncodePicture *pic)
Definition: d3d12va_encode.c:142
FFHWBaseEncodeContext::frame
AVFrame * frame
Definition: hw_base_encode.h:202
d3d12va_get_valid_command_allocator
static int d3d12va_get_valid_command_allocator(AVCodecContext *avctx, ID3D12CommandAllocator **ppAllocator)
Definition: d3d12va_encode.c:70
d3d12va_encode_create_command_objects
static int d3d12va_encode_create_command_objects(AVCodecContext *avctx)
Definition: d3d12va_encode.c:1273
ff_d3d12va_encode_init
int ff_d3d12va_encode_init(AVCodecContext *avctx)
Definition: d3d12va_encode.c:1400
FFHWBaseEncodePicture::nb_refs
int nb_refs[MAX_REFERENCE_LIST_NUM]
Definition: hw_base_encode.h:93
CommandAllocator
Definition: d3d12va_encode.c:65
d3d12va_type
static const FFHWEncodePictureOperation d3d12va_type
Definition: d3d12va_encode.c:1385
D3D12VAEncodeProfile
Definition: d3d12va_encode.h:61
FFHWBaseEncodeContext::decode_delay
int64_t decode_delay
Definition: hw_base_encode.h:168
size
int size
Definition: twinvq_data.h:10344
ff_hw_base_encode_receive_packet
int ff_hw_base_encode_receive_packet(FFHWBaseEncodeContext *ctx, AVCodecContext *avctx, AVPacket *pkt)
Definition: hw_base_encode.c:525
D3D12VAEncodePicture::base
FFHWBaseEncodePicture base
Definition: d3d12va_encode.h:43
RC_MODE_CBR
@ RC_MODE_CBR
Definition: d3d12va_encode.h:96
AVCodecHWConfigInternal
Definition: hwconfig.h:25
FFHWBaseEncodeContext::p_to_gpb
int p_to_gpb
Definition: hw_base_encode.h:189
FFHWBaseEncodePicture::encode_order
int64_t encode_order
Definition: hw_base_encode.h:64
AVD3D12VAFrame
D3D12VA frame descriptor for pool allocation.
Definition: hwcontext_d3d12va.h:106
D3D12VA_VIDEO_ENC_ASYNC_DEPTH
#define D3D12VA_VIDEO_ENC_ASYNC_DEPTH
Definition: d3d12va_encode.h:40
D3D12VAEncodePicture::encoded_metadata
ID3D12Resource * encoded_metadata
Definition: d3d12va_encode.h:53
D3D12VAEncodePicture
Definition: d3d12va_encode.h:42
d3d12va_encode_alloc_output_buffer
static AVBufferRef * d3d12va_encode_alloc_output_buffer(void *opaque, size_t size)
Definition: d3d12va_encode.c:1191
HW_CONFIG_ENCODER_FRAMES
#define HW_CONFIG_ENCODER_FRAMES(format, device_type_)
Definition: hwconfig.h:98
log.h
FFHWBaseEncodeContext::op
const struct FFHWEncodePictureOperation * op
Definition: hw_base_encode.h:122
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:256
internal.h
TRY_RC_MODE
#define TRY_RC_MODE(mode, fail)
common.h
FFMIN
#define FFMIN(a, b)
Definition: macros.h:49
FFHWBaseEncodePicture::refs
struct FFHWBaseEncodePicture * refs[MAX_REFERENCE_LIST_NUM][MAX_PICTURE_REFERENCES]
Definition: hw_base_encode.h:94
d3d12va_fence_completion
static int d3d12va_fence_completion(AVD3D12VASyncContext *psync_ctx)
Definition: d3d12va_encode.c:41
av_mallocz
void * av_mallocz(size_t size)
Allocate a memory block with alignment suitable for all memory accesses (including vectors if availab...
Definition: mem.c:256
ff_hw_base_encode_free
int ff_hw_base_encode_free(FFHWBaseEncodePicture *pic)
Definition: hw_base_encode.c:741
profile
int profile
Definition: mxfenc.c:2228
av_calloc
void * av_calloc(size_t nmemb, size_t size)
Definition: mem.c:264
d3d12va_create_encoder
static int d3d12va_create_encoder(AVCodecContext *avctx)
Definition: d3d12va_encode.c:1131
avcodec.h
AVD3D12VAFramesContext::format
DXGI_FORMAT format
DXGI_FORMAT format.
Definition: hwcontext_d3d12va.h:131
AVHWFramesContext
This struct describes a set or pool of "hardware" frames (i.e.
Definition: hwcontext.h:115
d3d12va_encode_init_rate_control
static int d3d12va_encode_init_rate_control(AVCodecContext *avctx)
Definition: d3d12va_encode.c:789
FFHWBaseEncodePicture
Definition: hw_base_encode.h:60
frame
these buffered frames must be flushed immediately if a new input produces new the filter must not call request_frame to get more It must just process the frame or queue it The task of requesting more frames is left to the filter s request_frame method or the application If a filter has several the filter must be ready for frames arriving randomly on any input any filter with several inputs will most likely require some kind of queuing mechanism It is perfectly acceptable to have a limited queue and to drop frames when the inputs are too unbalanced request_frame For filters that do not use the this method is called when a frame is wanted on an output For a it should directly call filter_frame on the corresponding output For a if there are queued frames already one of these frames should be pushed If the filter should request a frame on one of its repeatedly until at least one frame has been pushed Return or at least make progress towards producing a frame
Definition: filter_design.txt:264
AVHWFramesContext::hwctx
void * hwctx
The format-specific data, allocated and freed automatically along with this context.
Definition: hwcontext.h:150
D3D12VAEncodeContext
Definition: d3d12va_encode.h:145
FFHWBaseEncodeContext::device_ref
AVBufferRef * device_ref
Definition: hw_base_encode.h:143
FFHWBaseEncodeContext::encode_fifo
AVFifo * encode_fifo
Definition: hw_base_encode.h:210
av_fifo_alloc2
AVFifo * av_fifo_alloc2(size_t nb_elems, size_t elem_size, unsigned int flags)
Allocate and initialize an AVFifo with a given element size.
Definition: fifo.c:47
ff_hw_base_encode_get_pictype_name
static const char * ff_hw_base_encode_get_pictype_name(const int type)
Definition: hw_base_encode.h:31
d3d12va_encode_prepare_output_buffers
static int d3d12va_encode_prepare_output_buffers(AVCodecContext *avctx)
Definition: d3d12va_encode.c:1239
FFHWBaseEncodeContext::surface_height
int surface_height
Definition: hw_base_encode.h:136
FFHWBaseEncodeContext::async_depth
int async_depth
Definition: hw_base_encode.h:212
AVCodecContext
main external API structure.
Definition: avcodec.h:445
AVD3D12VASyncContext::event
HANDLE event
A handle to the event object that's raised when the fence reaches a certain value.
Definition: hwcontext_d3d12va.h:94
ff_get_encode_buffer
int ff_get_encode_buffer(AVCodecContext *avctx, AVPacket *avpkt, int64_t size, int flags)
Get a buffer for a packet.
Definition: encode.c:106
AVCodecContext::qmin
int qmin
minimum quantizer
Definition: avcodec.h:1256
AVRational::den
int den
Denominator.
Definition: rational.h:60
AVCodecContext::profile
int profile
profile
Definition: avcodec.h:1640
d3d12va_encode_free_rc_params
static int d3d12va_encode_free_rc_params(AVCodecContext *avctx)
Definition: d3d12va_encode.c:538
ref
static int ref[MAX_W *MAX_W]
Definition: jpeg2000dwt.c:112
FFHWBaseEncodeContext::input_frames
AVHWFramesContext * input_frames
Definition: hw_base_encode.h:148
TRANSITION_BARRIER
#define TRANSITION_BARRIER(res, before, after)
FFHWBaseEncodeContext::surface_width
int surface_width
Definition: hw_base_encode.h:135
desc
const char * desc
Definition: libsvtav1.c:79
FFHWBaseEncodePicture::encode_complete
int encode_complete
Definition: hw_base_encode.h:75
mem.h
AVBufferRef
A reference to a data buffer.
Definition: buffer.h:82
d3d12va_encode_free
static int d3d12va_encode_free(AVCodecContext *avctx, FFHWBaseEncodePicture *base_pic)
Definition: d3d12va_encode.c:586
AVPixFmtDescriptor
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
Definition: pixdesc.h:69
ff_d3d12va_encode_close
int ff_d3d12va_encode_close(AVCodecContext *avctx)
Definition: d3d12va_encode.c:1519
av_free
#define av_free(p)
Definition: tableprint_vlc.h:33
FFALIGN
#define FFALIGN(x, a)
Definition: macros.h:78
AVCodecContext::slices
int slices
Number of slices.
Definition: avcodec.h:1047
ff_d3d12va_encode_receive_packet
int ff_d3d12va_encode_receive_packet(AVCodecContext *avctx, AVPacket *pkt)
Definition: d3d12va_encode.c:1395
AVPacket
This structure stores compressed data.
Definition: packet.h:497
AVCodecContext::priv_data
void * priv_data
Definition: avcodec.h:472
av_freep
#define av_freep(p)
Definition: tableprint_vlc.h:34
d3d12va_encode_init_gop_structure
static int d3d12va_encode_init_gop_structure(AVCodecContext *avctx)
Definition: d3d12va_encode.c:1060
FFHWBaseEncodeContext::recon_frames
AVHWFramesContext * recon_frames
Definition: hw_base_encode.h:152
DX_CHECK
#define DX_CHECK(hr)
A check macro used by D3D12 functions highly frequently.
Definition: hwcontext_d3d12va_internal.h:40
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:27
av_fifo_freep2
void av_fifo_freep2(AVFifo **f)
Free an AVFifo and reset pointer to NULL.
Definition: fifo.c:286
AVD3D12VASyncContext::fence_value
uint64_t fence_value
The fence value used for sync.
Definition: hwcontext_d3d12va.h:99
FFHWBaseEncodePicture::encode_issued
int encode_issued
Definition: hw_base_encode.h:74
FF_QP2LAMBDA
#define FF_QP2LAMBDA
factor to convert from H.263 QP to lambda
Definition: avutil.h:227
rc_mode
mfxU16 rc_mode
Definition: qsvenc.c:143
RC_MODE_VBR
@ RC_MODE_VBR
Definition: d3d12va_encode.h:97
hwcontext_d3d12va_internal.h
FFHWBaseEncodePicture::display_order
int64_t display_order
Definition: hw_base_encode.h:63
int
int
Definition: ffmpeg_filter.c:424
av_hwframe_get_buffer
int av_hwframe_get_buffer(AVBufferRef *hwframe_ref, AVFrame *frame, int flags)
Allocate a new frame attached to the given AVHWFramesContext.
Definition: hwcontext.c:491
AV_FIFO_FLAG_AUTO_GROW
#define AV_FIFO_FLAG_AUTO_GROW
Automatically resize the FIFO on writes, so that the data fits.
Definition: fifo.h:63