WebRTC: Integrating QSV Hardware Decoding

2023-05-16

1. QSV Hardware Decoding Configuration on Windows

Add the decoder entry in libavcodec/codec_list.c:

 &ff_h264_qsv_decoder,
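
For orientation, a minimal sketch of where the entry lands in the generated codec list (the surrounding entries are illustrative and depend on which codecs your build enables):

static const AVCodec * const codec_list[] = {
    /* ... other enabled decoders ... */
    &ff_h264_decoder,
    &ff_h264_qsv_decoder,  /* added: Intel Quick Sync H.264 decoder */
    NULL };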

Add the following to ffmpeg_generate.gni — the first four files are appended to an existing source list, and the qsv* files are added as a new ffmpeg_c_sources block:

     "libavcodec/h264idct.c",
     "libavcodec/h264qpel.c",
     "libavcodec/startcode.c",
     "libavcodec/h264_mp4toannexb_bsf.c",
   ]
 }
 
 ffmpeg_c_sources += [
     "libavcodec/qsvenc_h264.c",
     "libavcodec/qsvenc.c",
     "libavcodec/qsv.c",
    "libavcodec/qsvdec.c",
    "libavcodec/qsvdec_h2645.c",
  ]

In libavcodec/bsf_list.c, register the h264_mp4toannexb bitstream filter (the h264_qsv decoder declares it in its .bsfs field, so it must be compiled in):

static const AVBitStreamFilter * const bitstream_filters[] = {
    &ff_h264_mp4toannexb_bsf,
    &ff_null_bsf,
    NULL };

Modify the win-msvc/x64/config.h configuration:

#define CONFIG_H264_QSV_DECODER 1
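
Depending on the FFmpeg version, related switches may also need to be enabled so the added sources and bitstream filter compile in; treat the following as assumptions to verify against your tree:

#define CONFIG_QSV 1                  /* assumed prerequisite for the qsv* sources */
#define CONFIG_H264_MP4TOANNEXB_BSF 1 /* for the bitstream filter registered above */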

2. QSV Hardware Decoding Implementation

The implementation in h264_decoder_impl_ffmpeg.cc:

#include "modules/video_coding/codecs/h264/h264_decoder_impl_ffmpeg.h"

#include <algorithm>
#include <limits>

extern "C" {
#include "third_party/ffmpeg/libavcodec/avcodec.h"
#include "third_party/ffmpeg/libavformat/avformat.h"
#include "third_party/ffmpeg/libavutil/imgutils.h"
#include "third_party/ffmpeg/libavutil/opt.h"
}  // extern "C"

#include "base/checks.h"
#include "base/criticalsection.h"
#include "base/keep_ref_until_done.h"
#include "base/logging.h"
#include "system_wrappers/include/metrics.h"
#include "libyuv/convert.h"

namespace webrtc {
namespace {
#define PRINT_TIME_DECODE_DELAY 0
const AVPixelFormat kPixelFormat = AV_PIX_FMT_YUV420P;
const size_t kYPlaneIndex = 0;
const size_t kUPlaneIndex = 1;
const size_t kVPlaneIndex = 2;



// Used by histograms. Values of entries should not be changed.
enum H264DecoderImplEvent {
  kH264DecoderEventInit = 0,
  kH264DecoderEventError = 1,
  kH264DecoderEventMax = 16,
};

#if defined(WEBRTC_INITIALIZE_FFMPEG)

rtc::CriticalSection ffmpeg_init_lock;
bool ffmpeg_initialized = false;

// Called by FFmpeg to do mutex operations if initialized using
// |InitializeFFmpeg|.
int LockManagerOperation(void** lock, AVLockOp op)
    EXCLUSIVE_LOCK_FUNCTION() UNLOCK_FUNCTION() {
  switch (op) {
    case AV_LOCK_CREATE:
      *lock = new rtc::CriticalSection();
      return 0;
    case AV_LOCK_OBTAIN:
      static_cast<rtc::CriticalSection*>(*lock)->Enter();
      return 0;
    case AV_LOCK_RELEASE:
      static_cast<rtc::CriticalSection*>(*lock)->Leave();
      return 0;
    case AV_LOCK_DESTROY:
      delete static_cast<rtc::CriticalSection*>(*lock);
      *lock = nullptr;
      return 0;
  }
  RTC_NOTREACHED() << "Unrecognized AVLockOp.";
  return -1;
}

void InitializeFFmpeg() {
  LOG_F(LS_INFO);
  rtc::CritScope cs(&ffmpeg_init_lock);
  if (!ffmpeg_initialized) {
    if (av_lockmgr_register(LockManagerOperation) < 0) {
      RTC_NOTREACHED() << "av_lockmgr_register failed.";
      return;
    }
    av_register_all();
    ffmpeg_initialized = true;
  }
}

#endif  // defined(WEBRTC_INITIALIZE_FFMPEG)

}  // namespace

int H264DecoderImplFfmpeg::AVGetBuffer2(
    AVCodecContext* context, AVFrame* av_frame, int flags) {
  // Set in |InitDecode|.
  H264DecoderImplFfmpeg* decoder = static_cast<H264DecoderImplFfmpeg*>(context->opaque);
  // DCHECK values set in |InitDecode|.
  RTC_DCHECK(decoder);
  RTC_DCHECK_EQ(context->pix_fmt, kPixelFormat);
  // Necessary capability to be allowed to provide our own buffers.
  RTC_DCHECK(context->codec->capabilities & AV_CODEC_CAP_DR1);

  // |av_frame->width| and |av_frame->height| are set by FFmpeg. These are the
  // actual image's dimensions and may be different from |context->width| and
  // |context->coded_width| due to reordering.
  int width = av_frame->width;
  int height = av_frame->height;
  // See |lowres|, if used the decoder scales the image by 1/2^(lowres). This
  // has implications on which resolutions are valid, but we don't use it.
  RTC_CHECK_EQ(context->lowres, 0);
  // Adjust the |width| and |height| to values acceptable by the decoder.
  // Without this, FFmpeg may overflow the buffer. If modified, |width| and/or
  // |height| are larger than the actual image and the image has to be cropped
  // (top-left corner) after decoding to avoid visible borders to the right and
  // bottom of the actual image.
  avcodec_align_dimensions(context, &width, &height);

  RTC_CHECK_GE(width, 0);
  RTC_CHECK_GE(height, 0);
  int ret = av_image_check_size(static_cast<unsigned int>(width),
                                static_cast<unsigned int>(height), 0, nullptr);
  if (ret < 0) {
    LOG(LS_ERROR) << "Invalid picture size " << width << "x" << height;
    decoder->ReportError();
    return ret;
  }

  // The video frame is stored in |video_frame|. |av_frame| is FFmpeg's version
  // of a video frame and will be set up to reference |video_frame|'s buffers.
  VideoFrame* video_frame = new VideoFrame();
  // FFmpeg expects the initial allocation to be zero-initialized according to
  // http://crbug.com/390941. Our pool is set up to zero-initialize new buffers.
  video_frame->set_video_frame_buffer(
      decoder->pool_.CreateBuffer(width, height));
  // DCHECK that we have a continuous buffer as is required.
  RTC_DCHECK_EQ(video_frame->buffer(kUPlane),
      video_frame->buffer(kYPlane) + video_frame->allocated_size(kYPlane));
  RTC_DCHECK_EQ(video_frame->buffer(kVPlane),
      video_frame->buffer(kUPlane) + video_frame->allocated_size(kUPlane));
  int total_size = video_frame->allocated_size(kYPlane) +
                   video_frame->allocated_size(kUPlane) +
                   video_frame->allocated_size(kVPlane);

  av_frame->format = context->pix_fmt;
  av_frame->reordered_opaque = context->reordered_opaque;

  // Set |av_frame| members as required by FFmpeg.
  av_frame->data[kYPlaneIndex] = video_frame->buffer(kYPlane);
  av_frame->linesize[kYPlaneIndex] = video_frame->stride(kYPlane);
  av_frame->data[kUPlaneIndex] = video_frame->buffer(kUPlane);
  av_frame->linesize[kUPlaneIndex] = video_frame->stride(kUPlane);
  av_frame->data[kVPlaneIndex] = video_frame->buffer(kVPlane);
  av_frame->linesize[kVPlaneIndex] = video_frame->stride(kVPlane);
  RTC_DCHECK_EQ(av_frame->extended_data, av_frame->data);

  av_frame->buf[0] = av_buffer_create(av_frame->data[kYPlaneIndex],
                                      total_size,
                                      AVFreeBuffer2,
                                      static_cast<void*>(video_frame),
                                      0);
  RTC_CHECK(av_frame->buf[0]);
  return 0;
}

void H264DecoderImplFfmpeg::AVFreeBuffer2(void* opaque, uint8_t* data) {
  // The buffer pool recycles the buffer used by |video_frame| when there are no
  // more references to it. |video_frame| is a thin buffer holder and is not
  // recycled.
  VideoFrame* video_frame = static_cast<VideoFrame*>(opaque);
  delete video_frame;
}

H264DecoderImplFfmpeg::H264DecoderImplFfmpeg(bool is_hw) : pool_(true),
                                     decoded_image_callback_(nullptr),
                                     has_reported_init_(false),
                                     has_reported_error_(false),
                                     clock_(Clock::GetRealTimeClock()),
                                     isFirstFrame(true),
                                     is_hw_(is_hw) {
    start_time_ = clock_->TimeInMilliseconds();
}

H264DecoderImplFfmpeg::~H264DecoderImplFfmpeg() {
  Release();
  int64_t deltaTimeSec = (clock_->TimeInMilliseconds() - start_time_)/1000;
  LOG(LS_INFO) << "discard_cnt_:" << discard_cnt_
                << ", decode_cnt_:" << decode_cnt_
                << ", idr_cnt_:" << idr_cnt_
                << ", decoded_cnt_:" << decoded_cnt_
                << ", deltaTimeSec:" << deltaTimeSec
                << ", average framte rate:" << (deltaTimeSec ? (decoded_cnt_/deltaTimeSec) : decoded_cnt_);

}

void H264DecoderImplFfmpeg::PrintDecoderSettings(const VideoCodec* codec_settings, const AVCodecContext* codec_ctx) {
  LOG(LS_INFO) << " ";
  LOG(LS_INFO) << "#############################################################";
  LOG(LS_INFO) << "#               Decoder Parameter Setting:                  #";
  LOG(LS_INFO) << "#############################################################";
  LOG(LS_INFO) << "codec name                               :" << codec_ctx->codec->name;
  LOG(LS_INFO) << "codec type                               :" << codec_ctx->codec_type;
  LOG(LS_INFO) << "codec id                                 :" << codec_ctx->codec_id;
  LOG(LS_INFO) << "codec_settings.width                     :" << codec_settings->width;
  LOG(LS_INFO) << "codec_settings.height                    :" << codec_settings->height;
  LOG(LS_INFO) << "codec_settings.startBitrate              :" << codec_settings->startBitrate;
  LOG(LS_INFO) << "codec_settings.maxBitrate                :" << codec_settings->maxBitrate;
  LOG(LS_INFO) << "codec_settings.minBitrate                :" << codec_settings->minBitrate;
  LOG(LS_INFO) << "codec_settings.targetBitrate             :" << codec_settings->targetBitrate;
  LOG(LS_INFO) << "codec_settings.maxFramerate              :" << static_cast<int32_t>(codec_settings->maxFramerate);
  LOG(LS_INFO) << "------------------------------------------------------------ ";
  LOG(LS_INFO) << "codec_ctx.width                          :" << codec_ctx->width;
  LOG(LS_INFO) << "codec_ctx.height                         :" << codec_ctx->height;
  LOG(LS_INFO) << "codec_ctx.pix_fmt                        :" << codec_ctx->pix_fmt;
  LOG(LS_INFO) << "codec_ctx.flags                          :" << static_cast<uint32_t>(codec_ctx->flags);
  LOG(LS_INFO) << "codec_ctx.bit_rate                       :" << codec_ctx->bit_rate;
  LOG(LS_INFO) << "#############################################################";
}

int32_t H264DecoderImplFfmpeg::InitHwDecode(const VideoCodec* codec_settings) {
  AVCodec* codec = avcodec_find_decoder_by_name("h264_qsv");
  if (!codec) {
    // This is an indication that FFmpeg has not been initialized or it has not
    // been compiled/initialized with the correct set of codecs.
    LOG(LS_ERROR) << "FFmpeg H.264 HW decoder not found.";
    Release();
    ReportError();
    return WEBRTC_VIDEO_CODEC_ERROR;
  }
  LOG(LS_INFO) << "Found decoder codec name " << codec->name;
  av_context_.reset(avcodec_alloc_context3(codec));
  if (codec_settings) {
    av_context_->coded_width = codec_settings->width;
    av_context_->coded_height = codec_settings->height;
  }
  av_context_->pix_fmt = AV_PIX_FMT_NV12;
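  // "async_depth" is a QSV-private decoder option; a depth of 1 minimizes
  // internal buffering (lower latency) at some throughput cost.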
  av_opt_set(av_context_->priv_data, "async_depth", "1", 0);
  int res = avcodec_open2(av_context_.get(), codec, nullptr);
  if (res < 0) {
    LOG(LS_ERROR) << "avcodec_open2 error: " << res;
    Release();
    ReportError();
    return WEBRTC_VIDEO_CODEC_ERROR;
  }
  
  PrintDecoderSettings(codec_settings, av_context_.get());

  av_frame_.reset(av_frame_alloc());

  return WEBRTC_VIDEO_CODEC_OK;
}

int32_t H264DecoderImplFfmpeg::InitDecode(const VideoCodec* codec_settings,
                                    int32_t number_of_cores) {
  LOG_F(LS_INFO);
  ReportInit();
  isFirstFrame = true;
  if (codec_settings &&
      codec_settings->codecType != kVideoCodecH264) {
    ReportError();
    return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
  }

  // FFmpeg must have been initialized (with |av_lockmgr_register| and
  // |av_register_all|) before we proceed. |InitializeFFmpeg| does this, which
  // makes sense for WebRTC standalone. In other cases, such as Chromium, FFmpeg
  // is initialized externally and calling |InitializeFFmpeg| would be
  // thread-unsafe and result in FFmpeg being initialized twice, which could
  // break other FFmpeg usage. See the |rtc_initialize_ffmpeg| flag.
#if defined(WEBRTC_INITIALIZE_FFMPEG)
  // Make sure FFmpeg has been initialized. Subsequent |InitializeFFmpeg| calls
  // do nothing.
  InitializeFFmpeg();
#endif

  // Release necessary in case of re-initializing.
  int32_t ret = Release();
  if (ret != WEBRTC_VIDEO_CODEC_OK) {
    ReportError();
    return ret;
  }
  RTC_DCHECK(!av_context_);

  if (is_hw_) {
    return InitHwDecode(codec_settings);
  }
  // Initialize AVCodecContext.
  av_context_.reset(avcodec_alloc_context3(nullptr));

  av_context_->codec_type = AVMEDIA_TYPE_VIDEO;
  av_context_->codec_id = AV_CODEC_ID_H264;

  if (codec_settings) {
    av_context_->coded_width = codec_settings->width;
    av_context_->coded_height = codec_settings->height;
  }
  av_context_->pix_fmt = kPixelFormat;
  av_context_->extradata = nullptr;
  av_context_->extradata_size = 0;

  // If this is ever increased, look at |av_context_->thread_safe_callbacks| and
  // make it possible to disable the thread checker in the frame buffer pool.
  av_context_->thread_count = av_cpu_count() + 1;
  av_context_->thread_type = FF_THREAD_SLICE;

  // Function used by FFmpeg to get buffers to store decoded frames in.
  av_context_->get_buffer2 = AVGetBuffer2;
  // |get_buffer2| is called with the context, there |opaque| can be used to get
  // a pointer |this|.
  av_context_->opaque = this;
  // Use ref counted frames (av_frame_unref).
  av_context_->refcounted_frames = 1;  // true

  AVCodec* codec = avcodec_find_decoder(av_context_->codec_id);

  if (!codec) {
    // This is an indication that FFmpeg has not been initialized or it has not
    // been compiled/initialized with the correct set of codecs.
    LOG(LS_ERROR) << "FFmpeg H.264 decoder not found.";
    Release();
    ReportError();
    return WEBRTC_VIDEO_CODEC_ERROR;
  }

  int res = avcodec_open2(av_context_.get(), codec, nullptr);
  if (res < 0) {
    LOG(LS_ERROR) << "avcodec_open2 error: " << res;
    Release();
    ReportError();
    return WEBRTC_VIDEO_CODEC_ERROR;
  }

  PrintDecoderSettings(codec_settings, av_context_.get());
  av_frame_.reset(av_frame_alloc());
  return WEBRTC_VIDEO_CODEC_OK;
}

int32_t H264DecoderImplFfmpeg::Release() {
  avcodec_close(av_context_.get());
  av_context_.reset();
  av_frame_.reset();
  return WEBRTC_VIDEO_CODEC_OK;
}

int32_t H264DecoderImplFfmpeg::RegisterDecodeCompleteCallback(
    DecodedImageCallback* callback) {
  decoded_image_callback_ = callback;
  return WEBRTC_VIDEO_CODEC_OK;
}

int32_t H264DecoderImplFfmpeg::Decode(const EncodedImage& input_image,
                                bool /*missing_frames*/,
                                const RTPFragmentationHeader* /*fragmentation*/,
                                const CodecSpecificInfo* codec_specific_info,
                                int64_t /*render_time_ms*/) {
  if (!IsInitialized()) {
    ReportError();
    return WEBRTC_VIDEO_CODEC_UNINITIALIZED;
  }
  if (!decoded_image_callback_) {
    LOG(LS_WARNING) << "InitDecode() has been called, but a callback function "
        "has not been set with RegisterDecodeCompleteCallback()";
    ReportError();
    return WEBRTC_VIDEO_CODEC_UNINITIALIZED;
  }
  if (!input_image._buffer || !input_image._length) {
    ReportError();
    return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
  }
  if (codec_specific_info &&
      codec_specific_info->codecType != kVideoCodecH264) {
    ReportError();
    return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
  }
  if ((input_image._frameType != kVideoFrameKey) && isFirstFrame) {
    LOG_F(LS_WARNING) << "First frame must be an IDR frame.";
    ++discard_cnt_;
    return WEBRTC_VIDEO_CODEC_ERROR;
  }
  if (input_image._frameType == kVideoFrameKey) {
    ++idr_cnt_;
  }
  isFirstFrame = false;

  
#if PRINT_TIME_DECODE_DELAY
  int64_t h264_decode_start_time = clock_->TimeInMilliseconds();
#endif

  // FFmpeg requires padding due to some optimized bitstream readers reading 32
  // or 64 bits at once and could read over the end. See avcodec_decode_video2.
  RTC_CHECK_GE(input_image._size, input_image._length +
                   EncodedImage::GetBufferPaddingBytes(kVideoCodecH264));

  // "If the first 23 bits of the additional bytes are not 0, then damaged MPEG
  // bitstreams could cause overread and segfault." See
  // AV_INPUT_BUFFER_PADDING_SIZE. We'll zero the entire padding just in case.
  memset(input_image._buffer + input_image._length,
         0,
         EncodedImage::GetBufferPaddingBytes(kVideoCodecH264));

  AVPacket packet;
  av_init_packet(&packet);
  packet.data = input_image._buffer;
  if (input_image._length >
      static_cast<size_t>(std::numeric_limits<int>::max())) {
    ReportError();
    return WEBRTC_VIDEO_CODEC_ERROR;
  }
  packet.size = static_cast<int>(input_image._length);
  av_context_->reordered_opaque = input_image.ntp_time_ms_ * 1000;  // ms -> us
  
  decode_cnt_++;
  int frame_decoded = 0;
  RTC_CHECK(av_frame_.get());
  int result = avcodec_decode_video2(av_context_.get(),
                                     av_frame_.get(),
                                     &frame_decoded,
                                     &packet);
  if (result < 0) {
    LOG(LS_ERROR) << "avcodec_decode_video2 error: " << result;
    ReportError();
    return WEBRTC_VIDEO_CODEC_ERROR;
  }
  // |result| is number of bytes used, which should be all of them.
  if (result != packet.size) {
    LOG(LS_ERROR) << "avcodec_decode_video2 consumed " << result << " bytes "
        "when " << packet.size << " bytes were expected.";
    ReportError();
    return WEBRTC_VIDEO_CODEC_ERROR;
  }

  if (!frame_decoded) {
    LOG(LS_WARNING) << "avcodec_decode_video2 successful but no frame was "
        "decoded.";
    return WEBRTC_VIDEO_CODEC_OK;
  }
  decoded_cnt_++;
#if PRINT_TIME_DECODE_DELAY
  int64_t h264_decode_end_time = clock_->TimeInMilliseconds();
  int64_t h264_decode_use_time = h264_decode_end_time - h264_decode_start_time;
  LOG(LS_INFO) << "Decode: hardware enable: " << is_hw_ << " use_time_ms:" << h264_decode_use_time;
#endif

  if (is_hw_) {
    if (!temp_frame_) {
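        // |temp_frame_| is allocated once, on the first decoded frame; it is
        // not re-allocated if the stream resolution changes later.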
        temp_frame_.reset(av_frame_alloc());
        if (!temp_frame_) {
            LOG(LS_ERROR) << "Could not allocate video frame";
            return WEBRTC_VIDEO_CODEC_ERROR;
        }
        temp_frame_->format = AV_PIX_FMT_YUV420P;  // I420 output of the NV12 conversion below.
        temp_frame_->width = av_frame_->width;
        temp_frame_->height = av_frame_->height;
        int ret = av_frame_get_buffer(temp_frame_.get(), 32);
        if (ret < 0) {
            LOG(LS_ERROR) << "Could not allocate the video frame data";
            return WEBRTC_VIDEO_CODEC_ERROR;
        }
    }
    // Convert NV12 (Y plane + interleaved UV plane) to I420. For the NV12
    // source, data[0]/linesize[0] is Y and data[1]/linesize[1] is UV; the
    // destination strides must come from |temp_frame_|, not |av_frame_|.
    int ret = libyuv::NV12ToI420(
        av_frame_->data[0], av_frame_->linesize[0],
        av_frame_->data[1], av_frame_->linesize[1],
        temp_frame_->data[kYPlaneIndex], temp_frame_->linesize[kYPlaneIndex],
        temp_frame_->data[kUPlaneIndex], temp_frame_->linesize[kUPlaneIndex],
        temp_frame_->data[kVPlaneIndex], temp_frame_->linesize[kVPlaneIndex],
        av_frame_->width, av_frame_->height);

    LOG(LS_VERBOSE) << "Decoded Video Frame. input_image._length[" << input_image._length
                  << "], input_image._size[" << input_image._size
                  << "], decode number[" << decoded_cnt_
                  << "], timestamp[" << input_image._timeStamp
                  << "], temp_frame width[" << temp_frame_->width
                  << "], temp_frame height[" << temp_frame_->height
                  << "], temp_frame strideY[" << temp_frame_->linesize[0]
                  << "], temp_frame strideU[" << temp_frame_->linesize[1]
                  << "], AVFrame width[" << av_frame_->width
                  << "], AVFrame height[" << av_frame_->height
                  << "], AVFrame lines[0][" << av_frame_->linesize[0]
                  << "], AVFrame lines[1][" << av_frame_->linesize[1] << "].";

    decoded_frame_.CreateEmptyFrame(av_frame_->width, av_frame_->height,
                                    av_frame_->width, av_frame_->width / 2,
                                    av_frame_->width / 2);
    uint8_t* dst_y = decoded_frame_.buffer(kYPlane);
    const uint8_t* src_y = temp_frame_->data[kYPlaneIndex];
    uint8_t* dst_u = decoded_frame_.buffer(kUPlane);
    const uint8_t* src_u = temp_frame_->data[kUPlaneIndex];
    uint8_t* dst_v = decoded_frame_.buffer(kVPlane);
    const uint8_t* src_v = temp_frame_->data[kVPlaneIndex];

    // |temp_frame_|'s rows may be padded (it was allocated with 32-byte
    // alignment), so copy row by row rather than assuming tightly packed
    // planes.
    for (int i = 0; i < av_frame_->height; ++i) {
      memcpy(dst_y + i * av_frame_->width,
             src_y + i * temp_frame_->linesize[kYPlaneIndex], av_frame_->width);
    }
    for (int i = 0; i < av_frame_->height / 2; ++i) {
      memcpy(dst_u + i * (av_frame_->width / 2),
             src_u + i * temp_frame_->linesize[kUPlaneIndex],
             av_frame_->width / 2);
      memcpy(dst_v + i * (av_frame_->width / 2),
             src_v + i * temp_frame_->linesize[kVPlaneIndex],
             av_frame_->width / 2);
    }

    decoded_frame_.set_timestamp(input_image._timeStamp);
    decoded_frame_.SetIncomingTimeMs(input_image._incomingTimeMs);    
    decoded_frame_.SetFrameCnt(decode_cnt_);
    ret = decoded_image_callback_->Decoded(decoded_frame_);

    // Stop referencing it, possibly freeing |video_frame|.
    av_frame_unref(av_frame_.get());
    if (ret) {
      LOG(LS_WARNING) << "DecodedImageCallback::Decoded returned " << ret;
      return ret;
    }
    return WEBRTC_VIDEO_CODEC_OK;
  } // end of is_hw_

  // Obtain the |video_frame| containing the decoded image.
  VideoFrame* video_frame = static_cast<VideoFrame*>(
      av_buffer_get_opaque(av_frame_->buf[0]));
  RTC_DCHECK(video_frame);
  RTC_CHECK_EQ(av_frame_->data[kYPlane], video_frame->buffer(kYPlane));
  RTC_CHECK_EQ(av_frame_->data[kUPlane], video_frame->buffer(kUPlane));
  RTC_CHECK_EQ(av_frame_->data[kVPlane], video_frame->buffer(kVPlane));
  video_frame->set_timestamp(input_image._timeStamp);
  video_frame->SetIncomingTimeMs(input_image._incomingTimeMs);
  LOG(LS_VERBOSE) << "Decoded Video Frame. input_image._length[" << input_image._length
                  << "], input_image._size[" << input_image._size
                  << "], decode number[" << decode_cnt_
                  << "], timestamp[" << input_image._timeStamp
                  << "], pointer[" << (void*)(video_frame->video_frame_buffer()->DataY())
                  << "],video frame width[" << video_frame->width()
                  << "],video frame height[" << video_frame->height()
                  << "],video frame strideY[" << video_frame->stride(kYPlane)
                  << "],video frame strideU[" << video_frame->stride(kUPlane)
                  << "],AVFrame width[" << av_frame_->width
                  << "],AVFrame height[" << av_frame_->height
                  << "],AVFrame lines[0][" << av_frame_->linesize[0]
                  << "],AVFrame lines[1][" << av_frame_->linesize[1] << "].";

  int32_t ret = 0;
  // The decoded image may be larger than what is supposed to be visible, see
  // |AVGetBuffer2|'s use of |avcodec_align_dimensions|. This crops the image
  // without copying the underlying buffer.
  rtc::scoped_refptr<VideoFrameBuffer> buf = video_frame->video_frame_buffer();
  if((av_frame_->width != buf->width()) || (av_frame_->height != buf->height())) {
    decoded_frame_.CreateEmptyFrame(av_frame_->width, av_frame_->height, av_frame_->width, av_frame_->width/2, av_frame_->width/2);

    uint8_t *dst_y = decoded_frame_.buffer(kYPlane);
    uint8_t *src_y = const_cast<uint8_t*>(video_frame->video_frame_buffer()->DataY());

    uint8_t *dst_u = decoded_frame_.buffer(kUPlane);
    uint8_t *src_u = const_cast<uint8_t*>(video_frame->video_frame_buffer()->DataU());

    uint8_t *dst_v = decoded_frame_.buffer(kVPlane);
    uint8_t *src_v = const_cast<uint8_t*>(video_frame->video_frame_buffer()->DataV());

    if(av_frame_->width == buf->width()) {
      memcpy(dst_y, src_y, av_frame_->width * av_frame_->height);

      memcpy(dst_u, src_u, av_frame_->width * av_frame_->height/4);

      memcpy(dst_v, src_v, av_frame_->width * av_frame_->height/4);
    } else {
      for(int i = 0; i < av_frame_->height; i++){
        memcpy(dst_y, src_y, av_frame_->width);
        dst_y += av_frame_->width;
        src_y += buf->width();
      }

      for(int i = 0; i < av_frame_->height/2; i++){
        memcpy(dst_u, src_u, av_frame_->width/2);
        dst_u += av_frame_->width/2;
        src_u += buf->width()/2;
      }

      for(int i = 0; i < av_frame_->height/2; i++){
        memcpy(dst_v, src_v, av_frame_->width/2);
        dst_v += av_frame_->width/2;
        src_v += buf->width()/2;
      }
    }

    decoded_frame_.set_timestamp(input_image._timeStamp);
    decoded_frame_.SetIncomingTimeMs(input_image._incomingTimeMs);    
    decoded_frame_.SetFrameCnt(decode_cnt_);
    ret = decoded_image_callback_->Decoded(decoded_frame_);
  } else {
    // Because |AVGetBuffer2| aligns dimensions, the decoded buffer is
    // normally larger than the visible frame; this branch has not been
    // observed in practice, so log if it is ever hit.
    LOG(LS_ERROR) << "Unexpected path: decoded frame needed no cropping.";

    video_frame->SetFrameCnt(decode_cnt_);
    ret = decoded_image_callback_->Decoded(*video_frame);
  }

  // Stop referencing it, possibly freeing |video_frame|.
  av_frame_unref(av_frame_.get());
  video_frame = nullptr;

  if (ret) {
    LOG(LS_WARNING) << "DecodedImageCallback::Decoded returned " << ret;
    return ret;
  }
  return WEBRTC_VIDEO_CODEC_OK;
}

bool H264DecoderImplFfmpeg::IsInitialized() const {
  return av_context_ != nullptr;
}

void H264DecoderImplFfmpeg::ReportInit() {
  if (has_reported_init_)
    return;
  RTC_HISTOGRAM_ENUMERATION("WebRTC.Video.H264DecoderImpl.Event",
                            kH264DecoderEventInit,
                            kH264DecoderEventMax);
  has_reported_init_ = true;
}

void H264DecoderImplFfmpeg::ReportError() {
  if (has_reported_error_)
    return;
  RTC_HISTOGRAM_ENUMERATION("WebRTC.Video.H264DecoderImpl.Event",
                            kH264DecoderEventError,
                            kH264DecoderEventMax);
  has_reported_error_ = true;
}

}  // namespace webrtc
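
For reference, a hedged usage sketch of the class above; the real wiring lives in the H264 decoder factory and may differ, and CreateQsvDecoder plus the settings values are illustrative:

#include <cstring>
#include <memory>

#include "modules/video_coding/codecs/h264/h264_decoder_impl_ffmpeg.h"

// Construct the decoder with the hardware path enabled and initialize it.
std::unique_ptr<webrtc::H264DecoderImplFfmpeg> CreateQsvDecoder() {
  std::unique_ptr<webrtc::H264DecoderImplFfmpeg> decoder(
      new webrtc::H264DecoderImplFfmpeg(/*is_hw=*/true));
  webrtc::VideoCodec settings;
  std::memset(&settings, 0, sizeof(settings));
  settings.codecType = webrtc::kVideoCodecH264;
  settings.width = 1280;   // illustrative
  settings.height = 720;   // illustrative
  if (decoder->InitDecode(&settings, /*number_of_cores=*/1) !=
      WEBRTC_VIDEO_CODEC_OK) {
    return nullptr;
  }
  return decoder;
}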


3. Problem Analysis and Summary

With QSV hardware decoding, the decoder buffers two frames internally. At 15 fps a frame lasts roughly 67 ms, so two buffered frames add around 130 ms of latency. That is acceptable for a player, but in RTC it noticeably increases end-to-end delay. There may be tuning parameters that reduce this buffering, but I have not found them yet.
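
One way to hunt for such parameters is to enumerate the decoder's private options at runtime. Below is a minimal sketch using only standard libavutil option APIs; DumpQsvDecoderOptions is a hypothetical helper name, and which options it prints (beyond the async_depth the implementation above already pins to 1) depends on the FFmpeg build:

extern "C" {
#include "third_party/ffmpeg/libavcodec/avcodec.h"
#include "third_party/ffmpeg/libavutil/opt.h"
}
#include <cstdio>

void DumpQsvDecoderOptions() {
  // On FFmpeg builds older than 4.0, avcodec_register_all() must have run first.
  AVCodec* codec = avcodec_find_decoder_by_name("h264_qsv");
  if (!codec) return;
  AVCodecContext* ctx = avcodec_alloc_context3(codec);
  const AVOption* opt = nullptr;
  // Walk the decoder's private option table; latency-related knobs such as
  // async_depth show up here when the build supports them.
  while ((opt = av_opt_next(ctx->priv_data, opt)) != nullptr)
    std::printf("%s: %s\n", opt->name, opt->help ? opt->help : "");
  avcodec_free_context(&ctx);
}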
