#include "h265_encoder_impl.h"
#include <algorithm>
#include <limits>
#include <string>
#include "i420_buffer_cuda.h"
#include "absl/strings/match.h"
#include "absl/types/optional.h"
#include "api/video/video_codec_constants.h"
#include "api/video_codecs/scalability_mode.h"
#include "common_video/libyuv/include/webrtc_libyuv.h"
#include "modules/video_coding/include/video_codec_interface.h"
#include "modules/video_coding/include/video_error_codes.h"
#include "modules/video_coding/svc/create_scalability_structure.h"
#include "modules/video_coding/utility/simulcast_rate_allocator.h"
#include "modules/video_coding/utility/simulcast_utility.h"
#include "rtc_base/checks.h"
#include "rtc_base/logging.h"
#include "rtc_base/time_utils.h"
#include "system_wrappers/include/metrics.h"
#include "third_party/libyuv/include/libyuv/convert.h"
#include "third_party/libyuv/include/libyuv/scale.h"
namespace webrtc {
enum H265EncoderImplEvent {
kH265EncoderEventInit = 0,
kH265EncoderEventError = 1,
kH265EncoderEventMax = 16,
};
NvidiaH265EncoderImpl::NvidiaH265EncoderImpl(
const webrtc::Environment& env,
CUcontext context,
CUmemorytype memory_type,
NV_ENC_BUFFER_FORMAT nv_format,
const SdpVideoFormat& format)
: env_(env),
encoder_(nullptr),
cu_context_(context),
cu_memory_type_(memory_type),
cu_scaled_array_(nullptr),
nv_format_(nv_format),
format_(format) {
RTC_CHECK_NE(cu_memory_type_, CU_MEMORYTYPE_HOST);
}
NvidiaH265EncoderImpl::~NvidiaH265EncoderImpl() {
Release();
}
void NvidiaH265EncoderImpl::ReportInit() {
if (has_reported_init_)
return;
RTC_HISTOGRAM_ENUMERATION("WebRTC.Video.H265EncoderImpl.Event",
kH265EncoderEventInit, kH265EncoderEventMax);
has_reported_init_ = true;
}
void NvidiaH265EncoderImpl::ReportError() {
if (has_reported_error_)
return;
RTC_HISTOGRAM_ENUMERATION("WebRTC.Video.H265EncoderImpl.Event",
kH265EncoderEventError, kH265EncoderEventMax);
has_reported_error_ = true;
}
int32_t NvidiaH265EncoderImpl::InitEncode(
const VideoCodec* inst,
const VideoEncoder::Settings& settings) {
if (!inst || inst->codecType != kVideoCodecH265) {
ReportError();
return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
}
if (inst->maxFramerate == 0) {
ReportError();
return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
}
if (inst->width < 1 || inst->height < 1) {
ReportError();
return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
}
int32_t release_ret = Release();
if (release_ret != WEBRTC_VIDEO_CODEC_OK) {
ReportError();
return release_ret;
}
codec_ = *inst;
if (codec_.numberOfSimulcastStreams == 0) {
codec_.simulcastStream[0].width = codec_.width;
codec_.simulcastStream[0].height = codec_.height;
}
const size_t new_capacity =
CalcBufferSize(VideoType::kI420, codec_.width, codec_.height);
encoded_image_.SetEncodedData(EncodedImageBuffer::Create(new_capacity));
encoded_image_._encodedWidth = codec_.width;
encoded_image_._encodedHeight = codec_.height;
encoded_image_.set_size(0);
configuration_.sending = false;
configuration_.frame_dropping_on = codec_.GetFrameDropEnabled();
configuration_.key_frame_interval = 0;
configuration_.width = codec_.width;
configuration_.height = codec_.height;
configuration_.max_frame_rate = codec_.maxFramerate;
configuration_.target_bps = codec_.startBitrate * 1000;
configuration_.max_bps = codec_.maxBitrate * 1000;
const CUresult result = cuCtxSetCurrent(cu_context_);
if (result != CUDA_SUCCESS) {
return WEBRTC_VIDEO_CODEC_ENCODER_FAILURE;
}
try {
if (cu_memory_type_ == CU_MEMORYTYPE_DEVICE) {
encoder_ = std::make_unique<NvEncoderCuda>(cu_context_, codec_.width,
codec_.height, nv_format_, 0);
} else {
RTC_DCHECK_NOTREACHED();
}
} catch (const NVENCException& e) {
RTC_LOG(LS_ERROR) << "Failed Initialize NvEncoder " << e.what();
return WEBRTC_VIDEO_CODEC_ERROR;
}
nv_initialize_params_.version = NV_ENC_INITIALIZE_PARAMS_VER;
nv_encode_config_.version = NV_ENC_CONFIG_VER;
nv_initialize_params_.encodeConfig = &nv_encode_config_;
GUID encodeGuid = NV_ENC_CODEC_HEVC_GUID;
GUID presetGuid = NV_ENC_PRESET_P4_GUID;
encoder_->CreateDefaultEncoderParams(&nv_initialize_params_, encodeGuid,
presetGuid,
NV_ENC_TUNING_INFO_ULTRA_LOW_LATENCY);
nv_initialize_params_.frameRateNum =
static_cast<uint32_t>(configuration_.max_frame_rate);
nv_initialize_params_.frameRateDen = 1;
nv_initialize_params_.bufferFormat = nv_format_;
nv_encode_config_.profileGUID = NV_ENC_HEVC_PROFILE_MAIN_GUID;
nv_encode_config_.gopLength = NVENC_INFINITE_GOPLENGTH;
nv_encode_config_.frameIntervalP = 1;
nv_encode_config_.rcParams.version = NV_ENC_RC_PARAMS_VER;
nv_encode_config_.rcParams.rateControlMode = NV_ENC_PARAMS_RC_CBR;
nv_encode_config_.rcParams.averageBitRate = configuration_.target_bps;
nv_encode_config_.rcParams.vbvBufferSize =
(nv_encode_config_.rcParams.averageBitRate *
nv_initialize_params_.frameRateDen /
nv_initialize_params_.frameRateNum) *
5;
nv_encode_config_.rcParams.vbvInitialDelay =
nv_encode_config_.rcParams.vbvBufferSize;
try {
encoder_->CreateEncoder(&nv_initialize_params_);
} catch (const NVENCException& e) {
RTC_LOG(LS_ERROR) << "Failed Initialize NvEncoder " << e.what();
return WEBRTC_VIDEO_CODEC_ERROR;
}
RTC_LOG(LS_INFO) << "NVIDIA H265/HEVC NVENC initialized: "
<< codec_.width << "x" << codec_.height
<< " @ " << codec_.maxFramerate << "fps, target_bps="
<< configuration_.target_bps;
SimulcastRateAllocator init_allocator(env_, codec_);
VideoBitrateAllocation allocation =
init_allocator.Allocate(VideoBitrateAllocationParameters(
DataRate::KilobitsPerSec(codec_.startBitrate), codec_.maxFramerate));
SetRates(RateControlParameters(allocation, codec_.maxFramerate));
return WEBRTC_VIDEO_CODEC_OK;
}
int32_t NvidiaH265EncoderImpl::RegisterEncodeCompleteCallback(
EncodedImageCallback* callback) {
encoded_image_callback_ = callback;
return WEBRTC_VIDEO_CODEC_OK;
}
int32_t NvidiaH265EncoderImpl::Release() {
if (encoder_) {
encoder_->DestroyEncoder();
encoder_ = nullptr;
}
if (cu_scaled_array_) {
cuArrayDestroy(cu_scaled_array_);
cu_scaled_array_ = nullptr;
}
return WEBRTC_VIDEO_CODEC_OK;
}
int32_t NvidiaH265EncoderImpl::Encode(
const VideoFrame& input_frame,
const std::vector<VideoFrameType>* frame_types) {
if (!encoder_) {
ReportError();
return WEBRTC_VIDEO_CODEC_UNINITIALIZED;
}
if (!encoded_image_callback_) {
RTC_LOG(LS_WARNING)
<< "InitEncode() has been called, but a callback function "
"has not been set with RegisterEncodeCompleteCallback()";
ReportError();
return WEBRTC_VIDEO_CODEC_UNINITIALIZED;
}
webrtc::scoped_refptr<I420BufferInterface> frame_buffer =
input_frame.video_frame_buffer()->ToI420();
if (!frame_buffer) {
RTC_LOG(LS_ERROR) << "Failed to convert "
<< VideoFrameBufferTypeToString(
input_frame.video_frame_buffer()->type())
<< " image to I420. Can't encode frame.";
return WEBRTC_VIDEO_CODEC_ENCODER_FAILURE;
}
RTC_CHECK(frame_buffer->type() == VideoFrameBuffer::Type::kI420);
bool is_keyframe_needed = false;
if (configuration_.key_frame_request && configuration_.sending) {
is_keyframe_needed = true;
}
bool send_key_frame =
is_keyframe_needed ||
(frame_types && (*frame_types)[0] == VideoFrameType::kVideoFrameKey);
if (send_key_frame) {
is_keyframe_needed = true;
configuration_.key_frame_request = false;
}
RTC_DCHECK_EQ(configuration_.width, frame_buffer->width());
RTC_DCHECK_EQ(configuration_.height, frame_buffer->height());
if (!configuration_.sending) {
return WEBRTC_VIDEO_CODEC_NO_OUTPUT;
}
if (frame_types != nullptr) {
if ((*frame_types)[0] == VideoFrameType::kEmptyFrame) {
return WEBRTC_VIDEO_CODEC_NO_OUTPUT;
}
}
try {
const NvEncInputFrame* nv_enc_input_frame = encoder_->GetNextInputFrame();
if (cu_memory_type_ == CU_MEMORYTYPE_DEVICE) {
CopyI420BufferToDeviceFrame(cu_context_, *frame_buffer,
*nv_enc_input_frame);
}
NV_ENC_PIC_PARAMS pic_params = NV_ENC_PIC_PARAMS();
pic_params.version = NV_ENC_PIC_PARAMS_VER;
pic_params.encodePicFlags = 0;
if (is_keyframe_needed) {
pic_params.encodePicFlags = NV_ENC_PIC_FLAG_FORCEINTRA |
NV_ENC_PIC_FLAG_FORCEIDR |
NV_ENC_PIC_FLAG_OUTPUT_SPSPPS;
configuration_.key_frame_request = false;
}
current_encoding_is_keyframe_ = is_keyframe_needed;
std::vector<std::vector<uint8_t>> bit_stream;
encoder_->EncodeFrame(bit_stream, &pic_params);
for (std::vector<uint8_t>& packet : bit_stream) {
int32_t result = ProcessEncodedFrame(packet, input_frame);
if (result != WEBRTC_VIDEO_CODEC_OK) {
return result;
}
}
current_encoding_is_keyframe_ = false;
} catch (const NVENCException& e) {
RTC_LOG(LS_ERROR) << "Failed EncodeFrame NvEncoder " << e.what();
return WEBRTC_VIDEO_CODEC_ENCODER_FAILURE;
}
return WEBRTC_VIDEO_CODEC_OK;
}
int32_t NvidiaH265EncoderImpl::ProcessEncodedFrame(
std::vector<uint8_t>& packet,
const ::webrtc::VideoFrame& inputFrame) {
encoded_image_._encodedWidth = encoder_->GetEncodeWidth();
encoded_image_._encodedHeight = encoder_->GetEncodeHeight();
encoded_image_.SetRtpTimestamp(inputFrame.rtp_timestamp());
encoded_image_.SetSimulcastIndex(0);
encoded_image_.ntp_time_ms_ = inputFrame.ntp_time_ms();
encoded_image_.capture_time_ms_ = inputFrame.render_time_ms();
encoded_image_.rotation_ = inputFrame.rotation();
encoded_image_.content_type_ = VideoContentType::UNSPECIFIED;
encoded_image_.timing_.flags = VideoSendTiming::kInvalid;
encoded_image_._frameType =
current_encoding_is_keyframe_ ? VideoFrameType::kVideoFrameKey
: VideoFrameType::kVideoFrameDelta;
encoded_image_.SetColorSpace(inputFrame.color_space());
encoded_image_.SetEncodedData(
EncodedImageBuffer::Create(packet.data(), packet.size()));
encoded_image_.set_size(packet.size());
encoded_image_.qp_ = -1;
CodecSpecificInfo codecInfo;
codecInfo.codecType = kVideoCodecH265;
const auto result =
encoded_image_callback_->OnEncodedImage(encoded_image_, &codecInfo);
if (result.error != EncodedImageCallback::Result::OK) {
RTC_LOG(LS_ERROR) << "Encode m_encodedCompleteCallback failed "
<< result.error;
return WEBRTC_VIDEO_CODEC_ERROR;
}
return WEBRTC_VIDEO_CODEC_OK;
}
VideoEncoder::EncoderInfo NvidiaH265EncoderImpl::GetEncoderInfo() const {
EncoderInfo info;
info.supports_native_handle = false;
info.implementation_name = "NVIDIA H265 Encoder";
info.scaling_settings = VideoEncoder::ScalingSettings::kOff;
info.is_hardware_accelerated = true;
info.supports_simulcast = false;
info.preferred_pixel_formats = {VideoFrameBuffer::Type::kI420};
return info;
}
void NvidiaH265EncoderImpl::SetRates(
const RateControlParameters& parameters) {
if (!encoder_) {
RTC_LOG(LS_WARNING) << "SetRates() while uninitialized.";
return;
}
if (parameters.framerate_fps < 1.0) {
RTC_LOG(LS_WARNING) << "Invalid frame rate: " << parameters.framerate_fps;
return;
}
if (parameters.bitrate.get_sum_bps() == 0) {
configuration_.SetStreamState(false);
return;
}
codec_.maxFramerate = static_cast<uint32_t>(parameters.framerate_fps);
codec_.maxBitrate = parameters.bitrate.GetSpatialLayerSum(0);
configuration_.target_bps = parameters.bitrate.GetSpatialLayerSum(0);
configuration_.max_frame_rate = parameters.framerate_fps;
if (configuration_.target_bps) {
configuration_.SetStreamState(true);
} else {
configuration_.SetStreamState(false);
}
}
void NvidiaH265EncoderImpl::LayerConfig::SetStreamState(bool send_stream) {
if (send_stream && !sending) {
key_frame_request = true;
}
sending = send_stream;
}
}