From 971c66b11a122e897118cc7de656b64c399db94c Mon Sep 17 00:00:00 2001 From: cqm Date: Tue, 31 Dec 2024 17:48:40 +0800 Subject: [PATCH] =?UTF-8?q?rtc=E6=BA=90=E6=94=AF=E6=8C=81=E4=B8=A2264=20b?= =?UTF-8?q?=E5=B8=A7=E6=93=8D=E4=BD=9C?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- ext-codec/H264.cpp | 127 +++++++++++++++++++++++++++++++++++++ ext-codec/H264.h | 28 ++++++++ webrtc/RtcMediaSource.h | 17 ++++- webrtc/WebRtcTransport.cpp | 2 + webrtc/WebRtcTransport.h | 1 + 5 files changed, 173 insertions(+), 2 deletions(-) diff --git a/ext-codec/H264.cpp b/ext-codec/H264.cpp index 38c1d9bc25..227e795c05 100644 --- a/ext-codec/H264.cpp +++ b/ext-codec/H264.cpp @@ -26,6 +26,133 @@ using namespace std; using namespace toolkit; namespace mediakit { +/* Helpers to decode Exp-Golomb */ +static uint32_t h264_eg_getbit(uint8_t *base, uint32_t offset) { + return ((*(base + (offset >> 0x3))) >> (0x7 - (offset & 0x7))) & 0x1; +} + +uint32_t h264_eg_decode(uint8_t *base, uint32_t *offset) { + uint32_t zeros = 0; + while (h264_eg_getbit(base, (*offset)++) == 0) + zeros++; + uint32_t res = 1 << zeros; + if (zeros > 0) { + int32_t i = 0; + for (i = zeros - 1; i >= 0; i--) { + res |= h264_eg_getbit(base, (*offset)++) << i; + } + } + return res - 1; +} + +/* Helper to parse a SPS (only to get the video resolution) */ +static void h264_parse_sps(char *buffer, int *width, int *height) { + /* Let's check if it's the right profile, first */ + int index = 1; + int profile_idc = *(buffer + index); + if (profile_idc != 66) { + WarnL << "Profile is not baseline " << profile_idc; + } + /* Then let's skip 2 bytes and evaluate/skip the rest */ + index += 3; + uint32_t offset = 0; + uint8_t *base = (uint8_t *)(buffer + index); + /* Skip seq_parameter_set_id */ + h264_eg_decode(base, &offset); + if (profile_idc >= 100) { + /* Skip chroma_format_idc */ + h264_eg_decode(base, &offset); + /* Skip bit_depth_luma_minus8 */ + h264_eg_decode(base, &offset); + /* Skip bit_depth_chroma_minus8 */ + h264_eg_decode(base, &offset); + /* Skip qpprime_y_zero_transform_bypass_flag */ + h264_eg_getbit(base, offset++); + /* Skip seq_scaling_matrix_present_flag */ + h264_eg_getbit(base, offset++); + } + /* Skip log2_max_frame_num_minus4 */ + h264_eg_decode(base, &offset); + /* Evaluate pic_order_cnt_type */ + int pic_order_cnt_type = h264_eg_decode(base, &offset); + if (pic_order_cnt_type == 0) { + /* Skip log2_max_pic_order_cnt_lsb_minus4 */ + h264_eg_decode(base, &offset); + } else if (pic_order_cnt_type == 1) { + /* Skip delta_pic_order_always_zero_flag, offset_for_non_ref_pic, + * offset_for_top_to_bottom_field and num_ref_frames_in_pic_order_cnt_cycle */ + h264_eg_getbit(base, offset++); + h264_eg_decode(base, &offset); + h264_eg_decode(base, &offset); + int num_ref_frames_in_pic_order_cnt_cycle = h264_eg_decode(base, &offset); + int i = 0; + for (i = 0; i < num_ref_frames_in_pic_order_cnt_cycle; i++) { + h264_eg_decode(base, &offset); + } + } + /* Skip max_num_ref_frames and gaps_in_frame_num_value_allowed_flag */ + h264_eg_decode(base, &offset); + h264_eg_getbit(base, offset++); + /* We need the following three values */ + int pic_width_in_mbs_minus1 = h264_eg_decode(base, &offset); + int pic_height_in_map_units_minus1 = h264_eg_decode(base, &offset); + int frame_mbs_only_flag = h264_eg_getbit(base, offset++); + if (!frame_mbs_only_flag) { + /* Skip mb_adaptive_frame_field_flag */ + h264_eg_getbit(base, offset++); + } + /* Skip direct_8x8_inference_flag */ + h264_eg_getbit(base, offset++); + /* We need the following value to evaluate offsets, if any */ + int frame_cropping_flag = h264_eg_getbit(base, offset++); + int frame_crop_left_offset = 0, frame_crop_right_offset = 0, frame_crop_top_offset = 0, frame_crop_bottom_offset = 0; + if (frame_cropping_flag) { + frame_crop_left_offset = h264_eg_decode(base, &offset); + frame_crop_right_offset = h264_eg_decode(base, &offset); + frame_crop_top_offset = h264_eg_decode(base, &offset); + frame_crop_bottom_offset = h264_eg_decode(base, &offset); + } + /* Skip vui_parameters_present_flag */ + h264_eg_getbit(base, offset++); + + /* We skipped what we didn't care about and got what we wanted, compute width/height */ + if (width) + *width = ((pic_width_in_mbs_minus1 + 1) * 16) - frame_crop_left_offset * 2 - frame_crop_right_offset * 2; + if (height) + *height = ((2 - frame_mbs_only_flag) * (pic_height_in_map_units_minus1 + 1) * 16) - (frame_crop_top_offset * 2) - (frame_crop_bottom_offset * 2); +} + +bool h264_is_bframe(uint8_t *buffer, int size) { + uint8_t nalTye = buffer[0] & 0x1F; + if (nalTye != 1) { + return false; + } + buffer++; + uint32_t offset = 0; + /* i_first_mb */ + h264_eg_decode(buffer, &offset); + /* picture type */ + int frame_type = h264_eg_decode(buffer, &offset); + switch(frame_type) + { + case 0: case 5: // P + //nal->Frametype = FRAME_P; + break; + case 1: case 6: // B + return true; + break; + case 3: case 8: // SP + //nal->Frametype = FRAME_P; + break; + case 2: case 7: // I + //nal->Frametype = FRAME_I; + break; + case 4: case 9: // SI + //nal->Frametype = FRAME_I; + break; + } + return false; +} static bool getAVCInfo(const char *sps, size_t sps_len, int &iVideoWidth, int &iVideoHeight, float &iVideoFps) { if (sps_len < 4) { diff --git a/ext-codec/H264.h b/ext-codec/H264.h index 55b6f1ff50..b74efcc1d9 100644 --- a/ext-codec/H264.h +++ b/ext-codec/H264.h @@ -20,6 +20,8 @@ namespace mediakit{ void splitH264(const char *ptr, size_t len, size_t prefix, const std::function &cb); size_t prefixSize(const char *ptr, size_t len); +bool h264_is_bframe(uint8_t *buffer, int size); +uint32_t h264_eg_decode(uint8_t *base, uint32_t *offset); template class H264FrameHelper : public Parent{ @@ -72,6 +74,32 @@ class H264FrameHelper : public Parent{ // // In the case of multiple slices, first_mb_in_slice indicates the start of a frame return type >= NAL_B_P && type <= NAL_IDR && (nal_ptr[1] & 0x80); } + + enum SrsAvcSliceType { + SrsAvcSliceTypeP = 0, + SrsAvcSliceTypeB = 1, + SrsAvcSliceTypeI = 2, + SrsAvcSliceTypeSP = 3, + SrsAvcSliceTypeSI = 4, + SrsAvcSliceTypeP1 = 5, + SrsAvcSliceTypeB1 = 6, + SrsAvcSliceTypeI1 = 7, + SrsAvcSliceTypeSP1 = 8, + SrsAvcSliceTypeSI1 = 9, + }; + + bool bframe() const { + auto nal_ptr = (uint8_t *)this->data() + this->prefixSize(); + if (H264_TYPE(*nal_ptr) != NAL_B_P) + return false; + nal_ptr++; + uint32_t offset = 0; + /* i_first_mb */ + h264_eg_decode(nal_ptr, &offset); + /* picture type */ + int frame_type = h264_eg_decode(nal_ptr, &offset); + return SrsAvcSliceTypeB == frame_type || SrsAvcSliceTypeB1 == frame_type; + } }; /** diff --git a/webrtc/RtcMediaSource.h b/webrtc/RtcMediaSource.h index 6e18893a0b..bfba8ed804 100644 --- a/webrtc/RtcMediaSource.h +++ b/webrtc/RtcMediaSource.h @@ -3,8 +3,9 @@ #include "Rtsp/RtspMediaSourceMuxer.h" #include "Rtsp/RtspMediaSourceImp.h" +#include "webrtc/WebRtcTransport.h" namespace mediakit { - +extern bool h264_is_bframe(uint8_t *buffer, int size); class RtcMediaSourceImp : public RtspMediaSourceImp { public: using Ptr = std::shared_ptr; @@ -51,7 +52,19 @@ class RtcMediaSourceMuxer : public RtspMediaSourceMuxer { _trans->delDelegate(this); } } -protected: + + bool inputFrame(const Frame::Ptr &frame) override { + // skip b-frame for webrtc + GET_CONFIG(int, dropBFrame, Rtc::kDrop264BFrame); + if (dropBFrame && frame->getCodecId() == CodecH264) { + if (h264_is_bframe((uint8_t *)frame->data() + frame->prefixSize(), frame->size() - frame->prefixSize())) { + DebugL << "skipFrame " << frame->size() << " tsp:" << frame->pts() << "," << frame->dts(); + return true; + } + } + return RtspMediaSourceMuxer::inputFrame(frame); + } + protected: Track::Ptr _trans; }; diff --git a/webrtc/WebRtcTransport.cpp b/webrtc/WebRtcTransport.cpp index efc0f71b3b..cec4c9aa69 100644 --- a/webrtc/WebRtcTransport.cpp +++ b/webrtc/WebRtcTransport.cpp @@ -64,6 +64,7 @@ const string kMinBitrate = RTC_FIELD "min_bitrate"; // 数据通道设置 [AUTO-TRANSLATED:2dc48bc3] // Data channel setting const string kDataChannelEcho = RTC_FIELD "datachannel_echo"; +const string kDrop264BFrame = RTC_FIELD "drop_h264_bframe"; static onceToken token([]() { mINI::Instance()[kTimeOutSec] = 15; @@ -76,6 +77,7 @@ static onceToken token([]() { mINI::Instance()[kMaxBitrate] = 0; mINI::Instance()[kMinBitrate] = 0; + mINI::Instance()[kDrop264BFrame] = true; mINI::Instance()[kDataChannelEcho] = true; }); diff --git a/webrtc/WebRtcTransport.h b/webrtc/WebRtcTransport.h index b5cbe12da4..4c86d8b6e4 100644 --- a/webrtc/WebRtcTransport.h +++ b/webrtc/WebRtcTransport.h @@ -34,6 +34,7 @@ namespace Rtc { extern const std::string kPort; extern const std::string kTcpPort; extern const std::string kTimeOutSec; +extern const std::string kDrop264BFrame; }//namespace RTC class WebRtcInterface {