Skip to content

Commit

Permalink
rtc源支持丢264 b帧操作
Browse files Browse the repository at this point in the history
  • Loading branch information
cqm authored and mtdxc committed Jan 1, 2025
1 parent 4ddb88f commit 971c66b
Show file tree
Hide file tree
Showing 5 changed files with 173 additions and 2 deletions.
127 changes: 127 additions & 0 deletions ext-codec/H264.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -26,6 +26,133 @@ using namespace std;
using namespace toolkit;

namespace mediakit {
/* Helpers to decode Exp-Golomb */
static uint32_t h264_eg_getbit(uint8_t *base, uint32_t offset) {
return ((*(base + (offset >> 0x3))) >> (0x7 - (offset & 0x7))) & 0x1;
}

uint32_t h264_eg_decode(uint8_t *base, uint32_t *offset) {
uint32_t zeros = 0;
while (h264_eg_getbit(base, (*offset)++) == 0)
zeros++;
uint32_t res = 1 << zeros;
if (zeros > 0) {
int32_t i = 0;
for (i = zeros - 1; i >= 0; i--) {
res |= h264_eg_getbit(base, (*offset)++) << i;
}
}
return res - 1;
}

/* Helper to parse a SPS (only to get the video resolution) */
static void h264_parse_sps(char *buffer, int *width, int *height) {
/* Let's check if it's the right profile, first */
int index = 1;
int profile_idc = *(buffer + index);
if (profile_idc != 66) {
WarnL << "Profile is not baseline " << profile_idc;
}
/* Then let's skip 2 bytes and evaluate/skip the rest */
index += 3;
uint32_t offset = 0;
uint8_t *base = (uint8_t *)(buffer + index);
/* Skip seq_parameter_set_id */
h264_eg_decode(base, &offset);
if (profile_idc >= 100) {
/* Skip chroma_format_idc */
h264_eg_decode(base, &offset);
/* Skip bit_depth_luma_minus8 */
h264_eg_decode(base, &offset);
/* Skip bit_depth_chroma_minus8 */
h264_eg_decode(base, &offset);
/* Skip qpprime_y_zero_transform_bypass_flag */
h264_eg_getbit(base, offset++);
/* Skip seq_scaling_matrix_present_flag */
h264_eg_getbit(base, offset++);
}
/* Skip log2_max_frame_num_minus4 */
h264_eg_decode(base, &offset);
/* Evaluate pic_order_cnt_type */
int pic_order_cnt_type = h264_eg_decode(base, &offset);
if (pic_order_cnt_type == 0) {
/* Skip log2_max_pic_order_cnt_lsb_minus4 */
h264_eg_decode(base, &offset);
} else if (pic_order_cnt_type == 1) {
/* Skip delta_pic_order_always_zero_flag, offset_for_non_ref_pic,
* offset_for_top_to_bottom_field and num_ref_frames_in_pic_order_cnt_cycle */
h264_eg_getbit(base, offset++);
h264_eg_decode(base, &offset);
h264_eg_decode(base, &offset);
int num_ref_frames_in_pic_order_cnt_cycle = h264_eg_decode(base, &offset);
int i = 0;
for (i = 0; i < num_ref_frames_in_pic_order_cnt_cycle; i++) {
h264_eg_decode(base, &offset);
}
}
/* Skip max_num_ref_frames and gaps_in_frame_num_value_allowed_flag */
h264_eg_decode(base, &offset);
h264_eg_getbit(base, offset++);
/* We need the following three values */
int pic_width_in_mbs_minus1 = h264_eg_decode(base, &offset);
int pic_height_in_map_units_minus1 = h264_eg_decode(base, &offset);
int frame_mbs_only_flag = h264_eg_getbit(base, offset++);
if (!frame_mbs_only_flag) {
/* Skip mb_adaptive_frame_field_flag */
h264_eg_getbit(base, offset++);
}
/* Skip direct_8x8_inference_flag */
h264_eg_getbit(base, offset++);
/* We need the following value to evaluate offsets, if any */
int frame_cropping_flag = h264_eg_getbit(base, offset++);
int frame_crop_left_offset = 0, frame_crop_right_offset = 0, frame_crop_top_offset = 0, frame_crop_bottom_offset = 0;
if (frame_cropping_flag) {
frame_crop_left_offset = h264_eg_decode(base, &offset);
frame_crop_right_offset = h264_eg_decode(base, &offset);
frame_crop_top_offset = h264_eg_decode(base, &offset);
frame_crop_bottom_offset = h264_eg_decode(base, &offset);
}
/* Skip vui_parameters_present_flag */
h264_eg_getbit(base, offset++);

/* We skipped what we didn't care about and got what we wanted, compute width/height */
if (width)
*width = ((pic_width_in_mbs_minus1 + 1) * 16) - frame_crop_left_offset * 2 - frame_crop_right_offset * 2;
if (height)
*height = ((2 - frame_mbs_only_flag) * (pic_height_in_map_units_minus1 + 1) * 16) - (frame_crop_top_offset * 2) - (frame_crop_bottom_offset * 2);
}

bool h264_is_bframe(uint8_t *buffer, int size) {
uint8_t nalTye = buffer[0] & 0x1F;
if (nalTye != 1) {
return false;
}
buffer++;
uint32_t offset = 0;
/* i_first_mb */
h264_eg_decode(buffer, &offset);
/* picture type */
int frame_type = h264_eg_decode(buffer, &offset);
switch(frame_type)
{
case 0: case 5: // P
//nal->Frametype = FRAME_P;
break;
case 1: case 6: // B
return true;
break;
case 3: case 8: // SP
//nal->Frametype = FRAME_P;
break;
case 2: case 7: // I
//nal->Frametype = FRAME_I;
break;
case 4: case 9: // SI
//nal->Frametype = FRAME_I;
break;
}
return false;
}

static bool getAVCInfo(const char *sps, size_t sps_len, int &iVideoWidth, int &iVideoHeight, float &iVideoFps) {
if (sps_len < 4) {
Expand Down
28 changes: 28 additions & 0 deletions ext-codec/H264.h
Original file line number Diff line number Diff line change
Expand Up @@ -20,6 +20,8 @@ namespace mediakit{

void splitH264(const char *ptr, size_t len, size_t prefix, const std::function<void(const char *, size_t, size_t)> &cb);
size_t prefixSize(const char *ptr, size_t len);
bool h264_is_bframe(uint8_t *buffer, int size);
uint32_t h264_eg_decode(uint8_t *base, uint32_t *offset);

template<typename Parent>
class H264FrameHelper : public Parent{
Expand Down Expand Up @@ -72,6 +74,32 @@ class H264FrameHelper : public Parent{
// // In the case of multiple slices, first_mb_in_slice indicates the start of a frame
return type >= NAL_B_P && type <= NAL_IDR && (nal_ptr[1] & 0x80);
}

enum SrsAvcSliceType {
SrsAvcSliceTypeP = 0,
SrsAvcSliceTypeB = 1,
SrsAvcSliceTypeI = 2,
SrsAvcSliceTypeSP = 3,
SrsAvcSliceTypeSI = 4,
SrsAvcSliceTypeP1 = 5,
SrsAvcSliceTypeB1 = 6,
SrsAvcSliceTypeI1 = 7,
SrsAvcSliceTypeSP1 = 8,
SrsAvcSliceTypeSI1 = 9,
};

bool bframe() const {
auto nal_ptr = (uint8_t *)this->data() + this->prefixSize();
if (H264_TYPE(*nal_ptr) != NAL_B_P)
return false;
nal_ptr++;
uint32_t offset = 0;
/* i_first_mb */
h264_eg_decode(nal_ptr, &offset);
/* picture type */
int frame_type = h264_eg_decode(nal_ptr, &offset);
return SrsAvcSliceTypeB == frame_type || SrsAvcSliceTypeB1 == frame_type;
}
};

/**
Expand Down
17 changes: 15 additions & 2 deletions webrtc/RtcMediaSource.h
Original file line number Diff line number Diff line change
Expand Up @@ -3,8 +3,9 @@

#include "Rtsp/RtspMediaSourceMuxer.h"
#include "Rtsp/RtspMediaSourceImp.h"
#include "webrtc/WebRtcTransport.h"
namespace mediakit {

extern bool h264_is_bframe(uint8_t *buffer, int size);
class RtcMediaSourceImp : public RtspMediaSourceImp {
public:
using Ptr = std::shared_ptr<RtcMediaSourceImp>;
Expand Down Expand Up @@ -51,7 +52,19 @@ class RtcMediaSourceMuxer : public RtspMediaSourceMuxer {
_trans->delDelegate(this);
}
}
protected:

bool inputFrame(const Frame::Ptr &frame) override {
// skip b-frame for webrtc
GET_CONFIG(int, dropBFrame, Rtc::kDrop264BFrame);
if (dropBFrame && frame->getCodecId() == CodecH264) {
if (h264_is_bframe((uint8_t *)frame->data() + frame->prefixSize(), frame->size() - frame->prefixSize())) {
DebugL << "skipFrame " << frame->size() << " tsp:" << frame->pts() << "," << frame->dts();
return true;
}
}
return RtspMediaSourceMuxer::inputFrame(frame);
}
protected:
Track::Ptr _trans;
};

Expand Down
2 changes: 2 additions & 0 deletions webrtc/WebRtcTransport.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -64,6 +64,7 @@ const string kMinBitrate = RTC_FIELD "min_bitrate";
// 数据通道设置 [AUTO-TRANSLATED:2dc48bc3]
// Data channel setting
const string kDataChannelEcho = RTC_FIELD "datachannel_echo";
const string kDrop264BFrame = RTC_FIELD "drop_h264_bframe";

static onceToken token([]() {
mINI::Instance()[kTimeOutSec] = 15;
Expand All @@ -76,6 +77,7 @@ static onceToken token([]() {
mINI::Instance()[kMaxBitrate] = 0;
mINI::Instance()[kMinBitrate] = 0;

mINI::Instance()[kDrop264BFrame] = true;
mINI::Instance()[kDataChannelEcho] = true;
});

Expand Down
1 change: 1 addition & 0 deletions webrtc/WebRtcTransport.h
Original file line number Diff line number Diff line change
Expand Up @@ -34,6 +34,7 @@ namespace Rtc {
extern const std::string kPort;
extern const std::string kTcpPort;
extern const std::string kTimeOutSec;
extern const std::string kDrop264BFrame;
}//namespace RTC

class WebRtcInterface {
Expand Down

0 comments on commit 971c66b

Please sign in to comment.