mirror of
https://github.com/ZLMediaKit/ZLMediaKit.git
synced 2024-12-18 08:26:38 +08:00
425 lines
15 KiB
C++
425 lines
15 KiB
C++
/*
|
||
* Copyright (c) 2016-present The ZLMediaKit project authors. All Rights Reserved.
|
||
*
|
||
* This file is part of ZLMediaKit(https://github.com/ZLMediaKit/ZLMediaKit).
|
||
*
|
||
* Use of this source code is governed by MIT-like license that can be found in the
|
||
* LICENSE file in the root of the source tree. All contributing project authors
|
||
* may be found in the AUTHORS file in the root of the source tree.
|
||
*/
|
||
|
||
#include "H264.h"
|
||
#include "H264Rtmp.h"
|
||
#include "H264Rtp.h"
|
||
#include "SPSParser.h"
|
||
#include "Util/logger.h"
|
||
#include "Util/base64.h"
|
||
#include "Common/Parser.h"
|
||
#include "Common/config.h"
|
||
#include "Extension/Factory.h"
|
||
|
||
#ifdef ENABLE_MP4
|
||
#include "mpeg4-avc.h"
|
||
#endif
|
||
|
||
using namespace std;
|
||
using namespace toolkit;
|
||
|
||
namespace mediakit {
|
||
|
||
static bool getAVCInfo(const char *sps, size_t sps_len, int &iVideoWidth, int &iVideoHeight, float &iVideoFps) {
|
||
if (sps_len < 4) {
|
||
return false;
|
||
}
|
||
T_GetBitContext tGetBitBuf;
|
||
T_SPS tH264SpsInfo;
|
||
memset(&tGetBitBuf, 0, sizeof(tGetBitBuf));
|
||
memset(&tH264SpsInfo, 0, sizeof(tH264SpsInfo));
|
||
tGetBitBuf.pu8Buf = (uint8_t *)sps + 1;
|
||
tGetBitBuf.iBufSize = (int)(sps_len - 1);
|
||
if (0 != h264DecSeqParameterSet((void *)&tGetBitBuf, &tH264SpsInfo)) {
|
||
return false;
|
||
}
|
||
h264GetWidthHeight(&tH264SpsInfo, &iVideoWidth, &iVideoHeight);
|
||
h264GeFramerate(&tH264SpsInfo, &iVideoFps);
|
||
// ErrorL << iVideoWidth << " " << iVideoHeight << " " << iVideoFps;
|
||
return true;
|
||
}
|
||
|
||
bool getAVCInfo(const string &strSps, int &iVideoWidth, int &iVideoHeight, float &iVideoFps) {
|
||
return getAVCInfo(strSps.data(), strSps.size(), iVideoWidth, iVideoHeight, iVideoFps);
|
||
}
|
||
|
||
static const char *memfind(const char *buf, ssize_t len, const char *subbuf, ssize_t sublen) {
|
||
for (auto i = 0; i < len - sublen; ++i) {
|
||
if (memcmp(buf + i, subbuf, sublen) == 0) {
|
||
return buf + i;
|
||
}
|
||
}
|
||
return NULL;
|
||
}
|
||
|
||
void splitH264(
|
||
const char *ptr, size_t len, size_t prefix, const std::function<void(const char *, size_t, size_t)> &cb) {
|
||
auto start = ptr + prefix;
|
||
auto end = ptr + len;
|
||
size_t next_prefix;
|
||
while (true) {
|
||
auto next_start = memfind(start, end - start, "\x00\x00\x01", 3);
|
||
if (next_start) {
|
||
// 找到下一帧 [AUTO-TRANSLATED:7161f54a]
|
||
// Find the next frame
|
||
if (*(next_start - 1) == 0x00) {
|
||
// 这个是00 00 00 01开头 [AUTO-TRANSLATED:b0d79e9e]
|
||
// This starts with 00 00 00 01
|
||
next_start -= 1;
|
||
next_prefix = 4;
|
||
} else {
|
||
// 这个是00 00 01开头 [AUTO-TRANSLATED:18ae81d8]
|
||
// This starts with 00 00 01
|
||
next_prefix = 3;
|
||
}
|
||
// 记得加上本帧prefix长度 [AUTO-TRANSLATED:8bde5d52]
|
||
// Remember to add the prefix length of this frame
|
||
cb(start - prefix, next_start - start + prefix, prefix);
|
||
// 搜索下一帧末尾的起始位置 [AUTO-TRANSLATED:8976b719]
|
||
// Search for the starting position of the end of the next frame
|
||
start = next_start + next_prefix;
|
||
// 记录下一帧的prefix长度 [AUTO-TRANSLATED:756aee4e]
|
||
// Record the prefix length of the next frame
|
||
prefix = next_prefix;
|
||
continue;
|
||
}
|
||
// 未找到下一帧,这是最后一帧 [AUTO-TRANSLATED:58365453]
|
||
// The next frame was not found, this is the last frame
|
||
cb(start - prefix, end - start + prefix, prefix);
|
||
break;
|
||
}
|
||
}
|
||
|
||
size_t prefixSize(const char *ptr, size_t len) {
|
||
if (len < 4) {
|
||
return 0;
|
||
}
|
||
|
||
if (ptr[0] != 0x00 || ptr[1] != 0x00) {
|
||
// 不是0x00 00开头 [AUTO-TRANSLATED:c406f0da]
|
||
// Not 0x00 00 at the beginning
|
||
return 0;
|
||
}
|
||
|
||
if (ptr[2] == 0x00 && ptr[3] == 0x01) {
|
||
// 是0x00 00 00 01 [AUTO-TRANSLATED:70caae72]
|
||
// It is 0x00 00 00 01
|
||
return 4;
|
||
}
|
||
|
||
if (ptr[2] == 0x01) {
|
||
// 是0x00 00 01 [AUTO-TRANSLATED:78b4a3c9]
|
||
// It is 0x00 00 01
|
||
return 3;
|
||
}
|
||
return 0;
|
||
}
|
||
|
||
////////////////////////////////////////////////////////////////////////////////////////////////////
|
||
|
||
H264Track::H264Track(const string &sps, const string &pps, int sps_prefix_len, int pps_prefix_len) {
|
||
_sps = sps.substr(sps_prefix_len);
|
||
_pps = pps.substr(pps_prefix_len);
|
||
H264Track::update();
|
||
}
|
||
|
||
CodecId H264Track::getCodecId() const {
|
||
return CodecH264;
|
||
}
|
||
|
||
int H264Track::getVideoHeight() const {
|
||
return _height;
|
||
}
|
||
|
||
int H264Track::getVideoWidth() const {
|
||
return _width;
|
||
}
|
||
|
||
float H264Track::getVideoFps() const {
|
||
return _fps;
|
||
}
|
||
|
||
bool H264Track::ready() const {
|
||
return !_sps.empty() && !_pps.empty();
|
||
}
|
||
|
||
bool H264Track::inputFrame(const Frame::Ptr &frame) {
|
||
using H264FrameInternal = FrameInternal<H264FrameNoCacheAble>;
|
||
int type = H264_TYPE(frame->data()[frame->prefixSize()]);
|
||
|
||
if ((type == H264Frame::NAL_B_P || type == H264Frame::NAL_IDR) && ready()) {
|
||
return inputFrame_l(frame);
|
||
}
|
||
|
||
// 非I/B/P帧情况下,split一下,防止多个帧粘合在一起 [AUTO-TRANSLATED:b69c6e75]
|
||
// In the case of non-I/B/P frames, split it to prevent multiple frames from sticking together
|
||
bool ret = false;
|
||
splitH264(frame->data(), frame->size(), frame->prefixSize(), [&](const char *ptr, size_t len, size_t prefix) {
|
||
H264FrameInternal::Ptr sub_frame = std::make_shared<H264FrameInternal>(frame, (char *)ptr, len, prefix);
|
||
if (inputFrame_l(sub_frame)) {
|
||
ret = true;
|
||
}
|
||
});
|
||
return ret;
|
||
}
|
||
|
||
toolkit::Buffer::Ptr H264Track::getExtraData() const {
|
||
CHECK(ready());
|
||
|
||
#ifdef ENABLE_MP4
|
||
struct mpeg4_avc_t avc;
|
||
memset(&avc, 0, sizeof(avc));
|
||
string sps_pps = string("\x00\x00\x00\x01", 4) + _sps + string("\x00\x00\x00\x01", 4) + _pps;
|
||
h264_annexbtomp4(&avc, sps_pps.data(), (int)sps_pps.size(), NULL, 0, NULL, NULL);
|
||
|
||
std::string extra_data;
|
||
extra_data.resize(1024);
|
||
auto extra_data_size = mpeg4_avc_decoder_configuration_record_save(&avc, (uint8_t *)extra_data.data(), extra_data.size());
|
||
if (extra_data_size == -1) {
|
||
WarnL << "生成H264 extra_data 失败";
|
||
return nullptr;
|
||
}
|
||
extra_data.resize(extra_data_size);
|
||
return std::make_shared<BufferString>(std::move(extra_data));
|
||
#else
|
||
std::string extra_data;
|
||
// AVCDecoderConfigurationRecord start
|
||
extra_data.push_back(1); // version
|
||
extra_data.push_back(_sps[1]); // profile
|
||
extra_data.push_back(_sps[2]); // compat
|
||
extra_data.push_back(_sps[3]); // level
|
||
extra_data.push_back((char)0xff); // 6 bits reserved + 2 bits nal size length - 1 (11)
|
||
extra_data.push_back((char)0xe1); // 3 bits reserved + 5 bits number of sps (00001)
|
||
// sps
|
||
uint16_t size = (uint16_t)_sps.size();
|
||
size = htons(size);
|
||
extra_data.append((char *)&size, 2);
|
||
extra_data.append(_sps);
|
||
// pps
|
||
extra_data.push_back(1); // version
|
||
size = (uint16_t)_pps.size();
|
||
size = htons(size);
|
||
extra_data.append((char *)&size, 2);
|
||
extra_data.append(_pps);
|
||
return std::make_shared<BufferString>(std::move(extra_data));
|
||
#endif
|
||
}
|
||
|
||
void H264Track::setExtraData(const uint8_t *data, size_t bytes) {
|
||
#ifdef ENABLE_MP4
|
||
struct mpeg4_avc_t avc;
|
||
memset(&avc, 0, sizeof(avc));
|
||
if (mpeg4_avc_decoder_configuration_record_load(data, bytes, &avc) > 0) {
|
||
std::vector<uint8_t> config(bytes * 2);
|
||
int size = mpeg4_avc_to_nalu(&avc, config.data(), bytes * 2);
|
||
if (size > 4) {
|
||
splitH264((char *)config.data(), size, 4, [&](const char *ptr, size_t len, size_t prefix) {
|
||
inputFrame_l(std::make_shared<H264FrameNoCacheAble>((char *)ptr, len, 0, 0, prefix));
|
||
});
|
||
update();
|
||
}
|
||
}
|
||
#else
|
||
CHECK(bytes >= 8); // 6 + 2
|
||
size_t offset = 6;
|
||
|
||
uint16_t sps_size = data[offset] << 8 | data[offset + 1];
|
||
auto sps_ptr = data + offset + 2;
|
||
offset += (2 + sps_size);
|
||
CHECK(bytes >= offset + 2); // + pps_size
|
||
_sps.assign((char *)sps_ptr, sps_size);
|
||
|
||
uint16_t pps_size = data[offset] << 8 | data[offset + 1];
|
||
auto pps_ptr = data + offset + 2;
|
||
offset += (2 + pps_size);
|
||
CHECK(bytes >= offset);
|
||
_pps.assign((char *)pps_ptr, pps_size);
|
||
update();
|
||
#endif
|
||
}
|
||
|
||
bool H264Track::update() {
|
||
return getAVCInfo(_sps, _width, _height, _fps);
|
||
}
|
||
|
||
std::vector<Frame::Ptr> H264Track::getConfigFrames() const {
|
||
if (!ready()) {
|
||
return {};
|
||
}
|
||
return { createConfigFrame<H264Frame>(_sps, 0, getIndex()),
|
||
createConfigFrame<H264Frame>(_pps, 0, getIndex()) };
|
||
}
|
||
|
||
Track::Ptr H264Track::clone() const {
|
||
return std::make_shared<H264Track>(*this);
|
||
}
|
||
|
||
bool H264Track::inputFrame_l(const Frame::Ptr &frame) {
|
||
int type = H264_TYPE(frame->data()[frame->prefixSize()]);
|
||
bool ret = true;
|
||
switch (type) {
|
||
case H264Frame::NAL_SPS: {
|
||
_sps = string(frame->data() + frame->prefixSize(), frame->size() - frame->prefixSize());
|
||
_latest_is_config_frame = true;
|
||
ret = VideoTrack::inputFrame(frame);
|
||
break;
|
||
}
|
||
case H264Frame::NAL_PPS: {
|
||
_pps = string(frame->data() + frame->prefixSize(), frame->size() - frame->prefixSize());
|
||
_latest_is_config_frame = true;
|
||
ret = VideoTrack::inputFrame(frame);
|
||
break;
|
||
}
|
||
default:
|
||
// 避免识别不出关键帧 [AUTO-TRANSLATED:8eb84679]
|
||
// Avoid not being able to recognize keyframes
|
||
if (_latest_is_config_frame && !frame->dropAble()) {
|
||
if (!frame->keyFrame()) {
|
||
const_cast<Frame::Ptr &>(frame) = std::make_shared<FrameCacheAble>(frame, true);
|
||
}
|
||
}
|
||
// 判断是否是I帧, 并且如果是,那判断前面是否插入过config帧, 如果插入过就不插入了 [AUTO-TRANSLATED:40733cd8]
|
||
// Determine if it is an I frame, and if it is, determine if a config frame has been inserted before, and if it has been inserted, do not insert it
|
||
if (frame->keyFrame() && !_latest_is_config_frame) {
|
||
insertConfigFrame(frame);
|
||
}
|
||
if(!frame->dropAble()){
|
||
_latest_is_config_frame = false;
|
||
}
|
||
ret = VideoTrack::inputFrame(frame);
|
||
break;
|
||
}
|
||
|
||
if (_width == 0 && ready()) {
|
||
update();
|
||
}
|
||
return ret;
|
||
}
|
||
|
||
void H264Track::insertConfigFrame(const Frame::Ptr &frame) {
|
||
if (!_sps.empty()) {
|
||
VideoTrack::inputFrame(createConfigFrame<H264Frame>(_sps, frame->dts(), frame->getIndex()));
|
||
}
|
||
|
||
if (!_pps.empty()) {
|
||
VideoTrack::inputFrame(createConfigFrame<H264Frame>(_pps, frame->dts(), frame->getIndex()));
|
||
}
|
||
}
|
||
|
||
class H264Sdp : public Sdp {
|
||
public:
|
||
H264Sdp(const string &strSPS, const string &strPPS, int payload_type, int bitrate) : Sdp(90000, payload_type) {
|
||
_printer << "m=video 0 RTP/AVP " << payload_type << "\r\n";
|
||
if (bitrate) {
|
||
_printer << "b=AS:" << bitrate << "\r\n";
|
||
}
|
||
_printer << "a=rtpmap:" << payload_type << " " << getCodecName(CodecH264) << "/" << 90000 << "\r\n";
|
||
|
||
/**
|
||
Single NAI Unit Mode = 0. // Single NAI mode (Only nals from 1-23 are allowed)
|
||
Non Interleaved Mode = 1,// Non-interleaved Mode: 1-23,24 (STAP-A),28 (FU-A) are allowed
|
||
Interleaved Mode = 2, // 25 (STAP-B),26 (MTAP16),27 (MTAP24),28 (EU-A),and 29 (EU-B) are allowed.
|
||
Single NAI Unit Mode = 0. // Single NAI mode (Only nals from 1-23 are allowed)
|
||
Non Interleaved Mode = 1,// Non-interleaved Mode: 1-23,24 (STAP-A),28 (FU-A) are allowed
|
||
Interleaved Mode = 2, // 25 (STAP-B),26 (MTAP16),27 (MTAP24),28 (EU-A),and 29 (EU-B) are allowed.
|
||
*
|
||
* [AUTO-TRANSLATED:6166738f]
|
||
**/
|
||
GET_CONFIG(bool, h264_stap_a, Rtp::kH264StapA);
|
||
_printer << "a=fmtp:" << payload_type << " packetization-mode=" << h264_stap_a << "; profile-level-id=";
|
||
|
||
uint32_t profile_level_id = 0;
|
||
if (strSPS.length() >= 4) { // sanity check
|
||
profile_level_id = (uint8_t(strSPS[1]) << 16) |
|
||
(uint8_t(strSPS[2]) << 8) |
|
||
(uint8_t(strSPS[3])); // profile_idc|constraint_setN_flag|level_idc
|
||
}
|
||
|
||
char profile[8];
|
||
snprintf(profile, sizeof(profile), "%06X", profile_level_id);
|
||
_printer << profile;
|
||
_printer << "; sprop-parameter-sets=";
|
||
_printer << encodeBase64(strSPS) << ",";
|
||
_printer << encodeBase64(strPPS) << "\r\n";
|
||
}
|
||
|
||
string getSdp() const { return _printer; }
|
||
|
||
private:
|
||
_StrPrinter _printer;
|
||
};
|
||
|
||
Sdp::Ptr H264Track::getSdp(uint8_t payload_type) const {
|
||
if (!ready()) {
|
||
WarnL << getCodecName() << " Track未准备好";
|
||
return nullptr;
|
||
}
|
||
return std::make_shared<H264Sdp>(_sps, _pps, payload_type, getBitRate() / 1024);
|
||
}
|
||
|
||
namespace {
|
||
|
||
CodecId getCodec() {
|
||
return CodecH264;
|
||
}
|
||
|
||
Track::Ptr getTrackByCodecId(int sample_rate, int channels, int sample_bit) {
|
||
return std::make_shared<H264Track>();
|
||
}
|
||
|
||
Track::Ptr getTrackBySdp(const SdpTrack::Ptr &track) {
|
||
//a=fmtp:96 packetization-mode=1;profile-level-id=42C01F;sprop-parameter-sets=Z0LAH9oBQBboQAAAAwBAAAAPI8YMqA==,aM48gA==
|
||
auto map = Parser::parseArgs(track->_fmtp, ";", "=");
|
||
auto sps_pps = map["sprop-parameter-sets"];
|
||
string base64_SPS = findSubString(sps_pps.data(), NULL, ",");
|
||
string base64_PPS = findSubString(sps_pps.data(), ",", NULL);
|
||
auto sps = decodeBase64(base64_SPS);
|
||
auto pps = decodeBase64(base64_PPS);
|
||
if (sps.empty() || pps.empty()) {
|
||
// 如果sdp里面没有sps/pps,那么可能在后续的rtp里面恢复出sps/pps [AUTO-TRANSLATED:60f03d45]
|
||
// If there is no sps/pps in the sdp, then it may be possible to recover the sps/pps in the subsequent rtp
|
||
return std::make_shared<H264Track>();
|
||
}
|
||
return std::make_shared<H264Track>(sps, pps, 0, 0);
|
||
}
|
||
|
||
RtpCodec::Ptr getRtpEncoderByCodecId(uint8_t pt) {
|
||
return std::make_shared<H264RtpEncoder>();
|
||
}
|
||
|
||
RtpCodec::Ptr getRtpDecoderByCodecId() {
|
||
return std::make_shared<H264RtpDecoder>();
|
||
}
|
||
|
||
RtmpCodec::Ptr getRtmpEncoderByTrack(const Track::Ptr &track) {
|
||
return std::make_shared<H264RtmpEncoder>(track);
|
||
}
|
||
|
||
RtmpCodec::Ptr getRtmpDecoderByTrack(const Track::Ptr &track) {
|
||
return std::make_shared<H264RtmpDecoder>(track);
|
||
}
|
||
|
||
Frame::Ptr getFrameFromPtr(const char *data, size_t bytes, uint64_t dts, uint64_t pts) {
|
||
return std::make_shared<H264FrameNoCacheAble>((char *)data, bytes, dts, pts, prefixSize(data, bytes));
|
||
}
|
||
|
||
} // namespace
|
||
|
||
CodecPlugin h264_plugin = { getCodec,
|
||
getTrackByCodecId,
|
||
getTrackBySdp,
|
||
getRtpEncoderByCodecId,
|
||
getRtpDecoderByCodecId,
|
||
getRtmpEncoderByTrack,
|
||
getRtmpDecoderByTrack,
|
||
getFrameFromPtr };
|
||
|
||
} // namespace mediakit
|