ZLMediaKit/src/Extension/Frame.h

568 lines
15 KiB
C++
Raw Normal View History

/*
 * Copyright (c) 2016 The ZLMediaKit project authors. All Rights Reserved.
 *
 * This file is part of ZLMediaKit(https://github.com/xia-chu/ZLMediaKit).
 *
 * Use of this source code is governed by MIT license that can be found in the
 * LICENSE file in the root of the source tree. All contributing project authors
 * may be found in the AUTHORS file in the root of the source tree.
 */
2018-10-18 23:48:00 +08:00
#ifndef ZLMEDIAKIT_FRAME_H
#define ZLMEDIAKIT_FRAME_H
#include <map>
2018-10-26 16:09:48 +08:00
#include <mutex>
#include <functional>
#include "Util/List.h"
#include "Network/Buffer.h"
2018-10-26 16:09:48 +08:00
namespace mediakit {
class Stamp;
2018-10-23 11:09:21 +08:00
/**
 * Category of a media track.
 * TrackInvalid marks "no / unknown track"; TrackMax is the trailing
 * sentinel and must stay the last enumerator.
 */
typedef enum {
    TrackInvalid = -1,
    TrackVideo = 0,
    TrackAudio = 1,
    TrackTitle = 2,
    TrackApplication = 3,
    // Sentinel: its value equals the number of valid track types above.
    TrackMax
} TrackType;
2021-06-16 11:14:10 +08:00
/**
 * X-macro table of the known codecs.
 * Each row is XX(enumerator, track type, numeric id, name string, mpeg id).
 * Define XX, expand CODEC_MAP(XX), then #undef XX to generate code from it.
 */
#define CODEC_MAP(XX)                                                     \
    XX(CodecH264,  TrackVideo, 0,  "H264",          PSI_STREAM_H264)        \
    XX(CodecH265,  TrackVideo, 1,  "H265",          PSI_STREAM_H265)        \
    XX(CodecAAC,   TrackAudio, 2,  "mpeg4-generic", PSI_STREAM_AAC)         \
    XX(CodecG711A, TrackAudio, 3,  "PCMA",          PSI_STREAM_AUDIO_G711A) \
    XX(CodecG711U, TrackAudio, 4,  "PCMU",          PSI_STREAM_AUDIO_G711U) \
    XX(CodecOpus,  TrackAudio, 5,  "opus",          PSI_STREAM_AUDIO_OPUS)  \
    XX(CodecL16,   TrackAudio, 6,  "L16",           PSI_STREAM_RESERVED)    \
    XX(CodecVP8,   TrackVideo, 7,  "VP8",           PSI_STREAM_VP8)         \
    XX(CodecVP9,   TrackVideo, 8,  "VP9",           PSI_STREAM_VP9)         \
    XX(CodecAV1,   TrackVideo, 9,  "AV1",           PSI_STREAM_AV1)         \
    XX(CodecJPEG,  TrackVideo, 10, "JPEG",          PSI_STREAM_JPEG_2000)

/**
 * Codec identifiers generated from CODEC_MAP.
 * CodecInvalid (-1) marks "no / unknown codec"; CodecMax is the trailing
 * sentinel that directly follows the last table entry.
 */
typedef enum {
    CodecInvalid = -1,
// Only the enumerator name and its numeric id are used here.
#define XX(codec, track, id, text, psi) codec = id,
    CODEC_MAP(XX)
#undef XX
    CodecMax
} CodecId;
2021-03-30 10:59:15 +08:00
/**
*
*/
TrackType getTrackType(const std::string &str);
2021-03-30 10:59:15 +08:00
/**
*
*/
const char* getTrackString(TrackType type);
/**
* SDP中描述获取codec_id
* @param str
* @return
*/
CodecId getCodecId(const std::string &str);
2021-03-30 10:59:15 +08:00
2020-05-15 18:08:54 +08:00
/**
*
*/
const char *getCodecName(CodecId codecId);
/**
*
*/
TrackType getTrackType(CodecId codecId);
2018-10-27 22:54:16 +08:00
/**
*
*/
2018-10-23 11:09:21 +08:00
class CodecInfo {
public:
2022-12-02 14:43:06 +08:00
using Ptr = std::shared_ptr<CodecInfo>;
2018-10-23 18:39:17 +08:00
CodecInfo() = default;
virtual ~CodecInfo() = default;
2018-10-23 11:09:21 +08:00
/**
*
*/
virtual CodecId getCodecId() const = 0;
2020-03-08 21:19:20 +08:00
/**
*
*/
const char *getCodecName() const;
2020-05-11 22:33:10 +08:00
/**
*
*/
TrackType getTrackType() const;
2018-10-23 11:09:21 +08:00
};
2018-10-27 22:54:16 +08:00
/**
 * Abstract media frame: the payload accessors of toolkit::Buffer combined
 * with the codec identity of CodecInfo, plus timestamps and classification
 * queries.
 */
class Frame : public toolkit::Buffer, public CodecInfo {
public:
    using Ptr = std::shared_ptr<Frame>;

    virtual ~Frame() = default;

    /**
     * @return decoding timestamp
     */
    virtual uint64_t dts() const = 0;

    /**
     * @return presentation timestamp; unless overridden it equals dts()
     */
    virtual uint64_t pts() const { return dts(); }

    /**
     * @return length in bytes of the prefix that precedes the payload, e.g. 4
     *         for an H.264 start code 0x00 00 00 01, or 7 bytes for an AAC prefix
     */
    virtual size_t prefixSize() const = 0;

    /**
     * @return true when this is a key frame
     */
    virtual bool keyFrame() const = 0;

    /**
     * @return true when this is a configuration frame (SPS / PPS / VPS)
     */
    virtual bool configFrame() const = 0;

    /**
     * @return true when the frame can be cached; defaults to true
     */
    virtual bool cacheAble() const { return true; }

    /**
     * @return true when the frame may be dropped (e.g. SEI / AUD frames);
     *         defaults to false
     */
    virtual bool dropAble() const { return false; }

    /**
     * @return true when the frame can be decoded. Every non-video frame is
     *         decodable; a video frame is decodable unless it is a
     *         configuration frame (SPS / PPS cannot be decoded).
     */
    virtual bool decodeAble() const {
        return getTrackType() != TrackVideo || !configFrame();
    }

    /**
     * Obtain a cacheable frame for the given frame (defined out of line).
     * @param frame source frame
     * @return a frame that can be cached
     */
    static Ptr getCacheAbleFrame(const Ptr &frame);

private:
    // Per-class object counter.
    toolkit::ObjectStatistic<Frame> _statistic;
};
2020-05-11 22:33:10 +08:00
class FrameImp : public Frame {
public:
2021-02-05 11:51:16 +08:00
using Ptr = std::shared_ptr<FrameImp>;
template <typename C = FrameImp>
2021-09-02 10:56:21 +08:00
static std::shared_ptr<C> create() {
#if 0
static ResourcePool<C> packet_pool;
static onceToken token([]() {
packet_pool.setSize(1024);
});
2022-01-06 14:30:44 +08:00
auto ret = packet_pool.obtain2();
2021-09-02 10:56:21 +08:00
ret->_buffer.clear();
ret->_prefix_size = 0;
ret->_dts = 0;
ret->_pts = 0;
return ret;
#else
return std::shared_ptr<C>(new C());
#endif
}
2020-05-11 22:33:10 +08:00
char *data() const override { return (char *)_buffer.data(); }
size_t size() const override { return _buffer.size(); }
2022-08-08 17:13:39 +08:00
uint64_t dts() const override { return _dts; }
uint64_t pts() const override { return _pts ? _pts : _dts; }
size_t prefixSize() const override { return _prefix_size; }
CodecId getCodecId() const override { return _codec_id; }
bool keyFrame() const override { return false; }
bool configFrame() const override { return false; }
2020-05-11 22:33:10 +08:00
public:
2020-08-01 10:22:12 +08:00
CodecId _codec_id = CodecInvalid;
2022-08-08 17:13:39 +08:00
uint64_t _dts = 0;
uint64_t _pts = 0;
size_t _prefix_size = 0;
toolkit::BufferLikeString _buffer;
2021-02-05 16:49:11 +08:00
private:
2021-01-23 09:44:37 +08:00
//对象个数统计
toolkit::ObjectStatistic<FrameImp> _statistic;
2021-02-05 11:51:16 +08:00
protected:
friend class toolkit::ResourcePool_l<FrameImp>;
2021-02-05 11:51:16 +08:00
FrameImp() = default;
2020-05-11 22:33:10 +08:00
};
/**
 * Sub-frame view into a compound frame.
 * One Frame may carry several frames separated by a 0x 00 00 01 prefix;
 * ZLMediaKit splits such a compound frame into single frames before
 * processing them. This class represents one of those single frames: it
 * takes its timestamps from the parent frame and holds a reference to it.
 */
template <typename Parent>
class FrameInternal : public Parent {
public:
    using Ptr = std::shared_ptr<FrameInternal>;

    /**
     * @param parent_frame compound frame the data belongs to
     * @param ptr start of the sub-frame data
     * @param size size of the sub-frame data in bytes
     * @param prefix_size prefix length of the sub-frame
     */
    FrameInternal(const Frame::Ptr &parent_frame, char *ptr, size_t size, size_t prefix_size)
        : Parent(ptr, size, parent_frame->dts(), parent_frame->pts(), prefix_size)
        , _parent_frame(parent_frame) {}

    // Cacheability is whatever the parent frame reports.
    bool cacheAble() const override { return _parent_frame->cacheAble(); }

private:
    Frame::Ptr _parent_frame;
};
/**
* Frame类中可以有多个帧(AAC)
* ZLMediaKit会先把这种复合帧split成单个帧然后再处理
* Frame
*
*/
template <typename Parent>
class FrameTSInternal : public Parent {
public:
2022-12-02 14:43:06 +08:00
using Ptr = std::shared_ptr<FrameTSInternal>;
FrameTSInternal(
2022-08-08 17:13:39 +08:00
const Frame::Ptr &parent_frame, char *ptr, size_t size, size_t prefix_size, uint64_t dts, uint64_t pts)
: Parent(ptr, size, dts, pts, prefix_size) {
_parent_frame = parent_frame;
}
bool cacheAble() const override { return _parent_frame->cacheAble(); }
private:
Frame::Ptr _parent_frame;
};
2018-10-27 22:54:16 +08:00
/**
2020-05-11 22:33:10 +08:00
*
2018-10-27 22:54:16 +08:00
*/
class FrameWriterInterface {
2018-10-26 16:09:48 +08:00
public:
2022-12-02 14:43:06 +08:00
using Ptr = std::shared_ptr<FrameWriterInterface>;
FrameWriterInterface() = default;
virtual ~FrameWriterInterface() = default;
2020-05-11 22:33:10 +08:00
2018-10-26 16:09:48 +08:00
/**
2020-05-11 22:33:10 +08:00
*
*/
virtual bool inputFrame(const Frame::Ptr &frame) = 0;
2022-10-16 19:49:56 +08:00
/**
* frame缓存
*/
virtual void flush() {};
2018-10-26 16:09:48 +08:00
};
2018-10-27 22:54:16 +08:00
/**
*
*/
2019-12-25 20:07:42 +08:00
class FrameDispatcher : public FrameWriterInterface {
2018-10-23 22:16:54 +08:00
public:
2022-05-25 15:38:32 +08:00
using Ptr = std::shared_ptr<FrameDispatcher>;
FrameDispatcher() = default;
~FrameDispatcher() override = default;
2018-10-23 22:16:54 +08:00
2020-05-11 22:33:10 +08:00
/**
*
*/
2022-11-01 16:52:52 +08:00
FrameWriterInterface* addDelegate(FrameWriterInterface::Ptr delegate) {
std::lock_guard<std::mutex> lck(_mtx);
2022-11-01 16:52:52 +08:00
return _delegates.emplace(delegate.get(), std::move(delegate)).first->second.get();
2018-10-23 22:16:54 +08:00
}
2022-11-01 16:52:52 +08:00
FrameWriterInterface* addDelegate(std::function<bool(const Frame::Ptr &frame)> cb);
2020-05-11 22:33:10 +08:00
/**
*
*/
2022-05-25 15:38:32 +08:00
void delDelegate(FrameWriterInterface *ptr) {
std::lock_guard<std::mutex> lck(_mtx);
2022-05-25 15:38:32 +08:00
_delegates.erase(ptr);
2018-10-23 22:16:54 +08:00
}
/**
2020-05-11 22:33:10 +08:00
*
2018-10-23 22:16:54 +08:00
*/
2022-05-25 15:38:32 +08:00
bool inputFrame(const Frame::Ptr &frame) override {
std::lock_guard<std::mutex> lck(_mtx);
++_frames;
if (frame->keyFrame() && frame->getTrackType() == TrackVideo) {
++_video_key_frames;
}
bool ret = false;
2022-05-25 15:38:32 +08:00
for (auto &pr : _delegates) {
if (pr.second->inputFrame(frame)) {
ret = true;
}
2020-04-06 21:44:32 +08:00
}
return ret;
2020-05-11 22:33:10 +08:00
}
2020-04-06 21:44:32 +08:00
2020-05-11 22:33:10 +08:00
/**
*
*/
size_t size() const {
2022-05-25 15:38:32 +08:00
std::lock_guard<std::mutex> lck(_mtx);
return _delegates.size();
2018-10-23 22:16:54 +08:00
}
2022-05-25 15:38:32 +08:00
void clear() {
std::lock_guard<std::mutex> lck(_mtx);
_delegates.clear();
}
/**
*
*/
uint64_t getVideoKeyFrames() const {
std::lock_guard<std::mutex> lck(_mtx);
return _video_key_frames;
}
/**
*
*/
uint64_t getFrames() const {
std::lock_guard<std::mutex> lck(_mtx);
return _frames;
}
2018-10-23 22:16:54 +08:00
private:
uint64_t _frames = 0;
uint64_t _video_key_frames = 0;
2022-05-25 15:38:32 +08:00
mutable std::mutex _mtx;
std::map<void *, FrameWriterInterface::Ptr> _delegates;
2018-10-23 22:16:54 +08:00
};
2019-07-25 09:38:16 +08:00
/**
* Frame接口包装指针便使ZLMediaKit
*/
class FrameFromPtr : public Frame {
2018-10-26 16:09:48 +08:00
public:
2022-12-02 14:43:06 +08:00
using Ptr = std::shared_ptr<FrameFromPtr>;
2020-08-08 12:19:04 +08:00
FrameFromPtr(
2022-08-08 17:13:39 +08:00
CodecId codec_id, char *ptr, size_t size, uint64_t dts, uint64_t pts = 0, size_t prefix_size = 0,
bool is_key = false)
: FrameFromPtr(ptr, size, dts, pts, prefix_size, is_key) {
2020-08-01 10:22:12 +08:00
_codec_id = codec_id;
2020-08-08 12:19:04 +08:00
}
2022-08-08 17:13:39 +08:00
FrameFromPtr(char *ptr, size_t size, uint64_t dts, uint64_t pts = 0, size_t prefix_size = 0, bool is_key = false) {
2020-08-01 10:22:12 +08:00
_ptr = ptr;
_size = size;
_dts = dts;
_pts = pts;
_prefix_size = prefix_size;
_is_key = is_key;
2020-08-01 10:22:12 +08:00
}
char *data() const override { return _ptr; }
size_t size() const override { return _size; }
2022-08-08 17:13:39 +08:00
uint64_t dts() const override { return _dts; }
uint64_t pts() const override { return _pts ? _pts : dts(); }
size_t prefixSize() const override { return _prefix_size; }
bool cacheAble() const override { return false; }
bool keyFrame() const override { return _is_key; }
bool configFrame() const override { return false; }
void setCodecId(CodecId codec_id) { _codec_id = codec_id; }
2020-08-01 10:22:12 +08:00
2020-08-08 12:19:04 +08:00
CodecId getCodecId() const override {
if (_codec_id == CodecInvalid) {
throw std::invalid_argument("FrameFromPtr对象未设置codec类型");
}
2020-08-01 10:22:12 +08:00
return _codec_id;
}
protected:
FrameFromPtr() = default;
2020-08-01 10:22:12 +08:00
2019-07-25 09:38:16 +08:00
protected:
bool _is_key;
2019-07-25 09:38:16 +08:00
char *_ptr;
2022-08-08 17:13:39 +08:00
uint64_t _dts;
uint64_t _pts = 0;
size_t _size;
size_t _prefix_size;
2020-08-01 10:22:12 +08:00
CodecId _codec_id = CodecInvalid;
2019-07-25 09:38:16 +08:00
};
/**
 * Frame that is always cacheable. A cacheable source frame is referenced
 * directly; the payload of a non-cacheable source frame is copied into an
 * owned FrameImp. The classification flags are captured at construction time.
 */
class FrameCacheAble : public FrameFromPtr {
public:
    using Ptr = std::shared_ptr<FrameCacheAble>;

    /**
     * @param frame source frame
     * @param force_key_frame when true, keyFrame() reports true regardless of
     *        what the source frame says
     */
    FrameCacheAble(const Frame::Ptr &frame, bool force_key_frame = false) {
        if (!frame->cacheAble()) {
            // The source data may not outlive this call: take a private copy.
            _buffer = FrameImp::create();
            _buffer->_buffer.assign(frame->data(), frame->size());
            _ptr = _buffer->data();
        } else {
            // Keep the source frame alive and point straight at its data.
            _frame = frame;
            _ptr = frame->data();
        }
        _size = frame->size();
        _dts = frame->dts();
        _pts = frame->pts();
        _prefix_size = frame->prefixSize();
        _codec_id = frame->getCodecId();
        _key = force_key_frame || frame->keyFrame();
        _config = frame->configFrame();
        _drop_able = frame->dropAble();
        _decode_able = frame->decodeAble();
    }

    ~FrameCacheAble() override = default;

    /**
     * @return always true
     */
    bool cacheAble() const override { return true; }
    bool keyFrame() const override { return _key; }
    bool configFrame() const override { return _config; }
    bool dropAble() const override { return _drop_able; }
    bool decodeAble() const override { return _decode_able; }

private:
    bool _key;
    bool _config;
    bool _drop_able;
    bool _decode_able;
    // Set when the source frame was cacheable and is referenced directly.
    Frame::Ptr _frame;
    // Set when the source data had to be copied.
    FrameImp::Ptr _buffer;
};
//该类实现frame级别的时间戳覆盖
class FrameStamp : public Frame {
public:
using Ptr = std::shared_ptr<FrameStamp>;
FrameStamp(Frame::Ptr frame, Stamp &stamp, bool modify_stamp);
~FrameStamp() override {}
2022-08-08 17:13:39 +08:00
uint64_t dts() const override { return (uint64_t)_dts; }
uint64_t pts() const override { return (uint64_t)_pts; }
size_t prefixSize() const override { return _frame->prefixSize(); }
bool keyFrame() const override { return _frame->keyFrame(); }
bool configFrame() const override { return _frame->configFrame(); }
bool cacheAble() const override { return _frame->cacheAble(); }
bool dropAble() const override { return _frame->dropAble(); }
bool decodeAble() const override { return _frame->decodeAble(); }
char *data() const override { return _frame->data(); }
size_t size() const override { return _frame->size(); }
CodecId getCodecId() const override { return _frame->getCodecId(); }
private:
int64_t _dts;
int64_t _pts;
Frame::Ptr _frame;
};
2020-09-21 14:56:58 +08:00
/**
* Buffer对象转换成可缓存的Frame对象
*/
template <typename Parent>
class FrameWrapper : public Parent {
2020-09-21 14:56:58 +08:00
public:
~FrameWrapper() = default;
/**
* frame
* @param buf
* @param dts
* @param pts
* @param prefix
* @param offset buffer有效数据偏移量
*/
2022-08-08 17:13:39 +08:00
FrameWrapper(toolkit::Buffer::Ptr buf, uint64_t dts, uint64_t pts, size_t prefix, size_t offset)
: Parent(buf->data() + offset, buf->size() - offset, dts, pts, prefix) {
_buf = std::move(buf);
2020-09-21 14:56:58 +08:00
}
/**
* frame
* @param buf
* @param dts
* @param pts
* @param prefix
* @param offset buffer有效数据偏移量
* @param codec
*/
2022-08-08 17:13:39 +08:00
FrameWrapper(toolkit::Buffer::Ptr buf, uint64_t dts, uint64_t pts, size_t prefix, size_t offset, CodecId codec)
: Parent(codec, buf->data() + offset, buf->size() - offset, dts, pts, prefix) {
_buf = std::move(buf);
2020-09-21 14:56:58 +08:00
}
/**
*
*/
bool cacheAble() const override { return true; }
2020-09-21 14:56:58 +08:00
private:
toolkit::Buffer::Ptr _buf;
2020-09-21 14:56:58 +08:00
};
2021-04-26 18:26:07 +08:00
/**
* frame
*/
class FrameMerger {
public:
2022-08-08 17:13:39 +08:00
using onOutput = std::function<void(uint64_t dts, uint64_t pts, const toolkit::Buffer::Ptr &buffer, bool have_key_frame)>;
2021-06-29 17:42:32 +08:00
using Ptr = std::shared_ptr<FrameMerger>;
2021-04-26 18:26:07 +08:00
enum {
none = 0,
h264_prefix,
mp4_nal_size,
};
FrameMerger(int type);
~FrameMerger() = default;
2022-10-16 19:49:56 +08:00
/**
* FrameMerger::inputFrame传入的onOutput回调
*
*/
void flush();
2021-04-26 18:26:07 +08:00
void clear();
2022-10-16 19:49:56 +08:00
bool inputFrame(const Frame::Ptr &frame, onOutput cb, toolkit::BufferLikeString *buffer = nullptr);
2021-04-26 18:26:07 +08:00
private:
bool willFlush(const Frame::Ptr &frame) const;
void doMerge(toolkit::BufferLikeString &buffer, const Frame::Ptr &frame) const;
2021-04-26 18:26:07 +08:00
private:
int _type;
bool _have_decode_able_frame = false;
2022-10-16 19:49:56 +08:00
onOutput _cb;
toolkit::List<Frame::Ptr> _frame_cache;
2021-04-26 18:26:07 +08:00
};
} // namespace mediakit
#endif // ZLMEDIAKIT_FRAME_H