Use lambda to capture video decode result

This commit is contained in:
dijunkun
2023-09-14 17:32:33 +08:00
parent df686461a5
commit caf46a33bf
8 changed files with 481 additions and 18 deletions

View File

@@ -8,6 +8,17 @@ VideoFrame::VideoFrame(const uint8_t *buffer, size_t size) {
buffer_ = new uint8_t[size]; buffer_ = new uint8_t[size];
memcpy(buffer_, buffer, size); memcpy(buffer_, buffer, size);
size_ = size; size_ = size;
width_ = 0;
height_ = 0;
}
VideoFrame::VideoFrame(const uint8_t *buffer, size_t size, size_t width,
size_t height) {
buffer_ = new uint8_t[size];
memcpy(buffer_, buffer, size);
size_ = size;
width_ = width;
height_ = height;
} }
VideoFrame::VideoFrame(const VideoFrame &video_frame) { VideoFrame::VideoFrame(const VideoFrame &video_frame) {
@@ -15,14 +26,20 @@ VideoFrame::VideoFrame(const VideoFrame &video_frame) {
buffer_ = new uint8_t[video_frame.size_]; buffer_ = new uint8_t[video_frame.size_];
memcpy(buffer_, video_frame.buffer_, video_frame.size_); memcpy(buffer_, video_frame.buffer_, video_frame.size_);
size_ = video_frame.size_; size_ = video_frame.size_;
width_ = video_frame.width_;
height_ = video_frame.height_;
} }
} }
VideoFrame::VideoFrame(VideoFrame &&video_frame) VideoFrame::VideoFrame(VideoFrame &&video_frame)
: buffer_((uint8_t *)std::move(video_frame.buffer_)), : buffer_((uint8_t *)std::move(video_frame.buffer_)),
size_(video_frame.size_) { size_(video_frame.size_),
width_(video_frame.width_),
height_(video_frame.height_) {
video_frame.buffer_ = nullptr; video_frame.buffer_ = nullptr;
video_frame.size_ = 0; video_frame.size_ = 0;
video_frame.width_ = 0;
video_frame.height_ = 0;
} }
VideoFrame &VideoFrame::operator=(const VideoFrame &video_frame) { VideoFrame &VideoFrame::operator=(const VideoFrame &video_frame) {
@@ -34,6 +51,8 @@ VideoFrame &VideoFrame::operator=(const VideoFrame &video_frame) {
buffer_ = new uint8_t[video_frame.size_]; buffer_ = new uint8_t[video_frame.size_];
memcpy(buffer_, video_frame.buffer_, video_frame.size_); memcpy(buffer_, video_frame.buffer_, video_frame.size_);
size_ = video_frame.size_; size_ = video_frame.size_;
width_ = video_frame.width_;
height_ = video_frame.height_;
} }
return *this; return *this;
} }
@@ -44,6 +63,10 @@ VideoFrame &VideoFrame::operator=(VideoFrame &&video_frame) {
video_frame.buffer_ = nullptr; video_frame.buffer_ = nullptr;
size_ = video_frame.size_; size_ = video_frame.size_;
video_frame.size_ = 0; video_frame.size_ = 0;
width_ = video_frame.width_;
video_frame.width_ = 0;
height_ = video_frame.height_;
video_frame.height_ = 0;
} }
return *this; return *this;
} }
@@ -55,4 +78,6 @@ VideoFrame::~VideoFrame() {
} }
size_ = 0; size_ = 0;
width_ = 0;
height_ = 0;
} }

View File

@@ -7,6 +7,7 @@ class VideoFrame {
public: public:
VideoFrame(); VideoFrame();
VideoFrame(const uint8_t *buffer, size_t size); VideoFrame(const uint8_t *buffer, size_t size);
VideoFrame(const uint8_t *buffer, size_t size, size_t width, size_t height);
VideoFrame(const VideoFrame &video_frame); VideoFrame(const VideoFrame &video_frame);
VideoFrame(VideoFrame &&video_frame); VideoFrame(VideoFrame &&video_frame);
VideoFrame &operator=(const VideoFrame &video_frame); VideoFrame &operator=(const VideoFrame &video_frame);

View File

@@ -0,0 +1,358 @@
#include "ffmpeg_decoder.h"
#include "log.h"
const char H264_NAL_START[] = {0x00, 0x00, 0x00, 0x01};
VideoDecoder::VideoDecoder(PacketQueue *packetQueue) {
pPacketQueue = packetQueue;
pFrameDataCallbackMutex = (pthread_mutex_t *)malloc(sizeof(pthread_mutex_t));
int ret = pthread_mutex_init(pFrameDataCallbackMutex, nullptr);
if (ret != 0) {
LOG_ERROR("video FrameDataCallbackMutex init failed.\n");
}
gSPSLen = 0;
pSPS = nullptr;
gPPSLen = 0;
pPPS = nullptr;
isFirstIDR = false;
gFrameRate = 25;
pFrameDataCallback = nullptr;
}
VideoDecoder::~VideoDecoder() {
pthread_mutex_destroy(pFrameDataCallbackMutex);
if (nullptr != pFrameDataCallbackMutex) {
free(pFrameDataCallbackMutex);
pFrameDataCallbackMutex = nullptr;
}
}
void VideoDecoder::setFrameDataCallback(FrameDataCallback *frameDataCallback) {
pthread_mutex_lock(pFrameDataCallbackMutex);
pFrameDataCallback = frameDataCallback;
pthread_mutex_unlock(pFrameDataCallbackMutex);
}
void VideoDecoder::close() {
isDecoding = false;
pthread_join(decodeThread, nullptr);
if (pSPS != nullptr) {
free(pSPS);
pSPS = nullptr;
}
if (pPPS != nullptr) {
free(pPPS);
pPPS = nullptr;
}
if (pFrame != nullptr) {
av_frame_free(&pFrame);
LOG_INFO("%s video Frame free", __FUNCTION__);
}
if (pVideoAVCodecCtx != nullptr) {
avcodec_free_context(&pVideoAVCodecCtx);
LOG_INFO("%s video avcodec_free_context", __FUNCTION__);
}
}
bool VideoDecoder::open(unsigned int frameRate, unsigned int profile,
unsigned int level, char *sps, unsigned int spsLen,
char *pps, unsigned int ppsLen) {
gSPSLen = 0;
pSPS = nullptr;
gPPSLen = 0;
pPPS = nullptr;
LOG_INFO("%s spsLen=%d ppsLen=%d", __FUNCTION__, spsLen, ppsLen);
if (spsLen > 0) {
pSPS = (char *)malloc(spsLen);
if (nullptr == pSPS) {
return false;
}
memcpy(pSPS, sps, spsLen);
gSPSLen = spsLen;
}
if (ppsLen > 0) {
pPPS = (char *)malloc(ppsLen);
if (nullptr == pPPS) {
free(pSPS);
return false;
}
memcpy(pPPS, pps, ppsLen);
gPPSLen = ppsLen;
}
isFirstIDR = false;
if (frameRate > 0) {
gFrameRate = frameRate;
}
int ret;
AVCodec *dec = avcodec_find_decoder(AV_CODEC_ID_H264);
LOG_INFO("%s video decoder name: %s", __FUNCTION__, dec->name);
pVideoAVCodecCtx = avcodec_alloc_context3(dec);
if (pVideoAVCodecCtx == nullptr) {
LOG_ERROR("%s VideoAVCodecCtx alloc failed", __FUNCTION__);
return false;
}
AVCodecParameters *par = avcodec_parameters_alloc();
if (par == nullptr) {
LOG_ERROR("%s video AVCodecParameters alloc failed", __FUNCTION__);
free(pSPS);
free(pPPS);
avcodec_free_context(&pVideoAVCodecCtx);
return false;
}
par->codec_type = AVMEDIA_TYPE_VIDEO;
par->codec_id = AV_CODEC_ID_H264;
par->format = AV_PIX_FMT_YUV420P; // AV_PIX_FMT_NV12
par->color_range = AVCOL_RANGE_JPEG;
if (profile != 0) {
par->profile = (int)profile;
}
if (level != 0) {
par->level = (int)level;
}
avcodec_parameters_to_context(pVideoAVCodecCtx, par);
avcodec_parameters_free(&par);
LOG_INFO("%s profile=%d level=%d", __FUNCTION__, profile, level);
ret = avcodec_open2(pVideoAVCodecCtx, dec, nullptr);
if (ret < 0) {
LOG_ERROR("%s Can not open video encoder", __FUNCTION__);
free(pSPS);
free(pPPS);
avcodec_free_context(&pVideoAVCodecCtx);
return false;
}
LOG_INFO("%s avcodec_open2 video SUCC", __FUNCTION__);
pFrame = av_frame_alloc();
if (pFrame == nullptr) {
LOG_ERROR("%s video av_frame_alloc failed", __FUNCTION__);
free(pSPS);
free(pPPS);
avcodec_free_context(&pVideoAVCodecCtx);
return false;
}
isDecoding = true;
ret = pthread_create(&decodeThread, nullptr, &VideoDecoder::_decode,
(void *)this);
if (ret != 0) {
LOG_ERROR("video decode-thread create failed.\n");
isDecoding = false;
free(pSPS);
free(pPPS);
avcodec_free_context(&pVideoAVCodecCtx);
av_frame_free(&pFrame);
return false;
}
return true;
}
void VideoDecoder::decode() {
int ret;
unsigned sleepDelta = 1000000 / gFrameRate / 4; // 一帧视频的 1/4
int NAL_START_LEN = 4;
while (isDecoding) {
AVPacket *pkt = av_packet_alloc();
if (pkt == nullptr) {
usleep(sleepDelta);
continue;
}
if (pPacketQueue == nullptr) {
av_packet_free(&pkt);
usleep(sleepDelta);
continue;
}
PACKET_STRUCT *packetStruct;
bool isDone = pPacketQueue->Take(packetStruct);
if (isDone && packetStruct != nullptr && packetStruct->data != nullptr &&
packetStruct->data_size > 0) {
// 0x67:sps
if (packetStruct->data[0] == 0x67) {
if (gSPSLen <= 0) {
gSPSLen = packetStruct->data_size;
pSPS = (char *)malloc(gSPSLen);
if (nullptr == pSPS) {
av_packet_free(&pkt);
free(packetStruct->data);
free(packetStruct);
usleep(sleepDelta);
continue;
}
memcpy(pSPS, packetStruct->data, gSPSLen);
LOG_INFO("%s get sps spsLen=%d", __FUNCTION__, gSPSLen);
}
av_packet_free(&pkt);
free(packetStruct->data);
free(packetStruct);
continue;
}
// 0x68:pps
if (packetStruct->data[0] == 0x68) {
if (gPPSLen <= 0) {
gPPSLen = packetStruct->data_size;
pPPS = (char *)malloc(gPPSLen);
if (nullptr == pPPS) {
av_packet_free(&pkt);
free(packetStruct->data);
free(packetStruct);
usleep(sleepDelta);
continue;
}
memcpy(pPPS, packetStruct->data, gPPSLen);
LOG_INFO("%s get pps ppsLen=%d", __FUNCTION__, gPPSLen);
}
av_packet_free(&pkt);
free(packetStruct->data);
free(packetStruct);
continue;
}
if (!isFirstIDR) {
// 0x65:IDR
if (packetStruct->data[0] == 0x65) {
isFirstIDR = true;
LOG_INFO("%s get first idr.", __FUNCTION__);
} else {
av_packet_free(&pkt);
free(packetStruct->data);
free(packetStruct);
continue;
}
}
if (packetStruct->data[0] == 0x65 && gSPSLen > 0 && gPPSLen > 0) {
ret = av_new_packet(
pkt, (int)(NAL_START_LEN + gSPSLen + NAL_START_LEN + gPPSLen +
packetStruct->data_size + NAL_START_LEN));
} else {
ret = av_new_packet(pkt, packetStruct->data_size + NAL_START_LEN);
}
if (ret < 0) {
av_packet_free(&pkt);
free(packetStruct->data);
free(packetStruct);
usleep(sleepDelta);
continue;
}
} else {
av_packet_free(&pkt);
usleep(sleepDelta);
continue;
}
if (packetStruct->data[0] == 0x65 && gSPSLen > 0 && gPPSLen > 0) {
int pos = 0;
// 复制 0x 00 00 00 01
memcpy(pkt->data + pos, H264_NAL_START, NAL_START_LEN);
pos += NAL_START_LEN;
memcpy(pkt->data + pos, pSPS, gSPSLen);
pos += (int)gSPSLen;
memcpy(pkt->data + pos, H264_NAL_START, NAL_START_LEN);
pos += NAL_START_LEN;
memcpy(pkt->data + pos, pPPS, gPPSLen);
pos += (int)gPPSLen;
memcpy(pkt->data + pos, H264_NAL_START, NAL_START_LEN);
pos += NAL_START_LEN;
memcpy(pkt->data + pos, packetStruct->data, packetStruct->data_size);
} else {
memcpy(pkt->data, H264_NAL_START, NAL_START_LEN);
memcpy(pkt->data + NAL_START_LEN, packetStruct->data,
packetStruct->data_size);
}
pkt->pts = packetStruct->timestamp;
pkt->dts = packetStruct->timestamp;
free(packetStruct->data);
free(packetStruct);
/* send the packet for decoding */
ret = avcodec_send_packet(pVideoAVCodecCtx, pkt);
// LOGD("%s send the video packet for decoding pkt size=%d", __FUNCTION__,
// pkt->size);
av_packet_unref(pkt);
av_packet_free(&pkt);
if (ret < 0) {
LOG_ERROR("%s Error sending the video pkt to the decoder ret=%d",
__FUNCTION__, ret);
usleep(sleepDelta);
continue;
} else {
// 编码和解码都是一样的都是send 1次然后receive多次,
// 直到AVERROR(EAGAIN)或者AVERROR_EOF
while (ret >= 0) {
ret = avcodec_receive_frame(pVideoAVCodecCtx, pFrame);
if (ret == AVERROR(EAGAIN) || ret == AVERROR_EOF) {
usleep(sleepDelta);
continue;
} else if (ret < 0) {
LOG_ERROR("%s Error receive decoding video frame ret=%d",
__FUNCTION__, ret);
usleep(sleepDelta);
continue;
}
pthread_mutex_lock(pFrameDataCallbackMutex);
if (pFrameDataCallback != nullptr) {
// 解码固定为 AV_PIX_FMT_YUV420P
int planeNum = 3;
int yuvLens[planeNum];
yuvLens[0] = pFrame->linesize[0] * pFrame->height;
yuvLens[1] = pFrame->linesize[1] * pFrame->height / 2;
yuvLens[2] = pFrame->linesize[2] * pFrame->height / 2;
// LOG_INFO("%s video onDataArrived", __FUNCTION__);
pFrameDataCallback->onDataArrived(
StreamType::VIDEO, (long long)pFrame->pts, (char **)pFrame->data,
yuvLens, planeNum, -1, -1, pFrame->width, pFrame->height);
}
pthread_mutex_unlock(pFrameDataCallbackMutex);
av_frame_unref(pFrame);
}
}
}
}

View File

@@ -0,0 +1,57 @@
#ifndef _FFMPEG_DECODER_H_
#define _FFMPEG_DECODER_H_
extern "C" {
// 编解码
#include "libavcodec/avcodec.h"
}
#include "PacketQueue.h"
#include "cb/FrameDataCallback.h"
class VideoDecoder {
public:
VideoDecoder(PacketQueue *packetQueue);
~VideoDecoder();
public:
int Init();
int Decode(const uint8_t *pData, int nSize);
int GetFrame(uint8_t *yuv_data, uint32_t &width, uint32_t &height,
uint32_t &size);
bool open(unsigned int frameRate, unsigned int profile, unsigned int level,
char *sps, unsigned int spsLen, char *pps, unsigned int ppsLen);
void close();
void decode();
static void *_decode(void *self) {
static_cast<VideoDecoder *>(self)->decode();
return nullptr;
}
void setFrameDataCallback(FrameDataCallback *frameDataCallback);
private:
PacketQueue *pPacketQueue;
AVCodecContext *pVideoAVCodecCtx;
AVFrame *pFrame;
bool volatile isDecoding;
pthread_t decodeThread;
pthread_mutex_t *pFrameDataCallbackMutex;
FrameDataCallback *pFrameDataCallback;
char *pSPS;
unsigned int volatile gSPSLen;
char *pPPS;
unsigned int volatile gPPSLen;
bool volatile isFirstIDR;
unsigned int gFrameRate;
};
#endif

View File

@@ -43,7 +43,9 @@ int VideoDecoder::Init() {
return 0; return 0;
} }
int VideoDecoder::Decode(const uint8_t *pData, int nSize) { int VideoDecoder::Decode(
const uint8_t *pData, int nSize,
std::function<void(VideoFrame)> on_receive_decoded_frame) {
if (!decoder) { if (!decoder) {
return -1; return -1;
} }
@@ -56,8 +58,26 @@ int VideoDecoder::Decode(const uint8_t *pData, int nSize) {
fwrite((unsigned char *)pData, 1, nSize, file_); fwrite((unsigned char *)pData, 1, nSize, file_);
} }
int ret = decoder->Decode(pData, nSize); int num_frame_returned = decoder->Decode(pData, nSize);
return ret;
for (size_t i = 0; i < num_frame_returned; ++i) {
cudaVideoSurfaceFormat format = decoder->GetOutputFormat();
if (format == cudaVideoSurfaceFormat_NV12) {
uint8_t *data = nullptr;
data = decoder->GetFrame();
if (data) {
VideoFrame decoded_frame(
data, decoder->GetWidth() * decoder->GetHeight() * 3 / 2,
decoder->GetWidth(), decoder->GetHeight());
if (on_receive_decoded_frame) {
on_receive_decoded_frame(decoded_frame);
}
}
}
}
return -1;
} }
int VideoDecoder::GetFrame(uint8_t *yuv_data, uint32_t &width, uint32_t &height, int VideoDecoder::GetFrame(uint8_t *yuv_data, uint32_t &width, uint32_t &height,

View File

@@ -1,18 +1,24 @@
#ifndef _NV_DECODER_H_ #ifndef _NV_DECODER_H_
#define _NV_DECODER_H_ #define _NV_DECODER_H_
#include <functional>
#include "NvDecoder.h" #include "NvDecoder.h"
#include "frame.h"
class VideoDecoder { class VideoDecoder {
public: public:
VideoDecoder(); VideoDecoder();
~VideoDecoder(); ~VideoDecoder();
public:
int Init(); int Init();
int Decode(const uint8_t* pData, int nSize); int Decode(const uint8_t* pData, int nSize,
std::function<void(VideoFrame)> on_receive_decoded_frame);
int GetFrame(uint8_t* yuv_data, uint32_t& width, uint32_t& height, int GetFrame(uint8_t* yuv_data, uint32_t& width, uint32_t& height,
uint32_t& size); uint32_t& size);
private:
NvDecoder* decoder = nullptr; NvDecoder* decoder = nullptr;
bool get_first_keyframe_ = false; bool get_first_keyframe_ = false;
bool skip_frame_ = false; bool skip_frame_ = false;

View File

@@ -47,18 +47,14 @@ int PeerConnection::Init(PeerConnectionParams params,
on_receive_video_ = [this](const char *data, size_t size, const char *user_id, on_receive_video_ = [this](const char *data, size_t size, const char *user_id,
size_t user_id_size) { size_t user_id_size) {
int num_frame_returned = Decode((uint8_t *)data, size); int num_frame_returned = Decode(
uint32_t width = 0; (uint8_t *)data, size,
uint32_t height = 0; [this, user_id, user_id_size](VideoFrame video_frame) {
uint32_t frame_size = 0; if (on_receive_video_buffer_) {
for (size_t i = 0; i < num_frame_returned; ++i) { on_receive_video_buffer_((const char *)video_frame.Buffer(),
int ret = GetFrame((uint8_t *)nv12_data_, width, height, frame_size); video_frame.Size(), user_id, user_id_size);
}
if (on_receive_video_buffer_) { });
on_receive_video_buffer_(nv12_data_, width * height * 3 / 2, user_id,
user_id_size);
}
}
}; };
on_receive_audio_ = [this](const char *data, size_t size, const char *user_id, on_receive_audio_ = [this](const char *data, size_t size, const char *user_id,

View File

@@ -88,7 +88,7 @@ target("ws")
target("media") target("media")
set_kind("static") set_kind("static")
add_deps("log") add_deps("log", "frame")
add_packages("cuda") add_packages("cuda")
add_links("cuda", "nvencodeapi", "nvcuvid") add_links("cuda", "nvencodeapi", "nvcuvid")
add_files("src/media/video/encode/nvcodec/*.cpp", add_files("src/media/video/encode/nvcodec/*.cpp",