From caf46a33bf3c1d1ef38fce8ac732bc5ce37b3ddd Mon Sep 17 00:00:00 2001
From: dijunkun <junkun.di@hotmail.com>
Date: Thu, 14 Sep 2023 17:32:33 +0800
Subject: [PATCH] Use lambda to capture video decode result

---
 src/frame/frame.cpp                           |  27 +-
 src/frame/frame.h                             |   1 +
 .../video/decode/ffmpeg/ffmpeg_decoder.cpp    | 358 ++++++++++++++++++
 .../video/decode/ffmpeg/ffmpeg_decoder.h      |  57 +++
 src/media/video/decode/nvcodec/nv_decoder.cpp |  26 +-
 src/media/video/decode/nvcodec/nv_decoder.h   |   8 +-
 src/pc/peer_connection.cpp                    |  20 +-
 xmake.lua                                     |   2 +-
 8 files changed, 481 insertions(+), 18 deletions(-)
 create mode 100644 src/media/video/decode/ffmpeg/ffmpeg_decoder.cpp
 create mode 100644 src/media/video/decode/ffmpeg/ffmpeg_decoder.h

diff --git a/src/frame/frame.cpp b/src/frame/frame.cpp
index 43c7e1f..767a9f9 100644
--- a/src/frame/frame.cpp
+++ b/src/frame/frame.cpp
@@ -8,6 +8,17 @@ VideoFrame::VideoFrame(const uint8_t *buffer, size_t size) {
   buffer_ = new uint8_t[size];
   memcpy(buffer_, buffer, size);
   size_ = size;
+  width_ = 0;
+  height_ = 0;
+}
+
+VideoFrame::VideoFrame(const uint8_t *buffer, size_t size, size_t width,
+                       size_t height) {
+  buffer_ = new uint8_t[size];  // private copy: `size` bytes are duplicated
+  memcpy(buffer_, buffer, size);
+  size_ = size;
+  width_ = width;  // dimensions are stored as passed, not derived from size
+  height_ = height;
 }
 
 VideoFrame::VideoFrame(const VideoFrame &video_frame) {
@@ -15,14 +26,20 @@ VideoFrame::VideoFrame(const VideoFrame &video_frame) {
     buffer_ = new uint8_t[video_frame.size_];
     memcpy(buffer_, video_frame.buffer_, video_frame.size_);
     size_ = video_frame.size_;
+    width_ = video_frame.width_;
+    height_ = video_frame.height_;
   }
 }
 
 VideoFrame::VideoFrame(VideoFrame &&video_frame)
     : buffer_((uint8_t *)std::move(video_frame.buffer_)),
-      size_(video_frame.size_) {
+      size_(video_frame.size_),
+      width_(video_frame.width_),  // dimensions travel with the buffer
+      height_(video_frame.height_) {
   video_frame.buffer_ = nullptr;
   video_frame.size_ = 0;
+  video_frame.width_ = 0;  // source no longer describes the moved buffer
+  video_frame.height_ = 0;
 }
 
 VideoFrame &VideoFrame::operator=(const VideoFrame &video_frame) {
@@ -34,6 +51,8 @@ VideoFrame &VideoFrame::operator=(const VideoFrame &video_frame) {
     buffer_ = new uint8_t[video_frame.size_];
     memcpy(buffer_, video_frame.buffer_, video_frame.size_);
     size_ = video_frame.size_;
+    width_ = video_frame.width_;
+    height_ = video_frame.height_;
   }
   return *this;
 }
@@ -44,6 +63,10 @@ VideoFrame &VideoFrame::operator=(VideoFrame &&video_frame) {
     video_frame.buffer_ = nullptr;
     size_ = video_frame.size_;
     video_frame.size_ = 0;
+    width_ = video_frame.width_;
+    video_frame.width_ = 0;
+    height_ = video_frame.height_;
+    video_frame.height_ = 0;
   }
   return *this;
 }
@@ -55,4 +78,6 @@ VideoFrame::~VideoFrame() {
   }
 
   size_ = 0;
+  width_ = 0;
+  height_ = 0;
 }
\ No newline at end of file
diff --git a/src/frame/frame.h b/src/frame/frame.h
index 8404a56..265a85c 100644
--- a/src/frame/frame.h
+++ b/src/frame/frame.h
@@ -7,6 +7,7 @@ class VideoFrame {
  public:
   VideoFrame();
   VideoFrame(const uint8_t *buffer, size_t size);
+  VideoFrame(const uint8_t *buffer, size_t size, size_t width, size_t height);
   VideoFrame(const VideoFrame &video_frame);
   VideoFrame(VideoFrame &&video_frame);
   VideoFrame &operator=(const VideoFrame &video_frame);
diff --git a/src/media/video/decode/ffmpeg/ffmpeg_decoder.cpp b/src/media/video/decode/ffmpeg/ffmpeg_decoder.cpp
new file mode 100644
index 0000000..89659f5
--- /dev/null
+++ b/src/media/video/decode/ffmpeg/ffmpeg_decoder.cpp
@@ -0,0 +1,358 @@
+#include "ffmpeg_decoder.h"
+
+#include "log.h"
+
+const char H264_NAL_START[] = {0x00, 0x00, 0x00, 0x01};  // 4-byte start code decode() writes before each NAL payload
+
+// Creates an idle decoder reading from packetQueue (stored, never freed here).
+// Every pointer close() tests (pSPS, pPPS, pFrame, pVideoAVCodecCtx) and the
+// isDecoding flag start in a defined state instead of holding garbage.
+VideoDecoder::VideoDecoder(PacketQueue *packetQueue) {
+  pPacketQueue = packetQueue;
+  pVideoAVCodecCtx = nullptr;
+  pFrame = nullptr;
+  isDecoding = false;
+  pFrameDataCallback = nullptr;
+  pSPS = nullptr;
+  gSPSLen = 0;
+  pPPS = nullptr;
+  gPPSLen = 0;
+  isFirstIDR = false;
+  gFrameRate = 25;  // fallback rate until open() supplies a non-zero one
+  pFrameDataCallbackMutex = (pthread_mutex_t *)malloc(sizeof(pthread_mutex_t));
+  if (nullptr == pFrameDataCallbackMutex ||
+      pthread_mutex_init(pFrameDataCallbackMutex, nullptr) != 0) {
+    LOG_ERROR("video FrameDataCallbackMutex init failed.\n");
+  }
+}
+
+VideoDecoder::~VideoDecoder() {
+  // Destroy the mutex only if it was allocated; the pointer comes from malloc.
+  if (nullptr != pFrameDataCallbackMutex) {
+    pthread_mutex_destroy(pFrameDataCallbackMutex);
+    free(pFrameDataCallbackMutex);
+    pFrameDataCallbackMutex = nullptr;
+  }
+}
+
+void VideoDecoder::setFrameDataCallback(FrameDataCallback *frameDataCallback) {
+  pthread_mutex_lock(pFrameDataCallbackMutex);  // same mutex decode() holds while invoking the callback
+  pFrameDataCallback = frameDataCallback;  // nullptr makes decode() skip delivery
+  pthread_mutex_unlock(pFrameDataCallbackMutex);
+}
+
+// Stops the decode thread and releases the SPS/PPS copies, the frame and the
+// codec context. The join is performed only while isDecoding is set, so a
+// second close() does not join an already-joined thread.
+void VideoDecoder::close() {
+  if (isDecoding) {
+    isDecoding = false;  // decode() polls this flag and leaves its loop
+    pthread_join(decodeThread, nullptr);
+  }
+
+  free(pSPS);  // free(nullptr) is a no-op
+  pSPS = nullptr;
+  gSPSLen = 0;  // decode() reads pSPS whenever this length is non-zero
+  free(pPPS);
+  pPPS = nullptr;
+  gPPSLen = 0;
+  if (pFrame != nullptr) {
+    av_frame_free(&pFrame);
+    LOG_INFO("%s video Frame free", __FUNCTION__);
+  }
+  if (pVideoAVCodecCtx != nullptr) {
+    avcodec_free_context(&pVideoAVCodecCtx);
+    LOG_INFO("%s video avcodec_free_context", __FUNCTION__);
+  }
+}
+
+// Opens the H.264 decoder and starts the decode thread. sps/pps are optional
+// (length 0 = not known yet) and are copied; frameRate 0 keeps the current
+// rate; profile/level are applied only when non-zero. Returns true once the
+// thread is running. On any failure everything acquired so far is released
+// and its pointer reset, so a later close() cannot free it a second time.
+bool VideoDecoder::open(unsigned int frameRate, unsigned int profile,
+                        unsigned int level, char *sps, unsigned int spsLen,
+                        char *pps, unsigned int ppsLen) {
+  // Single cleanup path shared by every error return below.
+  auto fail = [this]() {
+    free(pSPS);
+    pSPS = nullptr;
+    gSPSLen = 0;
+    free(pPPS);
+    pPPS = nullptr;
+    gPPSLen = 0;
+    av_frame_free(&pFrame);  // both FFmpeg calls accept a null object
+    avcodec_free_context(&pVideoAVCodecCtx);
+    return false;
+  };
+
+  gSPSLen = 0;
+  pSPS = nullptr;
+  gPPSLen = 0;
+  pPPS = nullptr;
+  pVideoAVCodecCtx = nullptr;
+  pFrame = nullptr;
+  isFirstIDR = false;
+  LOG_INFO("%s spsLen=%d ppsLen=%d", __FUNCTION__, spsLen, ppsLen);
+  if (spsLen > 0) {
+    pSPS = (sps != nullptr) ? (char *)malloc(spsLen) : nullptr;
+    if (nullptr == pSPS) {
+      return fail();
+    }
+    memcpy(pSPS, sps, spsLen);
+    gSPSLen = spsLen;
+  }
+  if (ppsLen > 0) {
+    pPPS = (pps != nullptr) ? (char *)malloc(ppsLen) : nullptr;
+    if (nullptr == pPPS) {
+      return fail();
+    }
+    memcpy(pPPS, pps, ppsLen);
+    gPPSLen = ppsLen;
+  }
+  if (frameRate > 0) {
+    gFrameRate = frameRate;
+  }
+
+  // avcodec_find_decoder() yields nullptr when no H.264 decoder is built in.
+  const AVCodec *dec = avcodec_find_decoder(AV_CODEC_ID_H264);
+  if (dec == nullptr) {
+    LOG_ERROR("%s H264 decoder not found", __FUNCTION__);
+    return fail();
+  }
+  LOG_INFO("%s video decoder name: %s", __FUNCTION__, dec->name);
+
+  pVideoAVCodecCtx = avcodec_alloc_context3(dec);
+  if (pVideoAVCodecCtx == nullptr) {
+    LOG_ERROR("%s VideoAVCodecCtx alloc failed", __FUNCTION__);
+    return fail();
+  }
+
+  AVCodecParameters *par = avcodec_parameters_alloc();
+  if (par == nullptr) {
+    LOG_ERROR("%s video AVCodecParameters alloc failed", __FUNCTION__);
+    return fail();
+  }
+  par->codec_type = AVMEDIA_TYPE_VIDEO;
+  par->codec_id = AV_CODEC_ID_H264;
+  par->format = AV_PIX_FMT_YUV420P;  // AV_PIX_FMT_NV12
+  par->color_range = AVCOL_RANGE_JPEG;
+  if (profile != 0) {
+    par->profile = (int)profile;
+  }
+  if (level != 0) {
+    par->level = (int)level;
+  }
+  int ret = avcodec_parameters_to_context(pVideoAVCodecCtx, par);
+  avcodec_parameters_free(&par);
+  if (ret < 0) {
+    LOG_ERROR("%s avcodec_parameters_to_context failed", __FUNCTION__);
+    return fail();
+  }
+  LOG_INFO("%s profile=%d level=%d", __FUNCTION__, profile, level);
+  ret = avcodec_open2(pVideoAVCodecCtx, dec, nullptr);
+  if (ret < 0) {
+    LOG_ERROR("%s Can not open video decoder", __FUNCTION__);
+    return fail();
+  }
+  LOG_INFO("%s avcodec_open2 video SUCC", __FUNCTION__);
+  pFrame = av_frame_alloc();
+  if (pFrame == nullptr) {
+    LOG_ERROR("%s video av_frame_alloc failed", __FUNCTION__);
+    return fail();
+  }
+
+  isDecoding = true;  // set before the thread starts, since decode() polls it
+  ret = pthread_create(&decodeThread, nullptr, &VideoDecoder::_decode,
+                       (void *)this);
+  if (ret != 0) {
+    LOG_ERROR("video decode-thread create failed.\n");
+    isDecoding = false;
+    return fail();
+  }
+  return true;
+}
+
+// Body of the decode thread (entered through _decode()). While isDecoding is
+// set it takes one NAL unit at a time from pPacketQueue, caches the first
+// SPS (0x67) and PPS (0x68), discards everything that precedes the first IDR
+// (0x65), prefixes the payload with H264_NAL_START (an IDR additionally gets
+// the cached SPS and PPS in front), sends it to the decoder and passes every
+// decoded frame to pFrameDataCallback while holding pFrameDataCallbackMutex.
+void VideoDecoder::decode() {
+  int ret;
+  unsigned sleepDelta = 1000000 / gFrameRate / 4;  // a quarter of one frame
+  int NAL_START_LEN = 4;
+
+  while (isDecoding) {
+    AVPacket *pkt = av_packet_alloc();
+    if (pkt == nullptr) {
+      usleep(sleepDelta);
+      continue;
+    }
+
+    if (pPacketQueue == nullptr) {
+      av_packet_free(&pkt);
+      usleep(sleepDelta);
+      continue;
+    }
+
+    // Start from nullptr so the test below never reads an indeterminate value.
+    PACKET_STRUCT *packetStruct = nullptr;
+    bool isDone = pPacketQueue->Take(packetStruct);
+    if (isDone && packetStruct != nullptr && packetStruct->data != nullptr &&
+        packetStruct->data_size > 0) {
+      // 0x67:sps
+      if (packetStruct->data[0] == 0x67) {
+        if (gSPSLen <= 0) {
+          pSPS = (char *)malloc(packetStruct->data_size);
+          if (nullptr == pSPS) {
+            av_packet_free(&pkt);
+            free(packetStruct->data);
+            free(packetStruct);
+            usleep(sleepDelta);
+            continue;
+          }
+          memcpy(pSPS, packetStruct->data, packetStruct->data_size);
+          // Record the length only once the copy exists; a non-zero gSPSLen is
+          // what the IDR path below relies on before reading pSPS.
+          gSPSLen = packetStruct->data_size;
+          LOG_INFO("%s get sps spsLen=%d", __FUNCTION__, gSPSLen);
+        }
+        av_packet_free(&pkt);
+        free(packetStruct->data);
+        free(packetStruct);
+        continue;
+      }
+      // 0x68:pps
+      if (packetStruct->data[0] == 0x68) {
+        if (gPPSLen <= 0) {
+          pPPS = (char *)malloc(packetStruct->data_size);
+          if (nullptr == pPPS) {
+            av_packet_free(&pkt);
+            free(packetStruct->data);
+            free(packetStruct);
+            usleep(sleepDelta);
+            continue;
+          }
+          memcpy(pPPS, packetStruct->data, packetStruct->data_size);
+          gPPSLen = packetStruct->data_size;  // after the copy, as for the SPS
+          LOG_INFO("%s get pps ppsLen=%d", __FUNCTION__, gPPSLen);
+        }
+        av_packet_free(&pkt);
+        free(packetStruct->data);
+        free(packetStruct);
+        continue;
+      }
+
+      if (!isFirstIDR) {
+        // 0x65:IDR
+        if (packetStruct->data[0] == 0x65) {
+          isFirstIDR = true;
+          LOG_INFO("%s get first idr.", __FUNCTION__);
+        } else {
+          av_packet_free(&pkt);
+          free(packetStruct->data);
+          free(packetStruct);
+          continue;
+        }
+      }
+
+      if (packetStruct->data[0] == 0x65 && gSPSLen > 0 && gPPSLen > 0) {
+        ret = av_new_packet(
+            pkt, (int)(NAL_START_LEN + gSPSLen + NAL_START_LEN + gPPSLen +
+                       packetStruct->data_size + NAL_START_LEN));
+      } else {
+        ret = av_new_packet(pkt, packetStruct->data_size + NAL_START_LEN);
+      }
+
+      if (ret < 0) {
+        av_packet_free(&pkt);
+        free(packetStruct->data);
+        free(packetStruct);
+        usleep(sleepDelta);
+        continue;
+      }
+    } else {
+      av_packet_free(&pkt);
+      usleep(sleepDelta);
+      continue;
+    }
+
+    if (packetStruct->data[0] == 0x65 && gSPSLen > 0 && gPPSLen > 0) {
+      int pos = 0;
+      // Layout: start code, SPS, start code, PPS, start code, IDR payload.
+      memcpy(pkt->data + pos, H264_NAL_START, NAL_START_LEN);
+      pos += NAL_START_LEN;
+      memcpy(pkt->data + pos, pSPS, gSPSLen);
+      pos += (int)gSPSLen;
+
+      memcpy(pkt->data + pos, H264_NAL_START, NAL_START_LEN);
+      pos += NAL_START_LEN;
+      memcpy(pkt->data + pos, pPPS, gPPSLen);
+      pos += (int)gPPSLen;
+
+      memcpy(pkt->data + pos, H264_NAL_START, NAL_START_LEN);
+      pos += NAL_START_LEN;
+      memcpy(pkt->data + pos, packetStruct->data, packetStruct->data_size);
+    } else {
+      memcpy(pkt->data, H264_NAL_START, NAL_START_LEN);
+      memcpy(pkt->data + NAL_START_LEN, packetStruct->data,
+             packetStruct->data_size);
+    }
+
+    pkt->pts = packetStruct->timestamp;
+    pkt->dts = packetStruct->timestamp;
+
+    free(packetStruct->data);
+    free(packetStruct);
+    /* send the packet for decoding */
+    ret = avcodec_send_packet(pVideoAVCodecCtx, pkt);
+    // LOGD("%s send the video packet for decoding pkt size=%d", __FUNCTION__,
+    // pkt->size);
+
+    av_packet_unref(pkt);
+    av_packet_free(&pkt);
+
+    if (ret < 0) {
+      LOG_ERROR("%s Error sending the video pkt to the decoder ret=%d",
+                __FUNCTION__, ret);
+      usleep(sleepDelta);
+      continue;
+    } else {
+      // Decoding, like encoding, is one send followed by repeated receives
+      // until AVERROR(EAGAIN) or AVERROR_EOF is returned.
+      while (ret >= 0) {
+        ret = avcodec_receive_frame(pVideoAVCodecCtx, pFrame);
+        if (ret == AVERROR(EAGAIN) || ret == AVERROR_EOF) {
+          usleep(sleepDelta);
+          continue;  // ret is negative now, so the loop condition ends the loop
+        } else if (ret < 0) {
+          LOG_ERROR("%s Error receive decoding video frame ret=%d",
+                    __FUNCTION__, ret);
+          usleep(sleepDelta);
+          continue;
+        }
+
+        pthread_mutex_lock(pFrameDataCallbackMutex);
+        if (pFrameDataCallback != nullptr) {
+          // Output is fixed to AV_PIX_FMT_YUV420P: three planes, chroma planes
+          // half height. const makes yuvLens a standard array, not a VLA.
+          const int planeNum = 3;
+          int yuvLens[planeNum];
+          yuvLens[0] = pFrame->linesize[0] * pFrame->height;
+          yuvLens[1] = pFrame->linesize[1] * pFrame->height / 2;
+          yuvLens[2] = pFrame->linesize[2] * pFrame->height / 2;
+          // LOG_INFO("%s video onDataArrived", __FUNCTION__);
+          pFrameDataCallback->onDataArrived(
+              StreamType::VIDEO, (long long)pFrame->pts, (char **)pFrame->data,
+              yuvLens, planeNum, -1, -1, pFrame->width, pFrame->height);
+        }
+
+        pthread_mutex_unlock(pFrameDataCallbackMutex);
+        av_frame_unref(pFrame);
+      }
+    }
+  }
+}
\ No newline at end of file
diff --git a/src/media/video/decode/ffmpeg/ffmpeg_decoder.h b/src/media/video/decode/ffmpeg/ffmpeg_decoder.h
new file mode 100644
index 0000000..bace9a6
--- /dev/null
+++ b/src/media/video/decode/ffmpeg/ffmpeg_decoder.h
@@ -0,0 +1,57 @@
+#ifndef _FFMPEG_DECODER_H_
+#define _FFMPEG_DECODER_H_
+
+extern "C" {
+// 编解码
+#include "libavcodec/avcodec.h"
+}
+
+#include "PacketQueue.h"
+#include "cb/FrameDataCallback.h"
+
+class VideoDecoder {  // H.264 decoder: FFmpeg codec driven from its own pthread
+ public:
+  VideoDecoder(PacketQueue *packetQueue);  // packetQueue is the input source
+  ~VideoDecoder();
+  // NOTE(review): ffmpeg_decoder.cpp defines none of Init/Decode/GetFrame.
+ public:
+  int Init();
+  int Decode(const uint8_t *pData, int nSize);
+  int GetFrame(uint8_t *yuv_data, uint32_t &width, uint32_t &height,
+               uint32_t &size);
+  // Allocates the codec and starts the decode thread; returns false on failure.
+  bool open(unsigned int frameRate, unsigned int profile, unsigned int level,
+            char *sps, unsigned int spsLen, char *pps, unsigned int ppsLen);
+  // Joins the decode thread and frees the codec, frame and SPS/PPS copies.
+  void close();
+  // Thread body: loops while isDecoding is set.
+  void decode();
+  // pthread entry point; `self` is the VideoDecoder passed to pthread_create.
+  static void *_decode(void *self) {
+    static_cast<VideoDecoder *>(self)->decode();
+    return nullptr;
+  }
+  // Replaces the receiver of decoded frames (nullptr disables delivery).
+  void setFrameDataCallback(FrameDataCallback *frameDataCallback);
+
+ private:
+  PacketQueue *pPacketQueue;
+  AVCodecContext *pVideoAVCodecCtx;
+  AVFrame *pFrame;  // reused for every avcodec_receive_frame() call
+  // NOTE(review): volatile does not synchronize threads; confirm intent.
+  bool volatile isDecoding;  // loop condition of decode(); cleared by close()
+  pthread_t decodeThread;
+  pthread_mutex_t *pFrameDataCallbackMutex;  // guards pFrameDataCallback
+  FrameDataCallback *pFrameDataCallback;
+  // Cached parameter sets, prepended to IDR packets inside decode().
+  char *pSPS;
+  unsigned int volatile gSPSLen;  // 0 means no SPS cached yet
+  char *pPPS;
+  unsigned int volatile gPPSLen;  // 0 means no PPS cached yet
+
+  bool volatile isFirstIDR;  // false until decode() has seen an IDR (0x65)
+
+  unsigned int gFrameRate;  // used by decode() to size its sleep interval
+};
+
+#endif
\ No newline at end of file
diff --git a/src/media/video/decode/nvcodec/nv_decoder.cpp b/src/media/video/decode/nvcodec/nv_decoder.cpp
index 23059a6..57dd506 100644
--- a/src/media/video/decode/nvcodec/nv_decoder.cpp
+++ b/src/media/video/decode/nvcodec/nv_decoder.cpp
@@ -43,7 +43,9 @@ int VideoDecoder::Init() {
   return 0;
 }
 
-int VideoDecoder::Decode(const uint8_t *pData, int nSize) {
+int VideoDecoder::Decode(
+    const uint8_t *pData, int nSize,
+    std::function<void(VideoFrame)> on_receive_decoded_frame) {
   if (!decoder) {
     return -1;
   }
@@ -56,8 +58,26 @@ int VideoDecoder::Decode(const uint8_t *pData, int nSize) {
     fwrite((unsigned char *)pData, 1, nSize, file_);
   }
 
-  int ret = decoder->Decode(pData, nSize);
-  return ret;
+  int num_frame_returned = decoder->Decode(pData, nSize);
+
+  // Deliver each frame produced by this call. A signed index keeps the loop
+  // empty when the decoder reports zero or a negative count.
+  for (int i = 0; i < num_frame_returned; ++i) {
+    cudaVideoSurfaceFormat format = decoder->GetOutputFormat();
+    if (format == cudaVideoSurfaceFormat_NV12) {
+      uint8_t *data = decoder->GetFrame();
+      if (data) {
+        VideoFrame decoded_frame(
+            data, decoder->GetWidth() * decoder->GetHeight() * 3 / 2,
+            decoder->GetWidth(), decoder->GetHeight());
+        if (on_receive_decoded_frame) {
+          on_receive_decoded_frame(decoded_frame);
+        }
+      }
+    }
+  }
+
+  return num_frame_returned;
 }
 
 int VideoDecoder::GetFrame(uint8_t *yuv_data, uint32_t &width, uint32_t &height,
diff --git a/src/media/video/decode/nvcodec/nv_decoder.h b/src/media/video/decode/nvcodec/nv_decoder.h
index 4bb2da3..be7c8e7 100644
--- a/src/media/video/decode/nvcodec/nv_decoder.h
+++ b/src/media/video/decode/nvcodec/nv_decoder.h
@@ -1,18 +1,24 @@
 #ifndef _NV_DECODER_H_
 #define _NV_DECODER_H_
 
+#include <functional>
+
 #include "NvDecoder.h"
+#include "frame.h"
 
 class VideoDecoder {
  public:
   VideoDecoder();
   ~VideoDecoder();
 
+ public:
   int Init();
-  int Decode(const uint8_t* pData, int nSize);
+  int Decode(const uint8_t* pData, int nSize,
+             std::function<void(VideoFrame)> on_receive_decoded_frame);
   int GetFrame(uint8_t* yuv_data, uint32_t& width, uint32_t& height,
                uint32_t& size);
 
+ private:
   NvDecoder* decoder = nullptr;
   bool get_first_keyframe_ = false;
   bool skip_frame_ = false;
diff --git a/src/pc/peer_connection.cpp b/src/pc/peer_connection.cpp
index aa2b341..8a5ef7c 100644
--- a/src/pc/peer_connection.cpp
+++ b/src/pc/peer_connection.cpp
@@ -47,18 +47,14 @@ int PeerConnection::Init(PeerConnectionParams params,
 
   on_receive_video_ = [this](const char *data, size_t size, const char *user_id,
                              size_t user_id_size) {
-    int num_frame_returned = Decode((uint8_t *)data, size);
-    uint32_t width = 0;
-    uint32_t height = 0;
-    uint32_t frame_size = 0;
-    for (size_t i = 0; i < num_frame_returned; ++i) {
-      int ret = GetFrame((uint8_t *)nv12_data_, width, height, frame_size);
-
-      if (on_receive_video_buffer_) {
-        on_receive_video_buffer_(nv12_data_, width * height * 3 / 2, user_id,
-                                 user_id_size);
-      }
-    }
+    int num_frame_returned = Decode(
+        (uint8_t *)data, size,
+        [this, user_id, user_id_size](VideoFrame video_frame) {
+          if (on_receive_video_buffer_) {
+            on_receive_video_buffer_((const char *)video_frame.Buffer(),
+                                     video_frame.Size(), user_id, user_id_size);
+          }
+        });
   };
 
   on_receive_audio_ = [this](const char *data, size_t size, const char *user_id,
diff --git a/xmake.lua b/xmake.lua
index 259d88b..4c5c226 100644
--- a/xmake.lua
+++ b/xmake.lua
@@ -88,7 +88,7 @@ target("ws")
 
 target("media")
     set_kind("static")
-    add_deps("log")
+    add_deps("log", "frame")
     add_packages("cuda")
     add_links("cuda", "nvencodeapi", "nvcuvid")
     add_files("src/media/video/encode/nvcodec/*.cpp",