Repository for OpenCV's extra modules
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
 
 
 
 
 
 

421 lines
19 KiB

/*M///////////////////////////////////////////////////////////////////////////////////////
//
// IMPORTANT: READ BEFORE DOWNLOADING, COPYING, INSTALLING OR USING.
//
// By downloading, copying, installing or using the software you agree to this license.
// If you do not agree to this license, do not download, install,
// copy or use the software.
//
//
// License Agreement
// For Open Source Computer Vision Library
//
// Copyright (C) 2000-2008, Intel Corporation, all rights reserved.
// Copyright (C) 2009, Willow Garage Inc., all rights reserved.
// Copyright (C) 2013, OpenCV Foundation, all rights reserved.
// Third party copyrights are property of their respective owners.
//
// Redistribution and use in source and binary forms, with or without modification,
// are permitted provided that the following conditions are met:
//
// * Redistribution's of source code must retain the above copyright notice,
// this list of conditions and the following disclaimer.
//
// * Redistribution's in binary form must reproduce the above copyright notice,
// this list of conditions and the following disclaimer in the documentation
// and/or other materials provided with the distribution.
//
// * The name of the copyright holders may not be used to endorse or promote products
// derived from this software without specific prior written permission.
//
// This software is provided by the copyright holders and contributors "as is" and
// any express or implied warranties, including, but not limited to, the implied
// warranties of merchantability and fitness for a particular purpose are disclaimed.
// In no event shall the Intel Corporation or contributors be liable for any direct,
// indirect, incidental, special, exemplary, or consequential damages
// (including, but not limited to, procurement of substitute goods or services;
// loss of use, data, or profits; or business interruption) however caused
// and on any theory of liability, whether in contract, strict liability,
// or tort (including negligence or otherwise) arising in any way out of
// the use of this software, even if advised of the possibility of such damage.
//
//M*/
#include "precomp.hpp"
namespace cv { namespace cudacodec {
using namespace cv::cuda;
#if !defined(HAVE_NVCUVENC)
Ptr<cudacodec::VideoWriter> createVideoWriter(const String&, const Size, const Codec, const double, const ColorFormat, const Ptr<EncoderCallback>, const cv::cuda::Stream&) { throw_no_cuda(); return Ptr<cv::cudacodec::VideoWriter>(); }
Ptr<cudacodec::VideoWriter> createVideoWriter(const String&, const Size, const Codec, const double, const ColorFormat, const EncoderParams&, const Ptr<EncoderCallback>, const cv::cuda::Stream&) { throw_no_cuda(); return Ptr<cv::cudacodec::VideoWriter>(); }
#else // !defined HAVE_NVCUVENC
NV_ENC_BUFFER_FORMAT EncBufferFormat(const ColorFormat colorFormat);
int NChannels(const ColorFormat colorFormat);
GUID CodecGuid(const Codec codec);
void FrameRate(const double fps, uint32_t& frameRateNum, uint32_t& frameRateDen);
GUID EncodingProfileGuid(const EncodeProfile encodingProfile);
GUID EncodingPresetGuid(const EncodePreset nvPreset);
bool operator==(const EncoderParams& lhs, const EncoderParams& rhs)
{
return std::tie(lhs.nvPreset, lhs.tuningInfo, lhs.encodingProfile, lhs.rateControlMode, lhs.multiPassEncoding, lhs.constQp.qpInterB, lhs.constQp.qpInterP, lhs.constQp.qpIntra,
lhs.averageBitRate, lhs.maxBitRate, lhs.targetQuality, lhs.gopLength) == std::tie(rhs.nvPreset, rhs.tuningInfo, rhs.encodingProfile, rhs.rateControlMode, rhs.multiPassEncoding, rhs.constQp.qpInterB, rhs.constQp.qpInterP, rhs.constQp.qpIntra,
rhs.averageBitRate, rhs.maxBitRate, rhs.targetQuality, rhs.gopLength);
};
class FFmpegVideoWriter : public EncoderCallback
{
public:
FFmpegVideoWriter(const String& fileName, const Codec codec, const int fps, const Size sz, const int idrPeriod);
~FFmpegVideoWriter();
void onEncoded(const std::vector<std::vector<uint8_t>>& vPacket);
void onEncodingFinished();
private:
cv::VideoWriter writer;
};
FFmpegVideoWriter::FFmpegVideoWriter(const String& fileName, const Codec codec, const int fps, const Size sz, const int idrPeriod) {
if (!videoio_registry::hasBackend(CAP_FFMPEG))
CV_Error(Error::StsNotImplemented, "FFmpeg backend not found");
const int fourcc = codec == Codec::H264 ? cv::VideoWriter::fourcc('a', 'v', 'c', '1') : cv::VideoWriter::fourcc('h', 'e', 'v', '1');
writer.open(fileName, fourcc, fps, sz, { VideoWriterProperties::VIDEOWRITER_PROP_RAW_VIDEO, 1, VideoWriterProperties::VIDEOWRITER_PROP_KEY_INTERVAL, idrPeriod });
if (!writer.isOpened())
CV_Error(Error::StsUnsupportedFormat, "Unsupported video sink");
}
void FFmpegVideoWriter::onEncodingFinished() {
writer.release();
}
FFmpegVideoWriter::~FFmpegVideoWriter() {
onEncodingFinished();
}
void FFmpegVideoWriter::onEncoded(const std::vector<std::vector<uint8_t>>& vPacket) {
for (auto& packet : vPacket) {
Mat wrappedPacket(1, packet.size(), CV_8UC1, (void*)packet.data());
writer.write(wrappedPacket);
}
}
class RawVideoWriter : public EncoderCallback
{
public:
RawVideoWriter(const String fileName);
~RawVideoWriter();
void onEncoded(const std::vector<std::vector<uint8_t>>& vPacket);
void onEncodingFinished();
private:
std::ofstream fpOut;
};
RawVideoWriter::RawVideoWriter(String fileName) {
fpOut = std::ofstream(fileName, std::ios::out | std::ios::binary);
if (!fpOut)
CV_Error(Error::StsError, "Failed to open video file " + fileName + " for writing!");
}
void RawVideoWriter::onEncodingFinished() {
fpOut.close();
}
RawVideoWriter::~RawVideoWriter() {
onEncodingFinished();
}
void RawVideoWriter::onEncoded(const std::vector<std::vector<uint8_t>>& vPacket) {
for (auto& packet : vPacket)
fpOut.write(reinterpret_cast<const char*>(packet.data()), packet.size());
}
class VideoWriterImpl : public VideoWriter
{
public:
VideoWriterImpl(const Ptr<EncoderCallback>& videoWriter, const Size frameSize, const Codec codec, const double fps,
const ColorFormat colorFormat, const Stream& stream = Stream::Null());
VideoWriterImpl(const Ptr<EncoderCallback>& videoWriter, const Size frameSize, const Codec codec, const double fps,
const ColorFormat colorFormat, const EncoderParams& encoderParams, const Stream& stream = Stream::Null());
~VideoWriterImpl();
void write(InputArray frame);
EncoderParams getEncoderParams() const;
void release();
private:
void Init(const Codec codec, const double fps, const Size frameSz);
void InitializeEncoder(const GUID codec, const double fps);
void CopyToNvSurface(const InputArray src);
Ptr<EncoderCallback> encoderCallback;
ColorFormat colorFormat = ColorFormat::UNDEFINED;
NV_ENC_BUFFER_FORMAT surfaceFormat = NV_ENC_BUFFER_FORMAT::NV_ENC_BUFFER_FORMAT_UNDEFINED;
EncoderParams encoderParams;
Stream stream = Stream::Null();
Ptr<NvEncoderCuda> pEnc;
std::vector<std::vector<uint8_t>> vPacket;
int nSrcChannels = 0;
CUcontext cuContext;
};
NV_ENC_BUFFER_FORMAT EncBufferFormat(const ColorFormat colorFormat) {
switch (colorFormat) {
case ColorFormat::BGR: return NV_ENC_BUFFER_FORMAT_ARGB;
case ColorFormat::RGB: return NV_ENC_BUFFER_FORMAT_ABGR;
case ColorFormat::BGRA: return NV_ENC_BUFFER_FORMAT_ARGB;
case ColorFormat::RGBA: return NV_ENC_BUFFER_FORMAT_ABGR;
case ColorFormat::GRAY:
case ColorFormat::NV_NV12: return NV_ENC_BUFFER_FORMAT_NV12;
case ColorFormat::NV_YV12: return NV_ENC_BUFFER_FORMAT_YV12;
case ColorFormat::NV_IYUV: return NV_ENC_BUFFER_FORMAT_IYUV;
case ColorFormat::NV_YUV444: return NV_ENC_BUFFER_FORMAT_YUV444;
case ColorFormat::NV_AYUV: return NV_ENC_BUFFER_FORMAT_AYUV;
default: return NV_ENC_BUFFER_FORMAT_UNDEFINED;
}
}
int NChannels(const ColorFormat colorFormat) {
switch (colorFormat) {
case ColorFormat::BGR:
case ColorFormat::RGB:
case ColorFormat::NV_IYUV:
case ColorFormat::NV_YUV444: return 3;
case ColorFormat::RGBA:
case ColorFormat::BGRA:
case ColorFormat::NV_AYUV: return 4;
case ColorFormat::GRAY:
case ColorFormat::NV_NV12:
case ColorFormat::NV_YV12: return 1;
default: return 0;
}
}
VideoWriterImpl::VideoWriterImpl(const Ptr<EncoderCallback>& encoderCallBack_, const Size frameSz, const Codec codec, const double fps,
const ColorFormat colorFormat_, const EncoderParams& encoderParams_, const Stream& stream_) :
encoderCallback(encoderCallBack_), colorFormat(colorFormat_), encoderParams(encoderParams_), stream(stream_)
{
CV_Assert(colorFormat != ColorFormat::UNDEFINED);
surfaceFormat = EncBufferFormat(colorFormat);
if (surfaceFormat == NV_ENC_BUFFER_FORMAT_UNDEFINED) {
String msg = cv::format("Unsupported input surface format: %i", colorFormat);
CV_LOG_WARNING(NULL, msg);
CV_Error(Error::StsUnsupportedFormat, msg);
}
nSrcChannels = NChannels(colorFormat);
Init(codec, fps, frameSz);
}
void VideoWriterImpl::release() {
pEnc->EndEncode(vPacket);
encoderCallback->onEncoded(vPacket);
encoderCallback->onEncodingFinished();
}
VideoWriterImpl::~VideoWriterImpl() {
release();
}
GUID CodecGuid(const Codec codec) {
switch (codec) {
case Codec::H264: return NV_ENC_CODEC_H264_GUID;
case Codec::HEVC: return NV_ENC_CODEC_HEVC_GUID;
default: break;
}
std::string msg = "Unknown codec: cudacodec::VideoWriter only supports CODEC_VW::H264 and CODEC_VW::HEVC";
CV_LOG_WARNING(NULL, msg);
CV_Error(Error::StsUnsupportedFormat, msg);
}
void VideoWriterImpl::Init(const Codec codec, const double fps, const Size frameSz) {
// init context
GpuMat temp(1, 1, CV_8UC1);
temp.release();
cuSafeCall(cuCtxGetCurrent(&cuContext));
CV_Assert(nSrcChannels != 0);
const GUID codecGuid = CodecGuid(codec);
try {
pEnc = new NvEncoderCuda(cuContext, frameSz.width, frameSz.height, surfaceFormat);
InitializeEncoder(codecGuid, fps);
const cudaStream_t cudaStream = cuda::StreamAccessor::getStream(stream);
pEnc->SetIOCudaStreams((NV_ENC_CUSTREAM_PTR)&cudaStream, (NV_ENC_CUSTREAM_PTR)&cudaStream);
}
catch (cv::Exception& e)
{
String msg = String("Error initializing Nvidia Encoder. Refer to Nvidia's GPU Support Matrix to confirm your GPU supports hardware encoding, ") +
String("codec and surface format and check the encoder documentation to verify your choice of encoding paramaters are supported.") +
e.msg;
CV_Error(Error::GpuApiCallError, msg);
}
const Size encoderFrameSz(pEnc->GetEncodeWidth(), pEnc->GetEncodeHeight());
CV_Assert(frameSz == encoderFrameSz);
}
void FrameRate(const double fps, uint32_t& frameRateNum, uint32_t& frameRateDen) {
CV_Assert(fps >= 0);
int frame_rate = (int)(fps + 0.5);
int frame_rate_base = 1;
while (fabs(((double)frame_rate / frame_rate_base) - fps) > 0.001) {
frame_rate_base *= 10;
frame_rate = (int)(fps * frame_rate_base + 0.5);
}
frameRateNum = frame_rate;
frameRateDen = frame_rate_base;
}
GUID EncodingProfileGuid(const EncodeProfile encodingProfile) {
switch (encodingProfile) {
case(ENC_CODEC_PROFILE_AUTOSELECT): return NV_ENC_CODEC_PROFILE_AUTOSELECT_GUID;
case(ENC_H264_PROFILE_BASELINE): return NV_ENC_H264_PROFILE_BASELINE_GUID;
case(ENC_H264_PROFILE_MAIN): return NV_ENC_H264_PROFILE_MAIN_GUID;
case(ENC_H264_PROFILE_HIGH): return NV_ENC_H264_PROFILE_HIGH_GUID;
case(ENC_H264_PROFILE_HIGH_444): return NV_ENC_H264_PROFILE_HIGH_444_GUID;
case(ENC_H264_PROFILE_STEREO): return NV_ENC_H264_PROFILE_STEREO_GUID;
case(ENC_H264_PROFILE_PROGRESSIVE_HIGH): return NV_ENC_H264_PROFILE_PROGRESSIVE_HIGH_GUID;
case(ENC_H264_PROFILE_CONSTRAINED_HIGH): return NV_ENC_H264_PROFILE_CONSTRAINED_HIGH_GUID;
case(ENC_HEVC_PROFILE_MAIN): return NV_ENC_HEVC_PROFILE_MAIN_GUID;
case(ENC_HEVC_PROFILE_MAIN10): return NV_ENC_HEVC_PROFILE_MAIN10_GUID;
case(ENC_HEVC_PROFILE_FREXT): return NV_ENC_HEVC_PROFILE_FREXT_GUID;
default: break;
}
std::string msg = "Unknown Encoding Profile.";
CV_LOG_WARNING(NULL, msg);
CV_Error(Error::StsUnsupportedFormat, msg);
}
GUID EncodingPresetGuid(const EncodePreset nvPreset) {
switch (nvPreset) {
case ENC_PRESET_P1: return NV_ENC_PRESET_P1_GUID;
case ENC_PRESET_P2: return NV_ENC_PRESET_P2_GUID;
case ENC_PRESET_P3: return NV_ENC_PRESET_P3_GUID;
case ENC_PRESET_P4: return NV_ENC_PRESET_P4_GUID;
case ENC_PRESET_P5: return NV_ENC_PRESET_P5_GUID;
case ENC_PRESET_P6: return NV_ENC_PRESET_P6_GUID;
case ENC_PRESET_P7: return NV_ENC_PRESET_P7_GUID;
default: break;
}
std::string msg = "Unknown Nvidia Encoding Preset.";
CV_LOG_WARNING(NULL, msg);
CV_Error(Error::StsUnsupportedFormat, msg);
}
void VideoWriterImpl::InitializeEncoder(const GUID codec, const double fps)
{
NV_ENC_INITIALIZE_PARAMS initializeParams = {};
initializeParams.version = NV_ENC_INITIALIZE_PARAMS_VER;
NV_ENC_CONFIG encodeConfig = {};
encodeConfig.version = NV_ENC_CONFIG_VER;
initializeParams.encodeConfig = &encodeConfig;
pEnc->CreateDefaultEncoderParams(&initializeParams, codec, EncodingPresetGuid(encoderParams.nvPreset), (NV_ENC_TUNING_INFO)encoderParams.tuningInfo);
FrameRate(fps, initializeParams.frameRateNum, initializeParams.frameRateDen);
initializeParams.encodeConfig->profileGUID = EncodingProfileGuid(encoderParams.encodingProfile);
initializeParams.encodeConfig->rcParams.rateControlMode = (NV_ENC_PARAMS_RC_MODE)(encoderParams.rateControlMode + encoderParams.multiPassEncoding);
initializeParams.encodeConfig->rcParams.constQP = { encoderParams.constQp.qpInterB, encoderParams.constQp.qpInterB,encoderParams.constQp.qpInterB };
initializeParams.encodeConfig->rcParams.averageBitRate = encoderParams.averageBitRate;
initializeParams.encodeConfig->rcParams.maxBitRate = encoderParams.maxBitRate;
initializeParams.encodeConfig->rcParams.targetQuality = encoderParams.targetQuality;
initializeParams.encodeConfig->gopLength = encoderParams.gopLength;
if (codec == NV_ENC_CODEC_H264_GUID)
initializeParams.encodeConfig->encodeCodecConfig.h264Config.idrPeriod = encoderParams.idrPeriod;
else if (codec == NV_ENC_CODEC_HEVC_GUID)
initializeParams.encodeConfig->encodeCodecConfig.hevcConfig.idrPeriod = encoderParams.idrPeriod;
pEnc->CreateEncoder(&initializeParams);
}
inline bool CvFormat(const ColorFormat cf) {
if (cf == ColorFormat::BGR || cf == ColorFormat::RGB || cf == ColorFormat::BGRA || cf == ColorFormat::RGBA || cf == ColorFormat::GRAY)
return true;
return false;
}
void VideoWriterImpl::CopyToNvSurface(const InputArray src)
{
const NvEncInputFrame* encoderInputFrame = pEnc->GetNextInputFrame();
CV_Assert(src.isGpuMat() || src.isMat());
if (CvFormat(colorFormat))
CV_Assert(src.size() == Size(pEnc->GetEncodeWidth(), pEnc->GetEncodeHeight()));
Npp8u* dst = (Npp8u*)encoderInputFrame->inputPtr;
if (colorFormat == ColorFormat::BGR || colorFormat == ColorFormat::RGB) {
GpuMat srcDevice;
if (src.isGpuMat())
srcDevice = src.getGpuMat();
else {
if (stream)
srcDevice.upload(src, stream);
else
srcDevice.upload(src);
}
if (colorFormat == ColorFormat::BGR) {
GpuMat dstGpuMat(pEnc->GetEncodeHeight(), pEnc->GetEncodeWidth(), CV_8UC4, dst, encoderInputFrame->pitch);
cuda::cvtColor(srcDevice, dstGpuMat, COLOR_BGR2BGRA, 0, stream);
}
else {
GpuMat dstGpuMat(pEnc->GetEncodeHeight(), pEnc->GetEncodeWidth(), CV_8UC4, dst, encoderInputFrame->pitch);
cuda::cvtColor(srcDevice, dstGpuMat, COLOR_RGB2RGBA, 0, stream);
}
}
else if (colorFormat == ColorFormat::GRAY) {
const cudaMemcpyKind memcpyKind = src.isGpuMat() ? cudaMemcpyDeviceToDevice : cudaMemcpyHostToDevice;
const void* srcPtr = src.isGpuMat() ? src.getGpuMat().data : src.getMat().data;
const size_t srcPitch = src.isGpuMat() ? src.getGpuMat().step : src.getMat().step;
const uint32_t chromaHeight = NvEncoder::GetChromaHeight(NV_ENC_BUFFER_FORMAT_NV12, pEnc->GetEncodeHeight());
if (stream) {
cudaMemcpy2DAsync(dst, encoderInputFrame->pitch, srcPtr, srcPitch, pEnc->GetEncodeWidth(), pEnc->GetEncodeHeight(), memcpyKind,
cuda::StreamAccessor::getStream(stream));
cudaMemset2DAsync(&dst[encoderInputFrame->pitch * pEnc->GetEncodeHeight()], encoderInputFrame->pitch, 128, pEnc->GetEncodeWidth(), chromaHeight,
cuda::StreamAccessor::getStream(stream));
}
else {
cudaMemcpy2D(dst, encoderInputFrame->pitch, srcPtr, srcPitch, pEnc->GetEncodeWidth(), pEnc->GetEncodeHeight(), memcpyKind);
cudaMemset2D(&dst[encoderInputFrame->pitch * pEnc->GetEncodeHeight()], encoderInputFrame->pitch, 128, pEnc->GetEncodeWidth(), chromaHeight);
}
}
else {
void* srcPtr = src.isGpuMat() ? src.getGpuMat().data : src.getMat().data;
const CUmemorytype cuMemoryType = src.isGpuMat() ? CU_MEMORYTYPE_DEVICE : CU_MEMORYTYPE_HOST;
NvEncoderCuda::CopyToDeviceFrame(cuContext, srcPtr, static_cast<unsigned>(src.step()), (CUdeviceptr)encoderInputFrame->inputPtr, (int)encoderInputFrame->pitch, pEnc->GetEncodeWidth(),
pEnc->GetEncodeHeight(), cuMemoryType, encoderInputFrame->bufferFormat, encoderInputFrame->chromaOffsets, encoderInputFrame->numChromaPlanes,
false, cuda::StreamAccessor::getStream(stream));
}
}
void VideoWriterImpl::write(const InputArray frame) {
CV_Assert(frame.channels() == nSrcChannels);
CopyToNvSurface(frame);
pEnc->EncodeFrame(vPacket);
encoderCallback->onEncoded(vPacket);
};
EncoderParams VideoWriterImpl::getEncoderParams() const {
return encoderParams;
};
Ptr<VideoWriter> createVideoWriter(const String& fileName, const Size frameSize, const Codec codec, const double fps, const ColorFormat colorFormat,
Ptr<EncoderCallback> encoderCallback, const Stream& stream)
{
return createVideoWriter(fileName, frameSize, codec, fps, colorFormat, EncoderParams(), encoderCallback, stream);
}
Ptr<VideoWriter> createVideoWriter(const String& fileName, const Size frameSize, const Codec codec, const double fps, const ColorFormat colorFormat,
const EncoderParams& params, Ptr<EncoderCallback> encoderCallback, const Stream& stream)
{
CV_Assert(params.idrPeriod >= params.gopLength);
if (!encoderCallback) {
// required until PR for raw video encapsulation is merged and windows dll is updated
#ifndef WIN32 // remove #define and keep code once merged
try {
encoderCallback = new FFmpegVideoWriter(fileName, codec, fps, frameSize, params.idrPeriod);
}
catch (...)
#endif
{
encoderCallback = new RawVideoWriter(fileName);
}
}
return makePtr<VideoWriterImpl>(encoderCallback, frameSize, codec, fps, colorFormat, params, stream);
}
#endif // !defined HAVE_NVCUVENC
}}