/*M/////////////////////////////////////////////////////////////////////////////////////// // // IMPORTANT: READ BEFORE DOWNLOADING, COPYING, INSTALLING OR USING. // // By downloading, copying, installing or using the software you agree to this license. // If you do not agree to this license, do not download, install, // copy or use the software. // // // License Agreement // For Open Source Computer Vision Library // // Copyright (C) 2000-2008, Intel Corporation, all rights reserved. // Copyright (C) 2009, Willow Garage Inc., all rights reserved. // Copyright (C) 2013, OpenCV Foundation, all rights reserved. // Third party copyrights are property of their respective owners. // // Redistribution and use in source and binary forms, with or without modification, // are permitted provided that the following conditions are met: // // * Redistribution's of source code must retain the above copyright notice, // this list of conditions and the following disclaimer. // // * Redistribution's in binary form must reproduce the above copyright notice, // this list of conditions and the following disclaimer in the documentation // and/or other materials provided with the distribution. // // * The name of the copyright holders may not be used to endorse or promote products // derived from this software without specific prior written permission. // // This software is provided by the copyright holders and contributors "as is" and // any express or implied warranties, including, but not limited to, the implied // warranties of merchantability and fitness for a particular purpose are disclaimed. // In no event shall the Intel Corporation or contributors be liable for any direct, // indirect, incidental, special, exemplary, or consequential damages // (including, but not limited to, procurement of substitute goods or services; // loss of use, data, or profits; or business interruption) however caused // and on any theory of liability, whether in contract, strict liability, // or tort (including negligence or otherwise) arising in any way out of // the use of this software, even if advised of the possibility of such damage. // //M*/ #include "precomp.hpp" namespace cv { namespace cudacodec { using namespace cv::cuda; #if !defined(HAVE_NVCUVENC) Ptr createVideoWriter(const String&, const Size, const Codec, const double, const ColorFormat, const Ptr, const cv::cuda::Stream&) { throw_no_cuda(); return Ptr(); } Ptr createVideoWriter(const String&, const Size, const Codec, const double, const ColorFormat, const EncoderParams&, const Ptr, const cv::cuda::Stream&) { throw_no_cuda(); return Ptr(); } #else // !defined HAVE_NVCUVENC NV_ENC_BUFFER_FORMAT EncBufferFormat(const ColorFormat colorFormat); int NChannels(const ColorFormat colorFormat); GUID CodecGuid(const Codec codec); void FrameRate(const double fps, uint32_t& frameRateNum, uint32_t& frameRateDen); GUID EncodingProfileGuid(const EncodeProfile encodingProfile); GUID EncodingPresetGuid(const EncodePreset nvPreset); bool operator==(const EncoderParams& lhs, const EncoderParams& rhs) { return std::tie(lhs.nvPreset, lhs.tuningInfo, lhs.encodingProfile, lhs.rateControlMode, lhs.multiPassEncoding, lhs.constQp.qpInterB, lhs.constQp.qpInterP, lhs.constQp.qpIntra, lhs.averageBitRate, lhs.maxBitRate, lhs.targetQuality, lhs.gopLength) == std::tie(rhs.nvPreset, rhs.tuningInfo, rhs.encodingProfile, rhs.rateControlMode, rhs.multiPassEncoding, rhs.constQp.qpInterB, rhs.constQp.qpInterP, rhs.constQp.qpIntra, rhs.averageBitRate, rhs.maxBitRate, rhs.targetQuality, rhs.gopLength); }; class FFmpegVideoWriter : public EncoderCallback { public: FFmpegVideoWriter(const String& fileName, const Codec codec, const int fps, const Size sz, const int idrPeriod); ~FFmpegVideoWriter(); void onEncoded(const std::vector>& vPacket); void onEncodingFinished(); private: cv::VideoWriter writer; }; FFmpegVideoWriter::FFmpegVideoWriter(const String& fileName, const Codec codec, const int fps, const Size sz, const int idrPeriod) { if (!videoio_registry::hasBackend(CAP_FFMPEG)) CV_Error(Error::StsNotImplemented, "FFmpeg backend not found"); const int fourcc = codec == Codec::H264 ? cv::VideoWriter::fourcc('a', 'v', 'c', '1') : cv::VideoWriter::fourcc('h', 'e', 'v', '1'); writer.open(fileName, fourcc, fps, sz, { VideoWriterProperties::VIDEOWRITER_PROP_RAW_VIDEO, 1, VideoWriterProperties::VIDEOWRITER_PROP_KEY_INTERVAL, idrPeriod }); if (!writer.isOpened()) CV_Error(Error::StsUnsupportedFormat, "Unsupported video sink"); } void FFmpegVideoWriter::onEncodingFinished() { writer.release(); } FFmpegVideoWriter::~FFmpegVideoWriter() { onEncodingFinished(); } void FFmpegVideoWriter::onEncoded(const std::vector>& vPacket) { for (auto& packet : vPacket) { Mat wrappedPacket(1, packet.size(), CV_8UC1, (void*)packet.data()); writer.write(wrappedPacket); } } class RawVideoWriter : public EncoderCallback { public: RawVideoWriter(const String fileName); ~RawVideoWriter(); void onEncoded(const std::vector>& vPacket); void onEncodingFinished(); private: std::ofstream fpOut; }; RawVideoWriter::RawVideoWriter(String fileName) { fpOut = std::ofstream(fileName, std::ios::out | std::ios::binary); if (!fpOut) CV_Error(Error::StsError, "Failed to open video file " + fileName + " for writing!"); } void RawVideoWriter::onEncodingFinished() { fpOut.close(); } RawVideoWriter::~RawVideoWriter() { onEncodingFinished(); } void RawVideoWriter::onEncoded(const std::vector>& vPacket) { for (auto& packet : vPacket) fpOut.write(reinterpret_cast(packet.data()), packet.size()); } class VideoWriterImpl : public VideoWriter { public: VideoWriterImpl(const Ptr& videoWriter, const Size frameSize, const Codec codec, const double fps, const ColorFormat colorFormat, const Stream& stream = Stream::Null()); VideoWriterImpl(const Ptr& videoWriter, const Size frameSize, const Codec codec, const double fps, const ColorFormat colorFormat, const EncoderParams& encoderParams, const Stream& stream = Stream::Null()); ~VideoWriterImpl(); void write(InputArray frame); EncoderParams getEncoderParams() const; void release(); private: void Init(const Codec codec, const double fps, const Size frameSz); void InitializeEncoder(const GUID codec, const double fps); void CopyToNvSurface(const InputArray src); Ptr encoderCallback; ColorFormat colorFormat = ColorFormat::UNDEFINED; NV_ENC_BUFFER_FORMAT surfaceFormat = NV_ENC_BUFFER_FORMAT::NV_ENC_BUFFER_FORMAT_UNDEFINED; EncoderParams encoderParams; Stream stream = Stream::Null(); Ptr pEnc; std::vector> vPacket; int nSrcChannels = 0; CUcontext cuContext; }; NV_ENC_BUFFER_FORMAT EncBufferFormat(const ColorFormat colorFormat) { switch (colorFormat) { case ColorFormat::BGR: return NV_ENC_BUFFER_FORMAT_ARGB; case ColorFormat::RGB: return NV_ENC_BUFFER_FORMAT_ABGR; case ColorFormat::BGRA: return NV_ENC_BUFFER_FORMAT_ARGB; case ColorFormat::RGBA: return NV_ENC_BUFFER_FORMAT_ABGR; case ColorFormat::GRAY: case ColorFormat::NV_NV12: return NV_ENC_BUFFER_FORMAT_NV12; case ColorFormat::NV_YV12: return NV_ENC_BUFFER_FORMAT_YV12; case ColorFormat::NV_IYUV: return NV_ENC_BUFFER_FORMAT_IYUV; case ColorFormat::NV_YUV444: return NV_ENC_BUFFER_FORMAT_YUV444; case ColorFormat::NV_AYUV: return NV_ENC_BUFFER_FORMAT_AYUV; default: return NV_ENC_BUFFER_FORMAT_UNDEFINED; } } int NChannels(const ColorFormat colorFormat) { switch (colorFormat) { case ColorFormat::BGR: case ColorFormat::RGB: case ColorFormat::NV_IYUV: case ColorFormat::NV_YUV444: return 3; case ColorFormat::RGBA: case ColorFormat::BGRA: case ColorFormat::NV_AYUV: return 4; case ColorFormat::GRAY: case ColorFormat::NV_NV12: case ColorFormat::NV_YV12: return 1; default: return 0; } } VideoWriterImpl::VideoWriterImpl(const Ptr& encoderCallBack_, const Size frameSz, const Codec codec, const double fps, const ColorFormat colorFormat_, const EncoderParams& encoderParams_, const Stream& stream_) : encoderCallback(encoderCallBack_), colorFormat(colorFormat_), encoderParams(encoderParams_), stream(stream_) { CV_Assert(colorFormat != ColorFormat::UNDEFINED); surfaceFormat = EncBufferFormat(colorFormat); if (surfaceFormat == NV_ENC_BUFFER_FORMAT_UNDEFINED) { String msg = cv::format("Unsupported input surface format: %i", colorFormat); CV_LOG_WARNING(NULL, msg); CV_Error(Error::StsUnsupportedFormat, msg); } nSrcChannels = NChannels(colorFormat); Init(codec, fps, frameSz); } void VideoWriterImpl::release() { pEnc->EndEncode(vPacket); encoderCallback->onEncoded(vPacket); encoderCallback->onEncodingFinished(); } VideoWriterImpl::~VideoWriterImpl() { release(); } GUID CodecGuid(const Codec codec) { switch (codec) { case Codec::H264: return NV_ENC_CODEC_H264_GUID; case Codec::HEVC: return NV_ENC_CODEC_HEVC_GUID; default: break; } std::string msg = "Unknown codec: cudacodec::VideoWriter only supports CODEC_VW::H264 and CODEC_VW::HEVC"; CV_LOG_WARNING(NULL, msg); CV_Error(Error::StsUnsupportedFormat, msg); } void VideoWriterImpl::Init(const Codec codec, const double fps, const Size frameSz) { // init context GpuMat temp(1, 1, CV_8UC1); temp.release(); cuSafeCall(cuCtxGetCurrent(&cuContext)); CV_Assert(nSrcChannels != 0); const GUID codecGuid = CodecGuid(codec); try { pEnc = new NvEncoderCuda(cuContext, frameSz.width, frameSz.height, surfaceFormat); InitializeEncoder(codecGuid, fps); const cudaStream_t cudaStream = cuda::StreamAccessor::getStream(stream); pEnc->SetIOCudaStreams((NV_ENC_CUSTREAM_PTR)&cudaStream, (NV_ENC_CUSTREAM_PTR)&cudaStream); } catch (cv::Exception& e) { String msg = String("Error initializing Nvidia Encoder. Refer to Nvidia's GPU Support Matrix to confirm your GPU supports hardware encoding, ") + String("codec and surface format and check the encoder documentation to verify your choice of encoding paramaters are supported.") + e.msg; CV_Error(Error::GpuApiCallError, msg); } const Size encoderFrameSz(pEnc->GetEncodeWidth(), pEnc->GetEncodeHeight()); CV_Assert(frameSz == encoderFrameSz); } void FrameRate(const double fps, uint32_t& frameRateNum, uint32_t& frameRateDen) { CV_Assert(fps >= 0); int frame_rate = (int)(fps + 0.5); int frame_rate_base = 1; while (fabs(((double)frame_rate / frame_rate_base) - fps) > 0.001) { frame_rate_base *= 10; frame_rate = (int)(fps * frame_rate_base + 0.5); } frameRateNum = frame_rate; frameRateDen = frame_rate_base; } GUID EncodingProfileGuid(const EncodeProfile encodingProfile) { switch (encodingProfile) { case(ENC_CODEC_PROFILE_AUTOSELECT): return NV_ENC_CODEC_PROFILE_AUTOSELECT_GUID; case(ENC_H264_PROFILE_BASELINE): return NV_ENC_H264_PROFILE_BASELINE_GUID; case(ENC_H264_PROFILE_MAIN): return NV_ENC_H264_PROFILE_MAIN_GUID; case(ENC_H264_PROFILE_HIGH): return NV_ENC_H264_PROFILE_HIGH_GUID; case(ENC_H264_PROFILE_HIGH_444): return NV_ENC_H264_PROFILE_HIGH_444_GUID; case(ENC_H264_PROFILE_STEREO): return NV_ENC_H264_PROFILE_STEREO_GUID; case(ENC_H264_PROFILE_PROGRESSIVE_HIGH): return NV_ENC_H264_PROFILE_PROGRESSIVE_HIGH_GUID; case(ENC_H264_PROFILE_CONSTRAINED_HIGH): return NV_ENC_H264_PROFILE_CONSTRAINED_HIGH_GUID; case(ENC_HEVC_PROFILE_MAIN): return NV_ENC_HEVC_PROFILE_MAIN_GUID; case(ENC_HEVC_PROFILE_MAIN10): return NV_ENC_HEVC_PROFILE_MAIN10_GUID; case(ENC_HEVC_PROFILE_FREXT): return NV_ENC_HEVC_PROFILE_FREXT_GUID; default: break; } std::string msg = "Unknown Encoding Profile."; CV_LOG_WARNING(NULL, msg); CV_Error(Error::StsUnsupportedFormat, msg); } GUID EncodingPresetGuid(const EncodePreset nvPreset) { switch (nvPreset) { case ENC_PRESET_P1: return NV_ENC_PRESET_P1_GUID; case ENC_PRESET_P2: return NV_ENC_PRESET_P2_GUID; case ENC_PRESET_P3: return NV_ENC_PRESET_P3_GUID; case ENC_PRESET_P4: return NV_ENC_PRESET_P4_GUID; case ENC_PRESET_P5: return NV_ENC_PRESET_P5_GUID; case ENC_PRESET_P6: return NV_ENC_PRESET_P6_GUID; case ENC_PRESET_P7: return NV_ENC_PRESET_P7_GUID; default: break; } std::string msg = "Unknown Nvidia Encoding Preset."; CV_LOG_WARNING(NULL, msg); CV_Error(Error::StsUnsupportedFormat, msg); } void VideoWriterImpl::InitializeEncoder(const GUID codec, const double fps) { NV_ENC_INITIALIZE_PARAMS initializeParams = {}; initializeParams.version = NV_ENC_INITIALIZE_PARAMS_VER; NV_ENC_CONFIG encodeConfig = {}; encodeConfig.version = NV_ENC_CONFIG_VER; initializeParams.encodeConfig = &encodeConfig; pEnc->CreateDefaultEncoderParams(&initializeParams, codec, EncodingPresetGuid(encoderParams.nvPreset), (NV_ENC_TUNING_INFO)encoderParams.tuningInfo); FrameRate(fps, initializeParams.frameRateNum, initializeParams.frameRateDen); initializeParams.encodeConfig->profileGUID = EncodingProfileGuid(encoderParams.encodingProfile); initializeParams.encodeConfig->rcParams.rateControlMode = (NV_ENC_PARAMS_RC_MODE)(encoderParams.rateControlMode + encoderParams.multiPassEncoding); initializeParams.encodeConfig->rcParams.constQP = { encoderParams.constQp.qpInterB, encoderParams.constQp.qpInterB,encoderParams.constQp.qpInterB }; initializeParams.encodeConfig->rcParams.averageBitRate = encoderParams.averageBitRate; initializeParams.encodeConfig->rcParams.maxBitRate = encoderParams.maxBitRate; initializeParams.encodeConfig->rcParams.targetQuality = encoderParams.targetQuality; initializeParams.encodeConfig->gopLength = encoderParams.gopLength; if (codec == NV_ENC_CODEC_H264_GUID) initializeParams.encodeConfig->encodeCodecConfig.h264Config.idrPeriod = encoderParams.idrPeriod; else if (codec == NV_ENC_CODEC_HEVC_GUID) initializeParams.encodeConfig->encodeCodecConfig.hevcConfig.idrPeriod = encoderParams.idrPeriod; pEnc->CreateEncoder(&initializeParams); } inline bool CvFormat(const ColorFormat cf) { if (cf == ColorFormat::BGR || cf == ColorFormat::RGB || cf == ColorFormat::BGRA || cf == ColorFormat::RGBA || cf == ColorFormat::GRAY) return true; return false; } void VideoWriterImpl::CopyToNvSurface(const InputArray src) { const NvEncInputFrame* encoderInputFrame = pEnc->GetNextInputFrame(); CV_Assert(src.isGpuMat() || src.isMat()); if (CvFormat(colorFormat)) CV_Assert(src.size() == Size(pEnc->GetEncodeWidth(), pEnc->GetEncodeHeight())); Npp8u* dst = (Npp8u*)encoderInputFrame->inputPtr; if (colorFormat == ColorFormat::BGR || colorFormat == ColorFormat::RGB) { GpuMat srcDevice; if (src.isGpuMat()) srcDevice = src.getGpuMat(); else { if (stream) srcDevice.upload(src, stream); else srcDevice.upload(src); } if (colorFormat == ColorFormat::BGR) { GpuMat dstGpuMat(pEnc->GetEncodeHeight(), pEnc->GetEncodeWidth(), CV_8UC4, dst, encoderInputFrame->pitch); cuda::cvtColor(srcDevice, dstGpuMat, COLOR_BGR2BGRA, 0, stream); } else { GpuMat dstGpuMat(pEnc->GetEncodeHeight(), pEnc->GetEncodeWidth(), CV_8UC4, dst, encoderInputFrame->pitch); cuda::cvtColor(srcDevice, dstGpuMat, COLOR_RGB2RGBA, 0, stream); } } else if (colorFormat == ColorFormat::GRAY) { const cudaMemcpyKind memcpyKind = src.isGpuMat() ? cudaMemcpyDeviceToDevice : cudaMemcpyHostToDevice; const void* srcPtr = src.isGpuMat() ? src.getGpuMat().data : src.getMat().data; const size_t srcPitch = src.isGpuMat() ? src.getGpuMat().step : src.getMat().step; const uint32_t chromaHeight = NvEncoder::GetChromaHeight(NV_ENC_BUFFER_FORMAT_NV12, pEnc->GetEncodeHeight()); if (stream) { cudaMemcpy2DAsync(dst, encoderInputFrame->pitch, srcPtr, srcPitch, pEnc->GetEncodeWidth(), pEnc->GetEncodeHeight(), memcpyKind, cuda::StreamAccessor::getStream(stream)); cudaMemset2DAsync(&dst[encoderInputFrame->pitch * pEnc->GetEncodeHeight()], encoderInputFrame->pitch, 128, pEnc->GetEncodeWidth(), chromaHeight, cuda::StreamAccessor::getStream(stream)); } else { cudaMemcpy2D(dst, encoderInputFrame->pitch, srcPtr, srcPitch, pEnc->GetEncodeWidth(), pEnc->GetEncodeHeight(), memcpyKind); cudaMemset2D(&dst[encoderInputFrame->pitch * pEnc->GetEncodeHeight()], encoderInputFrame->pitch, 128, pEnc->GetEncodeWidth(), chromaHeight); } } else { void* srcPtr = src.isGpuMat() ? src.getGpuMat().data : src.getMat().data; const CUmemorytype cuMemoryType = src.isGpuMat() ? CU_MEMORYTYPE_DEVICE : CU_MEMORYTYPE_HOST; NvEncoderCuda::CopyToDeviceFrame(cuContext, srcPtr, static_cast(src.step()), (CUdeviceptr)encoderInputFrame->inputPtr, (int)encoderInputFrame->pitch, pEnc->GetEncodeWidth(), pEnc->GetEncodeHeight(), cuMemoryType, encoderInputFrame->bufferFormat, encoderInputFrame->chromaOffsets, encoderInputFrame->numChromaPlanes, false, cuda::StreamAccessor::getStream(stream)); } } void VideoWriterImpl::write(const InputArray frame) { CV_Assert(frame.channels() == nSrcChannels); CopyToNvSurface(frame); pEnc->EncodeFrame(vPacket); encoderCallback->onEncoded(vPacket); }; EncoderParams VideoWriterImpl::getEncoderParams() const { return encoderParams; }; Ptr createVideoWriter(const String& fileName, const Size frameSize, const Codec codec, const double fps, const ColorFormat colorFormat, Ptr encoderCallback, const Stream& stream) { return createVideoWriter(fileName, frameSize, codec, fps, colorFormat, EncoderParams(), encoderCallback, stream); } Ptr createVideoWriter(const String& fileName, const Size frameSize, const Codec codec, const double fps, const ColorFormat colorFormat, const EncoderParams& params, Ptr encoderCallback, const Stream& stream) { CV_Assert(params.idrPeriod >= params.gopLength); if (!encoderCallback) { // required until PR for raw video encapsulation is merged and windows dll is updated #ifndef WIN32 // remove #define and keep code once merged try { encoderCallback = new FFmpegVideoWriter(fileName, codec, fps, frameSize, params.idrPeriod); } catch (...) #endif { encoderCallback = new RawVideoWriter(fileName); } } return makePtr(encoderCallback, frameSize, codec, fps, colorFormat, params, stream); } #endif // !defined HAVE_NVCUVENC }}