// This file is part of OpenCV project. // It is subject to the license terms in the LICENSE file found in the top-level directory // of this distribution and at http://opencv.org/license.html #ifndef MFXHELPER_H #define MFXHELPER_H #include "opencv2/core.hpp" #include <iostream> #include <fstream> #include <sstream> #include <mfxcommon.h> #include <mfxstructures.h> #include <mfxvideo++.h> #include <mfxvp8.h> #include <mfxjpeg.h> #include <mfxplugin++.h> // // // Debug helpers // // // #if 0 # define DBG(i) i #else # define DBG(i) #endif #if 1 # define MSG(i) i #else # define MSG(i) #endif template <typename T> struct HexWrap { HexWrap(T val_) : val(val_) {} T val; }; template <typename T> inline std::ostream & operator<<(std::ostream &out, const HexWrap<T> &wrap) { std::ios_base::fmtflags flags = out.flags(std::ios::hex | std::ios::showbase); out << wrap.val; out.flags(flags); return out; } template <typename T> inline ::HexWrap<T> asHex(const T & val) { return ::HexWrap<T>(val); } struct FourCC { FourCC(uint val) : val32(val) {} FourCC(char a, char b, char c, char d) { val8[0] = a; val8[1] = b; val8[2] = c; val8[3] = d; } union { uint val32; int vali32; uchar val8[4]; }; }; inline std::ostream & operator<<(std::ostream &out, FourCC cc) { for (size_t i = 0; i < 4; out << cc.val8[i++]) {} out << " (" << asHex(cc.val32) << ")"; return out; } inline std::string mfxStatusToString(mfxStatus s) { switch (s) { case MFX_ERR_NONE: return "MFX_ERR_NONE"; case MFX_ERR_UNKNOWN: return "MFX_ERR_UNKNOWN"; case MFX_ERR_NULL_PTR: return "MFX_ERR_NULL_PTR"; case MFX_ERR_UNSUPPORTED: return "MFX_ERR_UNSUPPORTED"; case MFX_ERR_MEMORY_ALLOC: return "MFX_ERR_MEMORY_ALLOC"; case MFX_ERR_NOT_ENOUGH_BUFFER: return "MFX_ERR_NOT_ENOUGH_BUFFER"; case MFX_ERR_INVALID_HANDLE: return "MFX_ERR_INVALID_HANDLE"; case MFX_ERR_LOCK_MEMORY: return "MFX_ERR_LOCK_MEMORY"; case MFX_ERR_NOT_INITIALIZED: return "MFX_ERR_NOT_INITIALIZED"; case MFX_ERR_NOT_FOUND: return "MFX_ERR_NOT_FOUND"; case MFX_ERR_MORE_DATA: return "MFX_ERR_MORE_DATA"; case MFX_ERR_MORE_SURFACE: return "MFX_ERR_MORE_SURFACE"; case MFX_ERR_ABORTED: return "MFX_ERR_ABORTED"; case MFX_ERR_DEVICE_LOST: return "MFX_ERR_DEVICE_LOST"; case MFX_ERR_INCOMPATIBLE_VIDEO_PARAM: return "MFX_ERR_INCOMPATIBLE_VIDEO_PARAM"; case MFX_ERR_INVALID_VIDEO_PARAM: return "MFX_ERR_INVALID_VIDEO_PARAM"; case MFX_ERR_UNDEFINED_BEHAVIOR: return "MFX_ERR_UNDEFINED_BEHAVIOR"; case MFX_ERR_DEVICE_FAILED: return "MFX_ERR_DEVICE_FAILED"; case MFX_ERR_MORE_BITSTREAM: return "MFX_ERR_MORE_BITSTREAM"; case MFX_ERR_INCOMPATIBLE_AUDIO_PARAM: return "MFX_ERR_INCOMPATIBLE_AUDIO_PARAM"; case MFX_ERR_INVALID_AUDIO_PARAM: return "MFX_ERR_INVALID_AUDIO_PARAM"; case MFX_ERR_GPU_HANG: return "MFX_ERR_GPU_HANG"; case MFX_ERR_REALLOC_SURFACE: return "MFX_ERR_REALLOC_SURFACE"; case MFX_WRN_IN_EXECUTION: return "MFX_WRN_IN_EXECUTION"; case MFX_WRN_DEVICE_BUSY: return "MFX_WRN_DEVICE_BUSY"; case MFX_WRN_VIDEO_PARAM_CHANGED: return "MFX_WRN_VIDEO_PARAM_CHANGED"; case MFX_WRN_PARTIAL_ACCELERATION: return "MFX_WRN_PARTIAL_ACCELERATION"; case MFX_WRN_INCOMPATIBLE_VIDEO_PARAM: return "MFX_WRN_INCOMPATIBLE_VIDEO_PARAM"; case MFX_WRN_VALUE_NOT_CHANGED: return "MFX_WRN_VALUE_NOT_CHANGED"; case MFX_WRN_OUT_OF_RANGE: return "MFX_WRN_OUT_OF_RANGE"; case MFX_WRN_FILTER_SKIPPED: return "MFX_WRN_FILTER_SKIPPED"; case MFX_WRN_INCOMPATIBLE_AUDIO_PARAM: return "MFX_WRN_INCOMPATIBLE_AUDIO_PARAM"; default: return "<Invalid mfxStatus>"; } } inline std::ostream & operator<<(std::ostream &out, mfxStatus s) { out << mfxStatusToString(s) << " (" << (int)s << ")"; return out; } inline std::ostream & operator<<(std::ostream &out, const mfxInfoMFX &info) { out << "InfoMFX:" << std::endl << "| Codec: " << FourCC(info.CodecId) << " / " << info.CodecProfile << " / " << info.CodecLevel << std::endl << "| DecodedOrder: " << info.DecodedOrder << std::endl << "| TimeStampCalc: " << info.TimeStampCalc << std::endl ; return out; } inline std::ostream & operator<<(std::ostream & out, const mfxFrameInfo & info) { out << "FrameInfo: " << std::endl << "| FourCC: " << FourCC(info.FourCC) << std::endl << "| Size: " << info.Width << "x" << info.Height << std::endl << "| ROI: " << "(" << info.CropX << ";" << info.CropY << ") " << info.CropW << "x" << info.CropH << std::endl << "| BitDepth(L/C): " << info.BitDepthLuma << " / " << info.BitDepthChroma << std::endl << "| Shift: " << info.Shift << std::endl << "| TemporalID: " << info.FrameId.TemporalId << std::endl << "| FrameRate: " << info.FrameRateExtN << "/" << info.FrameRateExtD << std::endl << "| AspectRatio: " << info.AspectRatioW << "x" << info.AspectRatioH << std::endl << "| PicStruct: " << info.PicStruct << std::endl << "| ChromaFormat: " << info.ChromaFormat << std::endl ; return out; } inline std::ostream & operator<<(std::ostream &out, const mfxFrameData &data) { out << "FrameData:" << std::endl << "| NumExtParam: " << data.NumExtParam << std::endl << "| MemType: " << data.MemType << std::endl << "| PitchHigh: " << data.PitchHigh << std::endl << "| TimeStamp: " << data.TimeStamp << std::endl << "| FrameOrder: " << data.FrameOrder << std::endl << "| Locked: " << data.Locked << std::endl << "| Pitch: " << data.PitchHigh << ", " << data.PitchLow << std::endl << "| Y: " << (void*)data.Y << std::endl << "| U: " << (void*)data.U << std::endl << "| V: " << (void*)data.V << std::endl ; return out; } //================================================================================================== static const int CC_MPG2 = FourCC('M', 'P', 'G', '2').vali32; static const int CC_H264 = FourCC('H', '2', '6', '4').vali32; static const int CC_X264 = FourCC('X', '2', '6', '4').vali32; static const int CC_AVC = FourCC('A', 'V', 'C', ' ').vali32; static const int CC_H265 = FourCC('H', '2', '6', '5').vali32; static const int CC_HEVC = FourCC('H', 'E', 'V', 'C').vali32; static const int CC_VC1 = FourCC('V', 'C', '1', ' ').vali32; //================================================================================================== template <typename T> inline void cleanup(T * &ptr) { if (ptr) { delete ptr; ptr = 0; } } //================================================================================================== struct Plugin { public: static Plugin * loadEncoderPlugin(MFXVideoSession &session, mfxU32 codecId) { static const mfxPluginUID hevc_enc_uid = { 0x6f, 0xad, 0xc7, 0x91, 0xa0, 0xc2, 0xeb, 0x47, 0x9a, 0xb6, 0xdc, 0xd5, 0xea, 0x9d, 0xa3, 0x47 }; if (codecId == MFX_CODEC_HEVC) return new Plugin(session, hevc_enc_uid); return 0; } static Plugin * loadDecoderPlugin(MFXVideoSession &session, mfxU32 codecId) { static const mfxPluginUID hevc_dec_uid = { 0x33, 0xa6, 0x1c, 0x0b, 0x4c, 0x27, 0x45, 0x4c, 0xa8, 0xd8, 0x5d, 0xde, 0x75, 0x7c, 0x6f, 0x8e }; if (codecId == MFX_CODEC_HEVC) return new Plugin(session, hevc_dec_uid); return 0; } ~Plugin() { if (isGood()) MFXVideoUSER_UnLoad(session, &uid); } bool isGood() const { return res >= MFX_ERR_NONE; } private: MFXVideoSession &session; mfxPluginUID uid; mfxStatus res; private: Plugin(MFXVideoSession &_session, mfxPluginUID _uid) : session(_session), uid(_uid) { res = MFXVideoUSER_Load(session, &uid, 1); } Plugin(const Plugin &); Plugin &operator=(const Plugin &); }; //================================================================================================== struct ReadBitstream { public: ReadBitstream(const char * filename, size_t maxSize = 10 * 1024 * 1024); ~ReadBitstream(); bool isOpened() const; bool isDone() const; bool read(); private: ReadBitstream(const ReadBitstream &); ReadBitstream &operator=(const ReadBitstream &); public: std::fstream input; mfxBitstream stream; bool drain; }; //================================================================================================== struct WriteBitstream { public: WriteBitstream(const char * filename, size_t maxSize); ~WriteBitstream(); bool write(); bool isOpened() const; private: WriteBitstream(const WriteBitstream &); WriteBitstream &operator=(const WriteBitstream &); public: std::fstream output; mfxBitstream stream; }; //================================================================================================== class SurfacePool { public: SurfacePool(ushort width_, ushort height_, ushort count, const mfxFrameInfo & frameInfo, uchar bpp = 12); ~SurfacePool(); mfxFrameSurface1 *getFreeSurface(); template <typename T> static SurfacePool * create(T * instance, mfxVideoParam ¶ms) { CV_Assert(instance); mfxFrameAllocRequest request; memset(&request, 0, sizeof(request)); mfxStatus res = instance->QueryIOSurf(¶ms, &request); DBG(std::cout << "MFX QueryIOSurf: " << res << std::endl); if (res < MFX_ERR_NONE) return 0; return new SurfacePool(request.Info.Width, request.Info.Height, request.NumFrameSuggested, params.mfx.FrameInfo); } private: SurfacePool(const SurfacePool &); SurfacePool &operator=(const SurfacePool &); public: ushort width, height; size_t oneSize; cv::AutoBuffer<uchar, 0> buffers; std::vector<mfxFrameSurface1> surfaces; }; //================================================================================================== class DeviceHandler { public: virtual ~DeviceHandler() {} bool init(MFXVideoSession &session); protected: virtual bool initDeviceSession(MFXVideoSession &session) = 0; }; // Linux specific #include <va/va_drm.h> class VAHandle : public DeviceHandler { public: VAHandle(); ~VAHandle(); private: VAHandle(const VAHandle &); VAHandle &operator=(const VAHandle &); virtual bool initDeviceSession(MFXVideoSession &session); private: VADisplay display; int file; }; // TODO: Windows specific #endif // MFXHELPER_H