/* The copyright in this software is being made available under the BSD * License, included below. This software may be subject to other third party * and contributor rights, including patent rights, and no such rights are * granted under this license. * * Copyright (c) 2010-2013, ITU/ISO/IEC * All rights reserved. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions are met: * * * Redistributions of source code must retain the above copyright notice, * this list of conditions and the following disclaimer. * * Redistributions in binary form must reproduce the above copyright notice, * this list of conditions and the following disclaimer in the documentation * and/or other materials provided with the distribution. * * Neither the name of the ITU/ISO/IEC nor the names of its contributors may * be used to endorse or promote products derived from this software without * specific prior written permission. * * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF * THE POSSIBILITY OF SUCH DAMAGE. */ /** \file TAppEncCfg.h \brief Handle encoder configuration parameters (header) */ #ifndef __TAPPENCCFG__ #define __TAPPENCCFG__ #include "TLibCommon/CommonDef.h" #include "TLibEncoder/TEncCfg.h" #include #if H_3D #include "TAppCommon/TAppComCamPara.h" #include "TLibRenderer/TRenModel.h" #include "TLibRenderer/TRenModSetupStrParser.h" #endif //! \ingroup TAppEncoder //! \{ // ==================================================================================================================== // Class definition // ==================================================================================================================== /// encoder configuration class class TAppEncCfg { protected: // file I/O #if H_MV std::vector m_pchInputFileList; ///< source file names #else Char* m_pchInputFile; ///< source file name #endif Char* m_pchBitstreamFile; ///< output bitstream file #if H_MV std::vector m_pchReconFileList; ///< output reconstruction file names Int m_numberOfLayers; ///< number of Layers to Encode #if H_3D Int m_iNumberOfViews; ///< number of Layers that are views #endif #else Char* m_pchReconFile; ///< output reconstruction file #endif #if H_MV // VPS specification std::vector< std::vector > m_dimIds; ///< dimension ids ( pointers to m_viewId and m_depthFlag std::vector m_viewId; ///< view id #if H_3D std::vector m_depthFlag; ///< depth flag #endif std::vector m_layerIdInNuh; ///< layer Id in Nuh for each layer Bool m_splittingFlag; ///< Splitting Flag Int m_scalabilityMask; ///< Mask indicating scalabilities, 1: texture; 3: texture + depth std::vector m_dimensionIdLen; ///< Length of scalability dimension s // layer sets Int m_vpsNumLayerSets; ///< Number of layer sets std::vector< std::vector > m_layerIdsInSets; ///< LayerIds in vps of layer set Bool m_defaultOneTargetOutputLayerFlag; ///< Output highest layer of layer sets by default std::vector m_outputLayerSetIdx; ///< Indices of layer sets used as additional output layer sets std::vector< std::vector > m_layerIdsInAddOutputLayerSet; ///< LayerIds in vps of additional output layers std::vector m_profileLevelTierIdx; ///< Indices of of profile level tier // Dependencies std::vector< std::vector > m_directRefLayers; ///< LayerIds of direct reference layers std::vector< std::vector > m_dependencyTypes; ///< Dependency types of direct reference layers #if H_3D_IV_MERGE Bool m_ivMvPredFlag; ///< Interview motion vector prediction #endif #if H_3D_ARP /// < flag and number of weighting factors in ARP UInt m_uiUseAdvResPred; UInt m_uiARPStepNum; #endif #if H_3D_IC vector m_abUseIC; ///< flag for using illumination compensation for inter-view prediction #endif #if H_3D_NBDV_REF Bool m_depthRefinementFlag; #endif #if H_3D_VSP Bool m_viewSynthesisPredFlag; #endif #if H_3D_TMVP Bool m_ivMvScalingFlag; #endif #endif Double m_adLambdaModifier[ MAX_TLAYER ]; ///< Lambda modifier array for each temporal layer // source specification Int m_iFrameRate; ///< source frame-rates (Hz) UInt m_FrameSkip; ///< number of skipped frames from the beginning Int m_iSourceWidth; ///< source width in pixel Int m_iSourceHeight; ///< source height in pixel Int m_conformanceMode; Int m_confLeft; Int m_confRight; Int m_confTop; Int m_confBottom; Int m_framesToBeEncoded; ///< number of encoded frames Int m_aiPad[2]; ///< number of padded pixels for width and height // profile/level Profile::Name m_profile; Level::Tier m_levelTier; Level::Name m_level; Bool m_progressiveSourceFlag; Bool m_interlacedSourceFlag; Bool m_nonPackedConstraintFlag; Bool m_frameOnlyConstraintFlag; // coding structure Int m_iIntraPeriod; ///< period of I-slice (random access period) Int m_iDecodingRefreshType; ///< random access type Int m_iGOPSize; ///< GOP size of hierarchical structure #if H_MV Int m_extraRPSsMvc[MAX_NUM_LAYERS]; ///< extra RPSs added to handle CRA for each layer std::vector< GOPEntry* > m_GOPListMvc; ///< the coding structure entries from the config file for each layer Int m_numReorderPicsMvc[MAX_NUM_LAYERS][MAX_TLAYER]; ///< total number of reorder pictures for each layer Int m_maxDecPicBufferingMvc[MAX_NUM_LAYERS][MAX_TLAYER]; ///< total number of reference pictures needed for decoding for each layer #else Int m_extraRPSs; ///< extra RPSs added to handle CRA GOPEntry m_GOPList[MAX_GOP]; ///< the coding structure entries from the config file Int m_numReorderPics[MAX_TLAYER]; ///< total number of reorder pictures Int m_maxDecPicBuffering[MAX_TLAYER]; ///< total number of pictures in the decoded picture buffer #endif Bool m_useTransformSkip; ///< flag for enabling intra transform skipping Bool m_useTransformSkipFast; ///< flag for enabling fast intra transform skipping Bool m_enableAMP; // coding quality #if H_MV std::vector m_fQP; ///< QP value of key-picture (floating point) for each layer std::vector m_iQP; ///< QP value of key-picture (integer) for each layer #else Double m_fQP; ///< QP value of key-picture (floating point) Int m_iQP; ///< QP value of key-picture (integer) #endif Char* m_pchdQPFile; ///< QP offset for each slice (initialized from external file) #if H_MV std::vector m_aidQP; ///< array of slice QP values for each layer #else Int* m_aidQP; ///< array of slice QP values #endif Int m_iMaxDeltaQP; ///< max. |delta QP| UInt m_uiDeltaQpRD; ///< dQP range for multi-pass slice QP optimization Int m_iMaxCuDQPDepth; ///< Max. depth for a minimum CuDQPSize (0:default) Int m_cbQpOffset; ///< Chroma Cb QP Offset (0:default) Int m_crQpOffset; ///< Chroma Cr QP Offset (0:default) #if ADAPTIVE_QP_SELECTION Bool m_bUseAdaptQpSelect; #endif Bool m_bUseAdaptiveQP; ///< Flag for enabling QP adaptation based on a psycho-visual model Int m_iQPAdaptationRange; ///< dQP range by QP adaptation #if H_MV Int m_maxTempLayerMvc[MAX_NUM_LAYER_IDS]; ///< Max temporal layer for each layer #else Int m_maxTempLayer; ///< Max temporal layer #endif // coding unit (CU) definition UInt m_uiMaxCUWidth; ///< max. CU width in pixel UInt m_uiMaxCUHeight; ///< max. CU height in pixel UInt m_uiMaxCUDepth; ///< max. CU depth // transfom unit (TU) definition UInt m_uiQuadtreeTULog2MaxSize; UInt m_uiQuadtreeTULog2MinSize; UInt m_uiQuadtreeTUMaxDepthInter; UInt m_uiQuadtreeTUMaxDepthIntra; // coding tools (bit-depth) Int m_inputBitDepthY; ///< bit-depth of input file (luma component) Int m_inputBitDepthC; ///< bit-depth of input file (chroma component) Int m_outputBitDepthY; ///< bit-depth of output file (luma component) Int m_outputBitDepthC; ///< bit-depth of output file (chroma component) Int m_internalBitDepthY; ///< bit-depth codec operates at in luma (input/output files will be converted) Int m_internalBitDepthC; ///< bit-depth codec operates at in chroma (input/output files will be converted) // coding tools (PCM bit-depth) Bool m_bPCMInputBitDepthFlag; ///< 0: PCM bit-depth is internal bit-depth. 1: PCM bit-depth is input bit-depth. // coding tool (lossless) Bool m_useLossless; ///< flag for using lossless coding #if H_MV std::vector m_bUseSAO; #else Bool m_bUseSAO; #endif Int m_maxNumOffsetsPerPic; ///< SAO maximun number of offset per picture Bool m_saoLcuBoundary; ///< SAO parameter estimation using non-deblocked pixels for LCU bottom and right boundary areas Bool m_saoLcuBasedOptimization; ///< SAO LCU-based optimization // coding tools (loop filter) #if H_MV std::vector m_bLoopFilterDisable; ///< flag for using deblocking filter for each layer #else Bool m_bLoopFilterDisable; ///< flag for using deblocking filter #endif Bool m_loopFilterOffsetInPPS; ///< offset for deblocking filter in 0 = slice header, 1 = PPS Int m_loopFilterBetaOffsetDiv2; ///< beta offset for deblocking filter Int m_loopFilterTcOffsetDiv2; ///< tc offset for deblocking filter Bool m_DeblockingFilterControlPresent; ///< deblocking filter control present flag in PPS Bool m_DeblockingFilterMetric; ///< blockiness metric in encoder // coding tools (PCM) Bool m_usePCM; ///< flag for using IPCM UInt m_pcmLog2MaxSize; ///< log2 of maximum PCM block size UInt m_uiPCMLog2MinSize; ///< log2 of minimum PCM block size Bool m_bPCMFilterDisableFlag; ///< PCM filter disable flag // coding tools (encoder-only parameters) Bool m_bUseSBACRD; ///< flag for using RD optimization based on SBAC Bool m_bUseASR; ///< flag for using adaptive motion search range Bool m_bUseHADME; ///< flag for using HAD in sub-pel ME Bool m_useRDOQ; ///< flag for using RD optimized quantization Bool m_useRDOQTS; ///< flag for using RD optimized quantization for transform skip Int m_rdPenalty; ///< RD-penalty for 32x32 TU for intra in non-intra slices (0: no RD-penalty, 1: RD-penalty, 2: maximum RD-penalty) Int m_iFastSearch; ///< ME mode, 0 = full, 1 = diamond, 2 = PMVFAST Int m_iSearchRange; ///< ME search range Int m_bipredSearchRange; ///< ME search range for bipred refinement Bool m_bUseFastEnc; ///< flag for using fast encoder setting Bool m_bUseEarlyCU; ///< flag for using Early CU setting Bool m_useFastDecisionForMerge; ///< flag for using Fast Decision Merge RD-Cost Bool m_bUseCbfFastMode; ///< flag for using Cbf Fast PU Mode Decision Bool m_useEarlySkipDetection; ///< flag for using Early SKIP Detection Int m_sliceMode; ///< 0: no slice limits, 1 : max number of CTBs per slice, 2: max number of bytes per slice, ///< 3: max number of tiles per slice Int m_sliceArgument; ///< argument according to selected slice mode Int m_sliceSegmentMode; ///< 0: no slice segment limits, 1 : max number of CTBs per slice segment, 2: max number of bytes per slice segment, ///< 3: max number of tiles per slice segment Int m_sliceSegmentArgument; ///< argument according to selected slice segment mode Bool m_bLFCrossSliceBoundaryFlag; ///< 1: filter across slice boundaries 0: do not filter across slice boundaries Bool m_bLFCrossTileBoundaryFlag; ///< 1: filter across tile boundaries 0: do not filter across tile boundaries Int m_iUniformSpacingIdr; Int m_iNumColumnsMinus1; Char* m_pchColumnWidth; Int m_iNumRowsMinus1; Char* m_pchRowHeight; UInt* m_pColumnWidth; UInt* m_pRowHeight; Int m_iWaveFrontSynchro; //< 0: no WPP. >= 1: WPP is enabled, the "Top right" from which inheritance occurs is this LCU offset in the line above the current. Int m_iWaveFrontSubstreams; //< If iWaveFrontSynchro, this is the number of substreams per frame (dependent tiles) or per tile (independent tiles). Bool m_bUseConstrainedIntraPred; ///< flag for using constrained intra prediction Int m_decodedPictureHashSEIEnabled; ///< Checksum(3)/CRC(2)/MD5(1)/disable(0) acting on decoded picture hash SEI message Int m_recoveryPointSEIEnabled; Int m_bufferingPeriodSEIEnabled; Int m_pictureTimingSEIEnabled; Bool m_toneMappingInfoSEIEnabled; Int m_toneMapId; Bool m_toneMapCancelFlag; Bool m_toneMapPersistenceFlag; Int m_toneMapCodedDataBitDepth; Int m_toneMapTargetBitDepth; Int m_toneMapModelId; Int m_toneMapMinValue; Int m_toneMapMaxValue; Int m_sigmoidMidpoint; Int m_sigmoidWidth; Int m_numPivots; Int m_cameraIsoSpeedIdc; Int m_cameraIsoSpeedValue; Int m_exposureCompensationValueSignFlag; Int m_exposureCompensationValueNumerator; Int m_exposureCompensationValueDenomIdc; Int m_refScreenLuminanceWhite; Int m_extendedRangeWhiteLevel; Int m_nominalBlackLevelLumaCodeValue; Int m_nominalWhiteLevelLumaCodeValue; Int m_extendedWhiteLevelLumaCodeValue; Int* m_startOfCodedInterval; Int* m_codedPivotValue; Int* m_targetPivotValue; Int m_framePackingSEIEnabled; Int m_framePackingSEIType; Int m_framePackingSEIId; Int m_framePackingSEIQuincunx; Int m_framePackingSEIInterpretation; Int m_displayOrientationSEIAngle; Int m_temporalLevel0IndexSEIEnabled; Int m_gradualDecodingRefreshInfoEnabled; Int m_decodingUnitInfoSEIEnabled; Int m_SOPDescriptionSEIEnabled; Int m_scalableNestingSEIEnabled; // weighted prediction Bool m_useWeightedPred; ///< Use of weighted prediction in P slices Bool m_useWeightedBiPred; ///< Use of bi-directional weighted prediction in B slices UInt m_log2ParallelMergeLevel; ///< Parallel merge estimation region UInt m_maxNumMergeCand; ///< Max number of merge candidates Int m_TMVPModeId; Int m_signHideFlag; #if RATE_CONTROL_LAMBDA_DOMAIN Bool m_RCEnableRateControl; ///< enable rate control or not Int m_RCTargetBitrate; ///< target bitrate when rate control is enabled #if M0036_RC_IMPROVEMENT Int m_RCKeepHierarchicalBit; ///< 0: equal bit allocation; 1: fixed ratio bit allocation; 2: adaptive ratio bit allocation #else Bool m_RCKeepHierarchicalBit; ///< whether keeping hierarchical bit allocation structure or not #endif Bool m_RCLCULevelRC; ///< true: LCU level rate control; false: picture level rate control Bool m_RCUseLCUSeparateModel; ///< use separate R-lambda model at LCU level Int m_RCInitialQP; ///< inital QP for rate control Bool m_RCForceIntraQP; ///< force all intra picture to use initial QP or not #else Bool m_enableRateCtrl; ///< Flag for using rate control algorithm Int m_targetBitrate; ///< target bitrate Int m_numLCUInUnit; ///< Total number of LCUs in a frame should be completely divided by the NumLCUInUnit #endif Int m_useScalingListId; ///< using quantization matrix Char* m_scalingListFile; ///< quantization matrix file name Bool m_TransquantBypassEnableFlag; ///< transquant_bypass_enable_flag setting in PPS. Bool m_CUTransquantBypassFlagValue; ///< if transquant_bypass_enable_flag, the fixed value to use for the per-CU cu_transquant_bypass_flag. Bool m_recalculateQPAccordingToLambda; ///< recalculate QP value according to the lambda value Bool m_useStrongIntraSmoothing; ///< enable strong intra smoothing for 32x32 blocks where the reference samples are flat Int m_activeParameterSetsSEIEnabled; Bool m_vuiParametersPresentFlag; ///< enable generation of VUI parameters Bool m_aspectRatioInfoPresentFlag; ///< Signals whether aspect_ratio_idc is present Int m_aspectRatioIdc; ///< aspect_ratio_idc Int m_sarWidth; ///< horizontal size of the sample aspect ratio Int m_sarHeight; ///< vertical size of the sample aspect ratio Bool m_overscanInfoPresentFlag; ///< Signals whether overscan_appropriate_flag is present Bool m_overscanAppropriateFlag; ///< Indicates whether conformant decoded pictures are suitable for display using overscan Bool m_videoSignalTypePresentFlag; ///< Signals whether video_format, video_full_range_flag, and colour_description_present_flag are present Int m_videoFormat; ///< Indicates representation of pictures Bool m_videoFullRangeFlag; ///< Indicates the black level and range of luma and chroma signals Bool m_colourDescriptionPresentFlag; ///< Signals whether colour_primaries, transfer_characteristics and matrix_coefficients are present Int m_colourPrimaries; ///< Indicates chromaticity coordinates of the source primaries Int m_transferCharacteristics; ///< Indicates the opto-electronic transfer characteristics of the source Int m_matrixCoefficients; ///< Describes the matrix coefficients used in deriving luma and chroma from RGB primaries Bool m_chromaLocInfoPresentFlag; ///< Signals whether chroma_sample_loc_type_top_field and chroma_sample_loc_type_bottom_field are present Int m_chromaSampleLocTypeTopField; ///< Specifies the location of chroma samples for top field Int m_chromaSampleLocTypeBottomField; ///< Specifies the location of chroma samples for bottom field Bool m_neutralChromaIndicationFlag; ///< Indicates that the value of all decoded chroma samples is equal to 1<<(BitDepthCr-1) Bool m_defaultDisplayWindowFlag; ///< Indicates the presence of the default window parameters Int m_defDispWinLeftOffset; ///< Specifies the left offset from the conformance window of the default window Int m_defDispWinRightOffset; ///< Specifies the right offset from the conformance window of the default window Int m_defDispWinTopOffset; ///< Specifies the top offset from the conformance window of the default window Int m_defDispWinBottomOffset; ///< Specifies the bottom offset from the conformance window of the default window Bool m_frameFieldInfoPresentFlag; ///< Indicates that pic_struct values are present in picture timing SEI messages Bool m_pocProportionalToTimingFlag; ///< Indicates that the POC value is proportional to the output time w.r.t. first picture in CVS Int m_numTicksPocDiffOneMinus1; ///< Number of ticks minus 1 that for a POC difference of one Bool m_bitstreamRestrictionFlag; ///< Signals whether bitstream restriction parameters are present Bool m_tilesFixedStructureFlag; ///< Indicates that each active picture parameter set has the same values of the syntax elements related to tiles Bool m_motionVectorsOverPicBoundariesFlag; ///< Indicates that no samples outside the picture boundaries are used for inter prediction Int m_minSpatialSegmentationIdc; ///< Indicates the maximum size of the spatial segments in the pictures in the coded video sequence Int m_maxBytesPerPicDenom; ///< Indicates a number of bytes not exceeded by the sum of the sizes of the VCL NAL units associated with any coded picture Int m_maxBitsPerMinCuDenom; ///< Indicates an upper bound for the number of bits of coding_unit() data Int m_log2MaxMvLengthHorizontal; ///< Indicate the maximum absolute value of a decoded horizontal MV component in quarter-pel luma units Int m_log2MaxMvLengthVertical; ///< Indicate the maximum absolute value of a decoded vertical MV component in quarter-pel luma units #if H_3D // Camera parameters Char* m_pchCameraParameterFile; ///< camera parameter file Char* m_pchBaseViewCameraNumbers; TAppComCamPara m_cCameraData; Int m_iCodedCamParPrecision; ///< precision for coding of camera parameters #if H_3D_VSO Char* m_pchVSOConfig; Bool m_bUseVSO; ///< flag for using View Synthesis Optimization Bool m_bVSOLSTable; ///< Depth QP dependent Lagrange parameter optimization (m23714) Bool m_bVSOEarlySkip; ///< Early skip of VSO computation (JCT3V-A0093 modification 4) //// Used for development by GT, might be removed later Double m_dLambdaScaleVSO; ///< Scaling factor for Lambda in VSO mode Bool m_bForceLambdaScaleVSO; ///< Use Lambda Scale for depth even if VSO is turned off Bool m_bAllowNegDist; ///< Allow negative distortion in VSO UInt m_uiVSOMode; ///< Number of VSO Mode, 1 = , 2 = simple, org vs. ren, 3 = simple, ren vs. ren, 4 = full // SAIT_VSO_EST_A0033 Bool m_bUseEstimatedVSD; ///< Flag for using model based VSD estimation instead of VSO for some encoder decisions (JCT3V-A0033 modification 3) // LGE_WVSO_A0119 Bool m_bUseWVSO; ///< flag for using View Synthesis Optimization Int m_iVSOWeight; Int m_iVSDWeight; Int m_iDWeight; // Ren Model String TRenModSetupStrParser m_cRenModStrParser; #endif #if H_3D_DIM Bool m_useDMM; ///< flag for using DMM Bool m_useRBC; ///< flag for using RBC Bool m_useSDC; ///< flag for using SDC Bool m_useDLT; ///< flag for using DLT #endif #if H_3D_QTLPC Bool m_bUseQTL; ///< flag for using depth QuadTree Limitation Bool m_bUsePC; ///< flag for using Predictive Coding with QTL #endif #endif // internal member functions Void xSetGlobal (); ///< set global variables Void xCheckParameter (); ///< check validity of configuration values Void xPrintParameter (); ///< print configuration values Void xPrintUsage (); ///< print usage #if H_MV template Void xResizeVector( std::vector & rpcVector ) { for( Int layer = 0; rpcVector.size() < m_numberOfLayers; layer++ ) { assert( rpcVector.size() > 0 ); rpcVector.push_back( rpcVector[layer] ); } for( ; rpcVector.size() > m_numberOfLayers; ) { rpcVector.pop_back( ); } } template Void xPrintParaVector( std::string description, std::vector & rpcVector ) { Int iSpace = max(1, ENC_CFG_CONSOUT_SPACE - (Int) description.length() ); for ( Int i = 0; i < iSpace; i++ ) description.append( " " ); description.append( ":" ); printf( "%s", description.c_str() ); for(Int i=0;i