source: 3DVCSoftware/branches/0.2-poznan-univ/source/App/TAppEncoder/TAppEncCfg.h @ 21

Last change on this file since 21 was 12, checked in by poznan-univ, 13 years ago

Poznan Tools

  • Depth base motion vector prediction
  • Property svn:eol-style set to native
File size: 14.9 KB
Line 
1/* The copyright in this software is being made available under the BSD
2 * License, included below. This software may be subject to other third party
3 * and contributor rights, including patent rights, and no such rights are
4 * granted under this license.
5 *
6 * Copyright (c) 2010-2011, ISO/IEC
7 * All rights reserved.
8 *
9 * Redistribution and use in source and binary forms, with or without
10 * modification, are permitted provided that the following conditions are met:
11 *
12 *  * Redistributions of source code must retain the above copyright notice,
13 *    this list of conditions and the following disclaimer.
14 *  * Redistributions in binary form must reproduce the above copyright notice,
15 *    this list of conditions and the following disclaimer in the documentation
16 *    and/or other materials provided with the distribution.
17 *  * Neither the name of the ISO/IEC nor the names of its contributors may
18 *    be used to endorse or promote products derived from this software without
19 *    specific prior written permission.
20 *
21 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
22 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS
25 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
28 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
29 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
30 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
31 * THE POSSIBILITY OF SUCH DAMAGE.
32 */
33
34
35
36/** \file     TAppEncCfg.h
37    \brief    Handle encoder configuration parameters (header)
38*/
39
40#ifndef __TAPPENCCFG__
41#define __TAPPENCCFG__
42
43#include "../../Lib/TLibCommon/CommonDef.h"
44#include "../../Lib/TLibCommon/TComMVDRefData.h"
45#include "../../App/TAppCommon/TAppComCamPara.h"
46#include "../../Lib/TLibRenderer/TRenTop.h"
47#include "../../Lib/TLibRenderer/TRenModel.h"
48#include "../../Lib/TLibRenderer/TRenModSetupStrParser.h"
49
50#include <string>
51#include <vector>
52
53// ====================================================================================================================
54// Class definition
55// ====================================================================================================================
56
57/// encoder configuration class
58class TAppEncCfg
59{
60protected:
61  // file I/O
62  char*     m_pchBitstreamFile;                               ///< output bitstream file
63
64  std::vector<char*>     m_pchInputFileList;                  ///< source file names
65  std::vector<char*>     m_pchDepthInputFileList;             ///< source depth file names
66  std::vector<char*>     m_pchReconFileList;                  ///< output reconstruction file names
67  std::vector<char*>     m_pchDepthReconFileList;             ///< output depth reconstruction file names
68
69  std::vector<char*>     m_pchERRefFileList;                  ///< virtual external reference view files names
70
71  // source specification
72  Int       m_iFrameRate;                                     ///< source frame-rates (Hz)
73  unsigned int m_FrameSkip;                                   ///< number of skipped frames from the beginning
74  Int       m_iSourceWidth;                                   ///< source width in pixel
75  Int       m_iSourceHeight;                                  ///< source height in pixel
76  Int       m_iFrameToBeEncoded;                              ///< number of encoded frames
77  Bool      m_bUsePAD;                                        ///< flag for using source padding
78  Int       m_aiPad[2];                                       ///< number of padded pixels for width and height
79
80  Int       m_iNumberOfViews;                                ///< number Views to Encode
81  Bool      m_bUsingDepthMaps ;
82
83
84  // coding structure
85#if DCM_DECODING_REFRESH
86  Int       m_iDecodingRefreshType;                           ///< random access type
87#endif
88  UInt      m_uiCodedPictureStoreSize ;
89  Int       m_iGOPSize;                                       ///< GOP size of hierarchical structure
90  Int       m_iRateGOPSize;                                   ///< GOP size for QP variance
91#if !HHI_NO_LowDelayCoding
92  Bool      m_bUseLDC;                                        ///< flag for using low-delay coding mode
93#endif
94#if DCM_COMB_LIST
95  Bool      m_bUseLComb;                                      ///< flag for using combined reference list for uni-prediction in B-slices (JCTVC-D421)
96  Bool      m_bLCMod;                                         ///< flag for specifying whether the combined reference list for uni-prediction in B-slices is uploaded explicitly
97#endif
98  std::string     m_cInputFormatString ;                            // GOP string
99  // coding quality
100
101  std::vector<Double>  m_adQP;                                ///< QP value of key-picture (floating point) [0] video, [1] depth
102  std::vector<Int>     m_aiQP;                                ///< QP value of key-picture (integer)
103
104  Int       m_aiTLayerQPOffset[MAX_TLAYER];                   ///< QP offset corresponding to temporal layer depth
105  char*     m_pchdQPFile;                                     ///< QP offset for each slice (initialized from external file)
106  Int*      m_aidQP;                                          ///< array of slice QP values
107  Int       m_iMaxDeltaQP;                                    ///< max. |delta QP|
108  UInt      m_uiDeltaQpRD;                                    ///< dQP range for multi-pass slice QP optimization
109
110  // coding unit (CU) definition
111  UInt      m_uiMaxCUWidth;                                   ///< max. CU width in pixel
112  UInt      m_uiMaxCUHeight;                                  ///< max. CU height in pixel
113  UInt      m_uiMaxCUDepth;                                   ///< max. CU depth
114
115  // transfom unit (TU) definition
116  UInt      m_uiQuadtreeTULog2MaxSize;
117  UInt      m_uiQuadtreeTULog2MinSize;
118
119  UInt      m_uiQuadtreeTUMaxDepthInter;
120  UInt      m_uiQuadtreeTUMaxDepthIntra;
121
122  // coding tools (bit-depth)
123  UInt      m_uiInputBitDepth;                                ///< bit-depth of input file
124  UInt      m_uiOutputBitDepth;                               ///< bit-depth of output file
125#ifdef ENABLE_IBDI
126  UInt      m_uiBitIncrement;                                 ///< bit-depth increment
127#endif
128  UInt      m_uiInternalBitDepth;                             ///< Internal bit-depth (BitDepth+BitIncrement)
129
130#if MTK_SAO
131  vector<Bool> m_abUseSAO;
132#endif
133
134  // coding tools (loop filter)
135  vector<Bool> m_abUseALF;                                    ///< flag for using adaptive loop filter [0] - video, [1] - depth
136#ifdef MQT_ALF_NPASS
137  Int       m_iALFEncodePassReduction;                        ///< ALF encoding pass, 0 = original 16-pass, 1 = 1-pass, 2 = 2-pass
138#endif
139
140  vector<Bool> m_abLoopFilterDisable;                         ///< flag for using deblocking filter filter [0] - video, [1] - depth
141  Int       m_iLoopFilterAlphaC0Offset;                       ///< alpha offset for deblocking filter
142  Int       m_iLoopFilterBetaOffset;                          ///< beta offset for deblocking filter
143
144  // coding tools (entropy coder)
145  Int       m_iSymbolMode;                                    ///< entropy coder mode, 0 = VLC, 1 = CABAC
146
147  // coding tools (inter - merge motion partitions)
148  Bool      m_bUseMRG;                                        ///< SOPH: flag for using motion partition Merge Mode
149
150#if LM_CHROMA
151  Bool      m_bUseLMChroma;                                  ///< JL: Chroma intra prediction based on luma signal
152#endif
153
154#if HHI_RMP_SWITCH
155  Bool      m_bUseRMP;
156#endif
157
158  // coding tools (encoder-only parameters)
159  Bool      m_bUseSBACRD;                                     ///< flag for using RD optimization based on SBAC
160  Bool      m_bUseASR;                                        ///< flag for using adaptive motion search range
161  Bool      m_bUseHADME;                                      ///< flag for using HAD in sub-pel ME
162  vector<Bool> m_abUseRDOQ;                                   ///< flag for using RD optimized quantization [0]-video, [1]-depth
163  Int       m_iFastSearch;                                    ///< ME mode, 0 = full, 1 = diamond, 2 = PMVFAST
164  Int       m_iSearchRange;                                   ///< ME search range
165  Int       m_bipredSearchRange;                              ///< ME search range for bipred refinement
166  Bool      m_bUseFastEnc;                                    ///< flag for using fast encoder setting
167
168#if DEPTH_MAP_GENERATION
169  UInt      m_uiPredDepthMapGeneration;                       ///< using of (virtual) depth maps for texture coding
170#endif
171#if HHI_INTER_VIEW_MOTION_PRED
172  UInt      m_uiMultiviewMvPredMode;                          ///< usage of predictors for multi-view mv prediction
173  UInt      m_uiMultiviewMvRegMode;                           ///< regularization for multiview motion vectors
174  Double    m_dMultiviewMvRegLambdaScale;                     ///< lambda scale for multiview motion vectors regularization
175#endif
176#if HHI_INTER_VIEW_RESIDUAL_PRED
177  UInt      m_uiMultiviewResPredMode;                         ///< using multiview residual prediction
178#endif
179
180#if HHI_INTERVIEW_SKIP
181  UInt      m_uiInterViewSkip;                            ///< usage of interview skip mode ( do not transmit residual)
182#if HHI_INTERVIEW_SKIP_LAMBDA_SCALE
183  Double    m_dInterViewSkipLambdaScale;                 ///< lambda scale for interview skip
184#endif
185#endif
186
187  // camera parameter
188  Char*     m_pchCameraParameterFile;                         ///< camera parameter file
189  Char*     m_pchBaseViewCameraNumbers;
190  TAppComCamPara m_cCameraData;
191
192  Int       m_iCodedCamParPrecision;                          ///< precision for coding of camera parameters
193
194#if HHI_INTERVIEW_SKIP
195  TRenTop  m_cUsedPelsRenderer;                               ///< renderer for used pels map
196#endif
197
198#if HHI_VSO
199  Char*     m_pchVSOConfig;
200  Bool      m_bUseVSO;                                    ///< flag for using View Synthesis Optimization
201
202  //// Used for development by GT, might be removed later
203  Double    m_dLambdaScaleVSO;                            ///< Scaling factor for Lambda in VSO mode
204  Bool      m_bForceLambdaScaleVSO;                       ///< Use Lambda Scale for depth even if VSO is turned off
205#if HHI_VSO_DIST_INT
206  Bool      m_bAllowNegDist;                              ///< Allow negative distortion in VSO
207#endif
208  UInt      m_uiVSOMode;                                  ///< Number of VSO Mode, 1 = , 2 = simple, org vs. ren, 3 = simple, ren vs. ren, 4 = full
209  Int       m_iNumberOfExternalRefs;                      ///< number Virtual External Reference Views
210  std::vector< std::vector<Int> > m_aaiBaseViewRefInd;    ///< View numbers of Base View References
211  std::vector< std::vector<Int> > m_aaiERViewRefInd;      ///< View numbers of External ViewReferences
212  std::vector< std::vector<Int> > m_aaiERViewRefLutInd;   ///< Indices of LUTs used for External View References
213#endif
214
215  Int       m_iSliceMode;           ///< 0: Disable all Recon slice limits, 1 : Maximum number of largest coding units per slice, 2: Maximum number of bytes in a slice
216  Int       m_iSliceArgument;       ///< If m_iSliceMode==1, m_iSliceArgument=max. # of largest coding units. If m_iSliceMode==2, m_iSliceArgument=max. # of bytes.
217  Int       m_iEntropySliceMode;    ///< 0: Disable all entropy slice limits, 1 : Maximum number of largest coding units per slice, 2: Constraint based entropy slice
218  Int       m_iEntropySliceArgument;///< If m_iEntropySliceMode==1, m_iEntropySliceArgument=max. # of largest coding units. If m_iEntropySliceMode==2, m_iEntropySliceArgument=max. # of bins.
219
220#if MTK_NONCROSS_INLOOP_FILTER
221  Bool m_bLFCrossSliceBoundaryFlag;  ///< 0: Cross-slice-boundary in-loop filtering 1: non-cross-slice-boundary in-loop filtering
222#endif
223#ifdef ROUNDING_CONTROL_BIPRED
224  Bool m_useRoundingControlBipred;
225#endif
226#if CONSTRAINED_INTRA_PRED
227  Bool      m_bUseConstrainedIntraPred;                       ///< flag for using constrained intra prediction
228#endif
229#if HHI_DMM_WEDGE_INTRA || HHI_DMM_PRED_TEX
230  Bool      m_bUseDMM;
231#endif
232#if HHI_MPI
233  Bool      m_bUseMVI;  ///< flag for using Motion Vector Inheritance for depth map coding
234#endif
235
236  PicOrderCnt m_iQpChangeFrame;
237  Int         m_iQpChangeOffsetVideo;
238  Int         m_iQpChangeOffsetDepth;
239
240  bool m_pictureDigestEnabled; ///< enable(1)/disable(0) md5 computation and SEI signalling
241
242  //====== Weighted Prediction ========
243#ifdef WEIGHT_PRED
244  Bool                    m_bUseWeightPred;                   ///< Use of explicit Weighting Prediction for P_SLICE
245  UInt                    m_uiBiPredIdc;                      ///< Use of Bi-Directional Weighting Prediction (B_SLICE): explicit(1) or implicit(2)
246#endif
247
248  // internal member functions
249  Void  xSetGlobal      ();                                   ///< set global variables
250  Void  xCheckParameter ();                                   ///< check validity of configuration values
251  Void  xPrintParameter ();                                   ///< print configuration values
252  Void  xPrintUsage     ();                                   ///< print usage
253
254  Void  xCleanUpVectors ();                                   ///< clean up vector sizes
255  Void  xInitCameraPars ();                                   ///< init camera parameters
256
257
258  // set MVD Parameters and LUTs
259  Void xSetShiftParameters();
260  Void xGetShiftParameter( UInt uiSourceView, UInt uiTargetView, bool bExternal, double& rdScale, double& rdOffset ); ///< Get one Shift Parameters
261
262  // util
263  Void  xAppendToFileNameEnd( Char* pchInputFileName, const Char* pchStringToAppend, Char* & rpchOutputFileName);
264  Bool  xConfirmParameter(Bool bflag, const char* message);
265
266
267  template <class T> Void xCleanUpVector( std::vector<T>& rcVec, const T& rcInvalid );
268
269#if HHI_VSO
270  // Ren Model String
271  TRenModSetupStrParser       m_cRenModStrParser;
272#endif
273
274#if POZNAN_TEXTURE_TU_DELTA_QP_PARAM_IN_CFG_FOR_ENC
275  Double                      m_dTextureCuDeltaQpOffset;
276  Double                      m_dTextureCuDeltaQpMul;
277  Int                         m_iTextureCuDeltaQpTopBottomRow;
278#endif
279
280#if POZNAN_NONLINEAR_DEPTH
281  Double    m_fDepthPower;                                                                        ///< Depth power value
282#endif
283
284#if POZNAN_STAT_JK
285  std::vector<char*>       m_pchStatFileList;                                   ///< texure statistics file names
286  std::vector<char*>       m_pchDepthStatFileList;                              ///< depth statistics file names
287#endif
288
289public:
290
291  TAppEncCfg();
292  virtual ~TAppEncCfg();
293
294public:
295  Void  create    ();                                         ///< create option handling class
296  Void  destroy   ();                                         ///< destroy option handling class
297  Bool  parseCfg  ( Int argc, Char* argv[] );                 ///< parse configuration file to fill member variables
298
299};// END CLASS DEFINITION TAppEncCfg
300
301#endif // __TAPPENCCFG__
302
Note: See TracBrowser for help on using the repository browser.