Context navigation

source: 3DVCSoftware/branches/HTM-6.2-dev3-Qualcomm/source/App/TAppEncoder/TAppEncCfg.h @ 360

Visit:

Last change on this file since 360 was 332, checked in by tech, 12 years ago
Merged branch 6.1-Cleanup@329.
Property svn:eol-style set to `native`
File size: 19.7 KB

Line
1	/* The copyright in this software is being made available under the BSD
2	* License, included below. This software may be subject to other third party
3	* and contributor rights, including patent rights, and no such rights are
4	* granted under this license.
5	*
6	* Copyright (c) 2010-2012, ITU/ISO/IEC
7	* All rights reserved.
8	*
9	* Redistribution and use in source and binary forms, with or without
10	* modification, are permitted provided that the following conditions are met:
11	*
12	* * Redistributions of source code must retain the above copyright notice,
13	* this list of conditions and the following disclaimer.
14	* * Redistributions in binary form must reproduce the above copyright notice,
15	* this list of conditions and the following disclaimer in the documentation
16	* and/or other materials provided with the distribution.
17	* * Neither the name of the ITU/ISO/IEC nor the names of its contributors may
18	* be used to endorse or promote products derived from this software without
19	* specific prior written permission.
20	*
21	* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
22	* AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23	* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24	* ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS
25	* BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26	* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27	* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
28	* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
29	* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
30	* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
31	* THE POSSIBILITY OF SUCH DAMAGE.
32	*/
33
34	/** \file TAppEncCfg.h
35	\brief Handle encoder configuration parameters (header)
36	*/
37
38	#ifndef __TAPPENCCFG__
39	#define __TAPPENCCFG__
40
41	#include "TLibCommon/CommonDef.h"
42
43	#include "TLibEncoder/TEncCfg.h"
44	#include "TAppCommon/TAppComCamPara.h"
45	#include "TLibRenderer/TRenTop.h"
46	#include "TLibRenderer/TRenModel.h"
47	#include "TLibRenderer/TRenModSetupStrParser.h"
48
49	#include <sstream>
50	#include <vector>
51
52	//! \ingroup TAppEncoder
53	//! \{
54
55	// ====================================================================================================================
56	// Class definition
57	// ====================================================================================================================
58
59	/// encoder configuration class: holds the application-level encoder settings that parseCfg() fills in
60	class TAppEncCfg
61	{
62	protected:
63	// file I/O
64	std::vector<char*> m_pchInputFileList; ///< source file names
65	std::vector<char*> m_pchDepthInputFileList; ///< source depth file names
66	std::vector<char*> m_pchReconFileList; ///< output reconstruction file names
67	std::vector<char*> m_pchDepthReconFileList; ///< output depth reconstruction file names
68	char* m_pchBitstreamFile; ///< output bitstream file
69	Double m_adLambdaModifier[ MAX_TLAYER ]; ///< Lambda modifier array for each temporal layer
70	// source specification
71	Int m_iFrameRate; ///< source frame-rates (Hz)
72	unsigned int m_FrameSkip; ///< number of skipped frames from the beginning
73	Int m_iSourceWidth; ///< source width in pixel
74	Int m_iSourceHeight; ///< source height in pixel
75	Int m_croppingMode; ///< cropping mode selector (NOTE(review): value meanings are not visible in this header)
76	Int m_cropLeft; ///< left cropping amount (presumably in pixels - TODO confirm)
77	Int m_cropRight; ///< right cropping amount (presumably in pixels - TODO confirm)
78	Int m_cropTop; ///< top cropping amount (presumably in pixels - TODO confirm)
79	Int m_cropBottom; ///< bottom cropping amount (presumably in pixels - TODO confirm)
80	Int m_iFrameToBeEncoded; ///< number of encoded frames
81	Int m_aiPad[2]; ///< number of padded pixels for width and height
82
83	Int m_iNumberOfViews; ///< number Views to Encode
84	Bool m_bUsingDepthMaps; ///< presumably set when depth maps are coded in addition to texture - TODO confirm
85
86	#if FLEX_CODING_ORDER_M23723
87	Char* m_pchMVCJointCodingOrder; ///< texture-depth coding order
88	Bool m_b3DVFlexOrder; ///< flexible coding order flag
89	#endif
90
91	// coding structure
92	Int m_iIntraPeriod; ///< period of I-slice (random access period)
93	Int m_iDecodingRefreshType; ///< random access type
94	Int m_iGOPSize; ///< GOP size of hierarchical structure
95	Int m_extraRPSs[MAX_VIEW_NUM]; ///< one entry per view (presumably the number of extra reference picture sets - TODO confirm)
96	GOPEntryMvc m_GOPListsMvc[MAX_VIEW_NUM][MAX_GOP+1]; ///< GOP entries, first index is the view
97	Int m_numReorderPics[MAX_VIEW_NUM][MAX_TLAYER]; ///< total number of reorder pictures
98	Int m_maxDecPicBuffering[MAX_VIEW_NUM][MAX_TLAYER]; ///< total number of reference pictures needed for decoding
99	Bool m_bUseLComb; ///< flag for using combined reference list for uni-prediction in B-slices (JCTVC-D421)
100	Bool m_bLCMod; ///< flag for specifying whether the combined reference list for uni-prediction in B-slices is uploaded explicitly
101	Bool m_bDisInter4x4; ///< presumably disables inter 4x4 prediction - TODO confirm
102	Bool m_enableNSQT; ///< flag for enabling NSQT
103	Bool m_enableAMP; ///< flag for enabling AMP
104	// coding quality
105	std::vector<Double> m_adQP; ///< QP value of key-picture (floating point) [0] video, [1] depth
106	std::vector<Int> m_aiQP; ///< QP value of key-picture (integer) [0] video, [1] depth
107	#if QC_MVHEVC_B0046
108	std::vector<Int> m_aiVId; ///< view id
109	#endif
110	Int m_aiTLayerQPOffset[MAX_TLAYER]; ///< QP offset corresponding to temporal layer depth
111	char* m_pchdQPFile; ///< QP offset for each slice (initialized from external file)
112	Int* m_aidQP; ///< array of slice QP values
113	Int* m_aidQPdepth; ///< array of depth slice QP values
114	Int m_iMaxDeltaQP; ///< max. |delta QP|
115	UInt m_uiDeltaQpRD; ///< dQP range for multi-pass slice QP optimization
116	Int m_iMaxCuDQPDepth; ///< Max. depth for a minimum CuDQPSize (0:default)
117
118	Int m_iChromaQpOffset; ///< ChromaQpOffset (0:default)
119	Int m_iChromaQpOffset2nd; ///< ChromaQpOffset2nd (0:default)
120
121	#if ADAPTIVE_QP_SELECTION
122	Bool m_bUseAdaptQpSelect; ///< flag for adaptive QP selection (only present when ADAPTIVE_QP_SELECTION is enabled)
123	#endif
124
125	Bool m_bUseAdaptiveQP; ///< Flag for enabling QP adaptation based on a psycho-visual model
126	Int m_iQPAdaptationRange; ///< dQP range by QP adaptation
127
128	Int m_maxTempLayer[MAX_VIEW_NUM]; ///< Max temporal layer
129
130	// coding unit (CU) definition
131	UInt m_uiMaxCUWidth; ///< max. CU width in pixel
132	UInt m_uiMaxCUHeight; ///< max. CU height in pixel
133	UInt m_uiMaxCUDepth; ///< max. CU depth
134
135	// transform unit (TU) definition
136	UInt m_uiQuadtreeTULog2MaxSize; ///< presumably log2 of the max. TU size - TODO confirm
137	UInt m_uiQuadtreeTULog2MinSize; ///< presumably log2 of the min. TU size - TODO confirm
138
139	UInt m_uiQuadtreeTUMaxDepthInter; ///< presumably max. TU quadtree depth for inter CUs - TODO confirm
140	UInt m_uiQuadtreeTUMaxDepthIntra; ///< presumably max. TU quadtree depth for intra CUs - TODO confirm
141
142	// coding tools (bit-depth)
143	UInt m_uiInputBitDepth; ///< bit-depth of input file
144	UInt m_uiOutputBitDepth; ///< bit-depth of output file
145	UInt m_uiInternalBitDepth; ///< Internal bit-depth (BitDepth+BitIncrement)
146
147	// coding tools (PCM bit-depth)
148	Bool m_bPCMInputBitDepthFlag; ///< 0: PCM bit-depth is internal bit-depth. 1: PCM bit-depth is input bit-depth.
149	UInt m_uiPCMBitDepthLuma; ///< PCM bit-depth for luma
150
151	// coding tool (lossless)
152	#if LOSSLESS_CODING
153	Bool m_useLossless; ///< flag for using lossless coding
154	#endif
155	std::vector<Bool> m_abUseSAO; ///< flag for using SAO (NOTE(review): presumably [0] video, [1] depth like m_abUseALF - confirm)
156	#if LGE_ILLUCOMP_B0045
157	#if LGE_ILLUCOMP_DEPTH_C0046
158	std::vector<Bool> m_abUseIC; ///< flag for using illumination compensation for inter-view prediction
159	#else
160	Bool m_bUseIC; ///< flag for using illumination compensation for inter-view prediction
161	#endif
162	#endif
163	#if INTER_VIEW_VECTOR_SCALING_C0115
164	Bool m_bUseIVS; ///< flag for using inter-view vector scaling
165	#endif
166	Int m_maxNumOffsetsPerPic; ///< SAO maximum number of offset per picture
167	Bool m_saoInterleavingFlag; ///< SAO interleaving flag
168	// coding tools (loop filter)
169	std::vector<Bool> m_abUseALF; ///< flag for using adaptive loop filter [0] - video, [1] - depth
170	Int m_iALFEncodePassReduction; //!< ALF encoding pass, 0 = original 16-pass, 1 = 1-pass, 2 = 2-pass
171
172	Int m_iALFMaxNumberFilters; ///< ALF Max Number Filters in one picture
173	Bool m_bALFParamInSlice; ///< presumably selects signalling of ALF parameters in the slice - TODO confirm
174	Bool m_bALFPicBasedEncode; ///< presumably selects picture-based ALF encoding - TODO confirm
175
176	std::vector<Bool> m_abLoopFilterDisable; ///< loop (deblocking) filter disable flag [0] - video, [1] - depth
177	Bool m_loopFilterOffsetInAPS; ///< offset for deblocking filter in 0 = slice header, 1 = APS
178	Int m_loopFilterBetaOffsetDiv2; ///< beta offset for deblocking filter
179	Int m_loopFilterTcOffsetDiv2; ///< tc offset for deblocking filter
180	Bool m_DeblockingFilterControlPresent; ///< deblocking filter control present flag in PPS
181
182	Bool m_bUseLMChroma; ///< JL: Chroma intra prediction based on luma signal
183
184	// coding tools (PCM)
185	Bool m_usePCM; ///< flag for using IPCM
186	UInt m_pcmLog2MaxSize; ///< log2 of maximum PCM block size
187	UInt m_uiPCMLog2MinSize; ///< log2 of minimum PCM block size
188	Bool m_bPCMFilterDisableFlag; ///< PCM filter disable flag
189
190	// coding tools (encoder-only parameters)
191	Bool m_bUseSBACRD; ///< flag for using RD optimization based on SBAC
192	Bool m_bUseASR; ///< flag for using adaptive motion search range
193	Bool m_bUseHADME; ///< flag for using HAD in sub-pel ME
194	std::vector<Bool> m_abUseRDOQ; ///< flag for using RD optimized quantization [0]-video, [1]-depth
195	Int m_iFastSearch; ///< ME mode, 0 = full, 1 = diamond, 2 = PMVFAST
196	Int m_iSearchRange; ///< ME search range
197	#if DV_V_RESTRICTION_B0037
198	Bool m_bUseDisparitySearchRangeRestriction; ///< restrict vertical search range for inter-view prediction
199	Int m_iVerticalDisparitySearchRange; ///< ME vertical search range for inter-view prediction
200	#endif
201	Int m_bipredSearchRange; ///< ME search range for bipred refinement
202	Bool m_bUseFastEnc; ///< flag for using fast encoder setting
203	#if HHI_INTERVIEW_SKIP
204	Bool m_bInterViewSkip; ///< usage of interview skip mode ( do not transmit residual)
205	#if HHI_INTERVIEW_SKIP_LAMBDA_SCALE
206	Double m_dInterViewSkipLambdaScale; ///< lambda scale for interview skip
207	#endif
208	#endif
209	Bool m_bUseEarlyCU; ///< flag for using Early CU setting
210
211	#if DEPTH_MAP_GENERATION
212	UInt m_uiPredDepthMapGeneration; ///< using of (virtual) depth maps for texture coding
213	#endif
214	#if H3D_IVMP
215	UInt m_uiMultiviewMvPredMode; ///< usage of predictors for multi-view mv prediction
216	UInt m_uiMultiviewMvRegMode; ///< regularization for multiview motion vectors
217	Double m_dMultiviewMvRegLambdaScale; ///< lambda scale for multiview motion vectors regularization
218	#endif
219	#if H3D_IVRP
220	UInt m_uiMultiviewResPredMode; ///< using multiview residual prediction
221	#endif
222
223	Bool m_useFastDecisionForMerge; ///< flag for using Fast Decision Merge RD-Cost
224	Bool m_bUseCbfFastMode; ///< flag for using Cbf Fast PU Mode Decision
225	Int m_iSliceMode; ///< 0: Disable all Recon slice limits, 1 : Maximum number of largest coding units per slice, 2: Maximum number of bytes in a slice
226	Int m_iSliceArgument; ///< If m_iSliceMode==1, m_iSliceArgument=max. # of largest coding units. If m_iSliceMode==2, m_iSliceArgument=max. # of bytes.
227	Int m_iEntropySliceMode; ///< 0: Disable all entropy slice limits, 1 : Maximum number of largest coding units per slice, 2: Constraint based entropy slice
228	Int m_iEntropySliceArgument; ///< If m_iEntropySliceMode==1, m_iEntropySliceArgument=max. # of largest coding units. If m_iEntropySliceMode==2, m_iEntropySliceArgument=max. # of bins.
229
230	Int m_iSliceGranularity; ///< 0: Slices always end at LCU borders. 1-3: slices may end at a depth of 1-3 below LCU level.
231	Bool m_bLFCrossSliceBoundaryFlag; ///< 0: Cross-slice-boundary in-loop filtering 1: non-cross-slice-boundary in-loop filtering
232	Int m_iTileBehaviorControlPresentFlag; //!< 1: tile behavior control parameters are in PPS 0: tile behavior control parameters are not in PPS
233	Bool m_bLFCrossTileBoundaryFlag; //!< 1: Cross-tile-boundary in-loop filtering 0: non-cross-tile-boundary in-loop filtering
234	Int m_iColumnRowInfoPresent; ///< presumably signals that tile column/row information is present - TODO confirm
235	Int m_iUniformSpacingIdr; ///< presumably selects uniform tile spacing - TODO confirm
236	Int m_iNumColumnsMinus1; ///< presumably number of tile columns minus 1 - TODO confirm
237	char* m_pchColumnWidth; ///< tile column widths as a string (NOTE(review): format not visible in this header)
238	Int m_iNumRowsMinus1; ///< presumably number of tile rows minus 1 - TODO confirm
239	char* m_pchRowHeight; ///< tile row heights as a string (NOTE(review): format not visible in this header)
240	Int m_iTileLocationInSliceHeaderFlag; ///< enable(1)/disable(0) transmission of tile location in slice header
241	Int m_iTileMarkerFlag; ///< enable(1)/disable(0) transmission of light weight tile marker
242	Int m_iMaxTileMarkerEntryPoints; ///< maximum number of tile markers allowed in a slice (controls degree of parallelism)
243	Double m_dMaxTileMarkerOffset; ///< Calculated offset. Light weight tile markers will be transmitted for TileIdx= Offset, 2Offset, 3Offset ...
244
245	Int m_iWaveFrontSynchro; ///< 0: no WPP. >= 1: WPP is enabled, the "Top right" from which inheritance occurs is this LCU offset in the line above the current.
246	Int m_iWaveFrontFlush; ///< enable(1)/disable(0) the CABAC flush at the end of each line of LCUs.
247	Int m_iWaveFrontSubstreams; ///< If iWaveFrontSynchro, this is the number of substreams per frame (dependent tiles) or per tile (independent tiles).
248
249	Bool m_bUseConstrainedIntraPred; ///< flag for using constrained intra prediction
250
251	bool m_pictureDigestEnabled; ///< enable(1)/disable(0) md5 computation and SEI signalling
252
253	// weighted prediction
254	Bool m_bUseWeightPred; ///< Use of explicit Weighting Prediction for P_SLICE
255	UInt m_uiBiPredIdc; ///< Use of Bi-Directional Weighting Prediction (B_SLICE): explicit(1) or implicit(2)
256
257	#if TMVP_DEPTH_SWITCH
258	std::vector<Bool> m_enableTMVP; ///< Enable TMVP [0] video, [1] depth
259	#else
260	Bool m_enableTMVP; ///< Enable TMVP (single flag when TMVP_DEPTH_SWITCH is off)
261	#endif
262
263	Int m_signHideFlag; ///< presumably enables sign hiding - TODO confirm
264	Int m_signHidingThreshold; ///< presumably the threshold used by sign hiding - TODO confirm
265	#if HHI_MPI
266	Bool m_bUseMVI; ///< flag for using Motion Vector Inheritance for depth map coding
267	#endif
268	#if RWTH_SDC_DLT_B0036
269	Bool m_bUseDLT; ///< flag for using DLT (NOTE(review): abbreviation not expanded in this header)
270	Bool m_bUseSDC; ///< flag for using SDC (NOTE(review): abbreviation not expanded in this header)
271	#endif
272
273	Int m_useScalingListId; ///< using quantization matrix
274	char* m_scalingListFile; ///< quantization matrix file name
275
276	// camera parameter
277	Char* m_pchCameraParameterFile; ///< camera parameter file
278	Char* m_pchBaseViewCameraNumbers; ///< base view camera numbers as a string (NOTE(review): format not visible in this header)
279	#if !QC_MVHEVC_B0046
280	TAppComCamPara m_cCameraData; ///< camera parameter object (only present when QC_MVHEVC_B0046 is off)
281	#endif
282	Int m_iCodedCamParPrecision; ///< precision for coding of camera parameters
283
284	#if HHI_VSO
285	Char* m_pchVSOConfig; ///< VSO configuration string (NOTE(review): format not visible in this header)
286	Bool m_bUseVSO; ///< flag for using View Synthesis Optimization
287	#if HHI_VSO_LS_TABLE_M23714
288	Bool m_bVSOLSTable; ///< Depth QP dependent Lagrange parameter optimization (m23714)
289	#endif
290	#if LGE_VSO_EARLY_SKIP_A0093
291	Bool m_bVSOEarlySkip; ///< Early skip of VSO computation (JCT3V-A0093 modification 4)
292	#endif
293	//// Used for development by GT, might be removed later
294	Double m_dLambdaScaleVSO; ///< Scaling factor for Lambda in VSO mode
295	Bool m_bForceLambdaScaleVSO; ///< Use Lambda Scale for depth even if VSO is turned off
296	#if HHI_VSO_DIST_INT
297	Bool m_bAllowNegDist; ///< Allow negative distortion in VSO
298	#endif
299	UInt m_uiVSOMode; ///< Number of VSO Mode, 1 = , 2 = simple, org vs. ren, 3 = simple, ren vs. ren, 4 = full
300	#endif
301	#if SAIT_VSO_EST_A0033
302	Bool m_bUseEstimatedVSD; ///< Flag for using model based VSD estimation instead of VSO for some encoder decisions (JCT3V-A0033 modification 3)
303	#endif
304	#if LGE_WVSO_A0119
305	Bool m_bUseWVSO; ///< flag for using WVSO (NOTE(review): presumably weighted View Synthesis Optimization - confirm)
306	Int m_iVSOWeight; ///< presumably the VSO weight used by WVSO - TODO confirm
307	Int m_iVSDWeight; ///< presumably the VSD weight used by WVSO - TODO confirm
308	Int m_iDWeight; ///< presumably the D weight used by WVSO - TODO confirm
309	#endif
310	// coding tools (depth intra modes)
311	#if HHI_DMM_WEDGE_INTRA || HHI_DMM_PRED_TEX
312	Bool m_bUseDMM; ///< flag for using DMM
313	#endif
314
315	#if H3D_QTL
316	Bool m_bUseQTLPC; ///< flag for using depth QuadTree Limitation + Predictive Coding
317	#endif
318
319	// internal member functions
320	Void xSetGlobal (); ///< set global variables
321	Void xCheckParameter (); ///< check validity of configuration values
322	Void xPrintParameter (); ///< print configuration values
323	Void xPrintUsage (); ///< print usage
324
325	Void xCleanUpVectors (); ///< clean up vector sizes
326	Void xInitCameraPars (); ///< init camera parameters
327
328
329	// set MVD Parameters and LUTs
330	Void xSetShiftParameters();
331	Void xGetShiftParameter( UInt uiSourceView, UInt uiTargetView, bool bExternal, double& rdScale, double& rdOffset ); ///< Get one Shift Parameters
332
333	Void xAppendToFileNameEnd( Char* pchInputFileName, const Char* pchStringToAppend, Char* & rpchOutputFileName); ///< NOTE(review): presumably returns pchInputFileName with pchStringToAppend appended via rpchOutputFileName - confirm in the .cpp
334
335	Void xCheckCodingStructureMvc(); ///< validate and configure inter-view coding structure
336
337	template <class T> Void xCleanUpVector( std::vector<T>& rcVec, const T& rcInvalid ); ///< NOTE(review): presumably the per-vector helper behind xCleanUpVectors(); role of rcInvalid not visible here
338	#if HHI_VSO
339	// Ren Model String
340	TRenModSetupStrParser m_cRenModStrParser;
341	#endif
342	public:
343	TAppEncCfg();
344	virtual ~TAppEncCfg();
345
346	public:
347	Void create (); ///< create option handling class
348	Void destroy (); ///< destroy option handling class
349	Bool parseCfg ( Int argc, Char* argv[] ); ///< parse configuration file to fill member variables
350
351	};// END CLASS DEFINITION TAppEncCfg
352
353	//! \}
354
355	#endif // __TAPPENCCFG__
356

Note: See TracBrowser for help on using the repository browser.

Download in other formats: