1 | \documentclass[a4paper,11pt]{jctvcdoc} |
---|
2 | |
---|
3 | \usepackage{geometry}[2010/02/12] |
---|
4 | |
---|
5 | \usepackage{hyperref} |
---|
6 | \hypersetup{colorlinks=true} |
---|
7 | \usepackage{color,soul} |
---|
8 | |
---|
9 | \usepackage[position=bottom]{subfig} |
---|
10 | \captionsetup[subfloat]{position=top} |
---|
11 | \usepackage{multirow} |
---|
12 | \usepackage{dcolumn} |
---|
13 | \newcolumntype{.}{D{.}{.}{-1}} |
---|
14 | \usepackage{colortbl} |
---|
15 | \usepackage{makecell} |
---|
16 | \usepackage{longtable} |
---|
17 | \usepackage{array} |
---|
18 | \usepackage{algorithm2e} |
---|
19 | |
---|
20 | \usepackage[strings]{underscore} |
---|
21 | \usepackage{csquotes} |
---|
22 | \MakeOuterQuote{"} |
---|
23 | \EnableQuotes |
---|
24 | |
---|
25 | \newcommand\None{} |
---|
26 | \newcommand\NotSet{} |
---|
27 | \makeatletter |
---|
28 | \newcommand{\Option}[1]{\ifx\optOption\@empty\gdef\optOption{#1}\else\g@addto@macro\optOption{ \\ #1}\fi} |
---|
29 | \newcommand{\ShortOption}[1]{\ifx\optShortOption\@empty\gdef\optShortOption{#1}\else\g@addto@macro\optShortOption{ \\ #1}\fi} |
---|
30 | \newcommand{\Default}[1]{\ifx\optDefault\@empty\gdef\optDefault{#1}\else\g@addto@macro\optDefault{ \\ #1}\fi} |
---|
31 | \newcommand{\clearOptions}{\gdef\optOption{}\gdef\optShortOption{}\gdef\optDefault{}} |
---|
32 | \makeatother |
---|
33 | \newenvironment{OptionTable}[1]{% |
---|
34 | \footnotesize |
---|
35 | \def\arraystretch{1.8} |
---|
36 | \clearOptions |
---|
37 | \begin{longtable}{l<{\makecell[tl]{\optOption}}% |
---|
38 | >{\texttt\bgroup}l<{\makecell[tl]{\optShortOption}\egroup}% |
---|
39 | c<{\makecell[tc]{\optDefault}}% |
---|
40 | >{\def\arraystretch{1.0}}p{0.5\textwidth}<{\clearOptions}} |
---|
41 | \caption{#1} \\ |
---|
42 | \hspace*{12em}&&\hspace*{8em}&\kill |
---|
43 | \hline |
---|
44 | \thead{Option} & |
---|
45 | \egroup\thead{Shorthand}\bgroup & |
---|
46 | \thead{Default} & |
---|
47 | \thead{Description} \\ |
---|
48 | \hline |
---|
49 | \endfirsthead |
---|
50 | \caption[]{#1 (Continued)} \\ |
---|
51 | \hspace*{12em}&&\hspace*{8em}&\kill |
---|
52 | \hline |
---|
53 | \thead{Option} & |
---|
54 | \egroup\thead{Shorthand}\bgroup & |
---|
55 | \thead{Default} & |
---|
56 | \thead{Description} \\ |
---|
57 | \hline |
---|
58 | \endhead |
---|
59 | \multicolumn{4}{r}{Continued...}\\ |
---|
60 | \hline |
---|
61 | \endfoot |
---|
62 | \hline |
---|
63 | \endlastfoot |
---|
64 | }{% |
---|
65 | \hline |
---|
66 | \end{longtable} |
---|
67 | } |
---|
68 | |
---|
69 | \newenvironment{MacroTable}[1]{% |
---|
70 | \footnotesize |
---|
71 | \def\arraystretch{1.3} |
---|
72 | \clearOptions |
---|
73 | \begin{longtable}{lcp{0.5\textwidth}} |
---|
74 | \caption{#1} \\ |
---|
75 | %\hspace*{12em}&&\hspace*{8em}&\kill |
---|
76 | \hline |
---|
77 | \thead{Option} & |
---|
78 | \thead{Default} & |
---|
79 | \thead{Description} \\ |
---|
80 | \hline |
---|
81 | \endfirsthead |
---|
82 | \caption[]{#1 (Continued)} \\ |
---|
83 | \hline |
---|
84 | \thead{Option} & |
---|
85 | \thead{Default} & |
---|
86 | \thead{Description} \\ |
---|
87 | \hline |
---|
88 | \endhead |
---|
89 | \multicolumn{3}{r}{Continued...}\\ |
---|
90 | \hline |
---|
91 | \endfoot |
---|
92 | \hline |
---|
93 | \endlastfoot |
---|
94 | }{% |
---|
95 | \end{longtable} |
---|
96 | } |
---|
97 | |
---|
98 | \title{HM Software Manual} |
---|
99 | \author{% |
---|
100 | Frank Bossen |
---|
101 | \email{bossen@docomoinnovations.com} |
---|
102 | \and |
---|
103 | David Flynn |
---|
104 | \email{davidf@rd.bbc.co.uk} |
---|
105 | \and |
---|
106 | Karsten S\"uhring |
---|
107 | \email{Karsten.Suehring@hhi.fraunhofer.de} |
---|
108 | } |
---|
109 | |
---|
110 | \jctvcmeeting{} |
---|
111 | \jctvcdocnum{Software Manual} |
---|
112 | \jctvcdocstatus{Software AHG working document} |
---|
113 | \jctvcdocpurpose{Information} |
---|
114 | \jctvcdocsource{AHG chairs} |
---|
115 | |
---|
116 | \begin{document} |
---|
117 | \maketitle |
---|
118 | \begin{abstract} |
---|
119 | This document is a user manual describing usage of reference software |
---|
120 | for the HEVC project. It applies to version 10.0 |
---|
121 | of the software. |
---|
122 | \end{abstract} |
---|
123 | |
---|
124 | \tableofcontents |
---|
125 | \listoftables |
---|
126 | |
---|
127 | \section{General Information} |
---|
128 | Reference software is being made available to provide a reference |
---|
129 | implementation of the draft HEVC standard being developed by the Joint |
---|
130 | Collaborative Team on Video Coding (JCT-VC) regrouping experts from |
---|
131 | ITU-T SG 16 and ISO/IEC SC29 WG11. One of the main goals of the |
---|
132 | reference software is to provide a basis upon which to conduct |
---|
133 | experiments in order to determine which coding tools provide desired |
---|
134 | coding performance. It is not meant to be a particularly efficient |
---|
135 | implementation of anything, and one may notice its apparent |
---|
136 | unsuitability for a particular use. It should not be construed to be a |
---|
137 | reflection of how complex a production-quality implementation of a |
---|
138 | future HEVC standard would be. |
---|
139 | |
---|
140 | This document aims to provide guidance on the usage of the reference |
---|
141 | software. It is widely suspected to be incomplete and suggestions for |
---|
142 | improvements are welcome. Such suggestions and general inquiries may be |
---|
143 | sent to the general JCT-VC email reflector on |
---|
144 | \url{jct-vc@lists.rwth-aachen.de} (registration required). |
---|
145 | |
---|
146 | \subsection*{Bug reporting} |
---|
147 | Bugs should be reported on the issue tracker set up at |
---|
148 | \url{http://hevc.kw.bbc.co.uk/trac/} |
---|
149 | |
---|
150 | \section{Installation and compilation} |
---|
151 | The software may be retrieved from one of the following SVN servers |
---|
152 | (mirrored): |
---|
153 | \begin{itemize} |
---|
154 | \item \url{https://hevc.hhi.fraunhofer.de/svn/svn_HEVCSoftware/} |
---|
155 | \item \url{svn://hevc.kw.bbc.co.uk/svn/jctvc-hm/} |
---|
156 | \end{itemize} |
---|
157 | |
---|
158 | Table~\ref{tab:project-files} enumerates various project files that are |
---|
159 | provided for development environments. |
---|
160 | |
---|
161 | \begin{table}[ht] |
---|
162 | \footnotesize |
---|
163 | \caption{Available project files} |
---|
164 | \label{tab:project-files} |
---|
165 | \centering |
---|
166 | \begin{tabular}{ll} |
---|
167 | \hline |
---|
168 | \thead{Environment} & |
---|
169 | \thead{Location of project file} \\ |
---|
170 | % Environment & Location of project file \\ |
---|
171 | \hline |
---|
172 | MS Visual Studio 8 & build/HM_vc8.sln \\ |
---|
173 | MS Visual Studio 9 & build/HM_vc9.sln \\ |
---|
174 | Xcode & HM.xcodeproj \\ |
---|
175 | Linux & build/linux/makefile \\ |
---|
176 | \hline |
---|
177 | \end{tabular} |
---|
178 | \end{table} |
---|
179 | |
---|
180 | %%%% |
---|
181 | %%%% |
---|
182 | %%%% |
---|
183 | \section{Using the encoder} |
---|
184 | \begin{verbatim} |
---|
185 | TAppEncoder [-h] [-c config.cfg] [--parameter=value] |
---|
186 | \end{verbatim} |
---|
187 | |
---|
188 | \begin{table}[ht] |
---|
189 | \footnotesize |
---|
190 | \centering |
---|
191 | \begin{tabular}{lp{0.5\textwidth}} |
---|
192 | \hline |
---|
193 | \thead{Option} & |
---|
194 | \thead{Description} \\ |
---|
195 | \hline |
---|
196 | \texttt{-h} & Prints parameter usage. \\ |
---|
197 | \texttt{-c} & Defines configuration file to use. Multiple configuration files |
---|
198 | may be used with repeated --c options. \\ |
---|
199 | \texttt{--}\emph{parameter}\texttt{=}\emph{value} |
---|
200 | & Assigns value to a given parameter as further described below. |
---|
201 | Some parameters are also supported by shorthand |
---|
202 | "--\em{opt}~\emph{value}".\\ |
---|
203 | \hline |
---|
204 | \end{tabular} |
---|
205 | \end{table} |
---|
206 | |
---|
207 | Sample configuration files are provided in the cfg/ folder. |
---|
208 | |
---|
209 | \subsection{GOP structure table} |
---|
210 | \label{sec:gop-structure} |
---|
211 | Defines the cyclic GOP structure that will be used repeatedly |
---|
212 | throughout the sequence. The table should contain GOPSize lines, |
---|
213 | named Frame1, Frame2, etc. The frames are listed in decoding |
---|
214 | order, so Frame1 is the first frame in decoding order, Frame2 is |
---|
215 | the second and so on. Among other things, the table specifies all |
---|
216 | reference pictures kept by the decoder for each frame. This |
---|
217 | includes pictures that are used for reference for the current |
---|
218 | picture as well as pictures that will be used for reference in |
---|
219 | the future. The encoder will not automatically calculate what |
---|
220 | pictures that has to be kept for future references, they have to |
---|
221 | be specified. Note that some specified reference frames for |
---|
222 | pictures encoded in the very first GOP after an IDR frame might |
---|
223 | not be available. This is handled automatically by the encoder, |
---|
224 | so the reference pictures can be given in the GOP structure table |
---|
225 | as if there were infinitely many identical GOPs before the |
---|
226 | current one. Each line in the table contains the parameters used |
---|
227 | for the corresponding frame, separated by whitespace: |
---|
228 | |
---|
229 | \begin{itemize} |
---|
230 | \item[]\textbf{Type}: Slice type, can be either I, P or B. |
---|
231 | |
---|
232 | \item[]\textbf{POC}: Display order of the frame within a GOP, ranging |
---|
233 | from 1 to GOPSize. |
---|
234 | |
---|
235 | \item[]\textbf{QPOffset}: QP offset is added to the QP parameter to set |
---|
236 | the final QP value to use for this frame. |
---|
237 | |
---|
238 | \item[]\textbf{QPFactor}: Weight used during rate distortion |
---|
239 | optimization. Higher values mean lower quality and less bits. Typical |
---|
240 | range is between |
---|
241 | 0.3 and 1. |
---|
242 | |
---|
243 | \item[]\textbf{tcOffsetDiv2}: In-loop deblocking filter parameter tcOffsetDiv2 |
---|
244 | is added to the base parameter LoopFilterTcOffset_div2 to set the final tc_offset_div2 |
---|
245 | parameter for this picture signalled in the slice segment header. The final |
---|
246 | value of tc_offset_div2 shall be an integer number in the range $-6..6$. |
---|
247 | |
---|
248 | \item[]\textbf{betaOffsetDiv2}: In-loop deblocking filter parameter betaOffsetDiv2 |
---|
249 | is added to the base parameter LoopFilterBetaOffset_div2 to set the final beta_offset_div2 |
---|
250 | parameter for this picture signalled in the slice segment header. The final |
---|
251 | value of beta_offset_div2 shall be an integer number in the range $-6..6$. |
---|
252 | |
---|
253 | \item[]\textbf{temporal_id}: Temporal layer of the frame. A frame cannot |
---|
254 | predict from a frame with a higher temporal id. If a frame with higher |
---|
255 | temporal IDs is listed among a frame's reference pictures, it is |
---|
256 | not used, but is kept for possible use in future frames. |
---|
257 | |
---|
258 | \item[]\textbf{num_ref_pics_active}: Size of reference picture lists L0 |
---|
259 | and L1, indicating how many reference pictures in each direction that |
---|
260 | are used during coding. |
---|
261 | |
---|
262 | \item[]\textbf{num_ref_pics}: The number of reference pictures kept for |
---|
263 | this frame. This includes pictures that are used for reference for the |
---|
264 | current picture as well as pictures that will be used for reference in |
---|
265 | the future. |
---|
266 | |
---|
267 | \item[]\textbf{reference_pictures}: A space-separated list of |
---|
268 | num_ref_pics integers, specifying the POC of the reference pictures |
---|
269 | kept, relative the POC of the current frame. The picture list shall be |
---|
270 | ordered, first with negative numbers from largest to smallest, followed |
---|
271 | by positive numbers from smallest to largest (e.g. \verb|-1 -3 -5 1 3|). |
---|
272 | Note that any pictures not supplied in this list will be discarded and |
---|
273 | therefore not available as reference pictures later. |
---|
274 | |
---|
275 | \item[]\textbf{predict}: Defines the value of the syntax element |
---|
276 | inter_ref_pic_set_prediction_flag. A value of 0 indicates that the |
---|
277 | reference picture set is encoded without inter RPS prediction and the |
---|
278 | subsequent parameters deltaRIdx$-1$, deltaRPS, num_ref_idcs and |
---|
279 | Reference_idcs are ignored and do not need to be present. A value of 1 |
---|
280 | indicates that the reference picture set is encoded with inter |
---|
281 | prediction RPS using the subsequent parameters deltaRIdx$-1$, deltaRPS, |
---|
282 | num_ref_idcs and Reference_idcs in the line. A value of 2 indicates that |
---|
283 | the reference picture set is encoded with inter RPS but only the |
---|
284 | deltaRIdx$-1$ parameters is needed. The deltaRPS, num_ref_idcs and |
---|
285 | Reference_idcs values are automatically derived by the encoder based on |
---|
286 | the POC and refPic values of the current line and the RPS pointed to by |
---|
287 | the deltaRIdx$-1$ parameters. |
---|
288 | |
---|
289 | \item[]\textbf{deltaRIdx$-1$}: The difference between the index of the |
---|
290 | curent RPS and the predictor RPS minus 1. |
---|
291 | |
---|
292 | \item[]\textbf{deltaRPS}: The difference between the POC of the |
---|
293 | predictor RPS and POC the current RPS. |
---|
294 | |
---|
295 | \item[]\textbf{num_ref_idcs}: The number of ref_idcs to encode for the |
---|
296 | current RPS. The value is equal to the value of num_ref_pics of the |
---|
297 | predictor RPS plus 1. |
---|
298 | |
---|
299 | \item[]\textbf{reference_idcs}: A space-separated list of num_ref_idcs |
---|
300 | integers, specifying the ref idcs of the inter RPS prediction. The value |
---|
301 | of ref_idcs may be 0, 1 or 2 indicating that the reference picture is a |
---|
302 | reference picture used by the current picture, a reference picture used |
---|
303 | for future picture or not a reference picture anymore, respectively. The |
---|
304 | first num_ref_pics of ref_idcs correspond to the Reference pictures in |
---|
305 | the predictor RPS. The last ref_idcs corresponds to the predictor |
---|
306 | picture. |
---|
307 | \end{itemize} |
---|
308 | |
---|
309 | For example, consider the coding structure of Figure~\ref{fig:gop-example}. |
---|
310 | This coding structure is of size 4. The pictures are listed in decoding |
---|
311 | order. Frame1 shall therefore describe picture with $\textrm{POC}=4$. It |
---|
312 | references picture 0, and therefore has $-4$ as a reference picture. |
---|
313 | Similarly, Frame2 has a POC of 2, and since it references pictures 0 and |
---|
314 | 4, its reference pictures are listed as \verb|-2 2|. Frame3 is a special |
---|
315 | case: even though it only references pictures with POC 0 and 2, it also |
---|
316 | needs to include the picture with POC 4, which must be kept in order to |
---|
317 | be used as a reference picture in the future. The reference picture list |
---|
318 | for Frame3 therefore becomes \verb|-1 1 3|. Frame4 has a POC of 3 and |
---|
319 | its list of reference pictures is \verb|-1 1|. |
---|
320 | |
---|
321 | \begin{figure}[h] |
---|
322 | \caption{A GOP structure} |
---|
323 | \label{fig:gop-example} |
---|
324 | \centering |
---|
325 | \includegraphics[width=0.7\textwidth]{gop-structure-example} |
---|
326 | \end{figure} |
---|
327 | |
---|
328 | Inter RPS prediction may be used for Frame2, Frame3 and Frame4, hence |
---|
329 | the predict parameter is set to 1 for these frames. Frame2 uses Frame1 |
---|
330 | as the predictor hence the deltaRIdx$-1$ is 0. Similarly for Frame3 and |
---|
331 | Frame4 which use Frame2 and Frame3 as predictors, respectively. The |
---|
332 | deltaRPS is equal to the POC of the predictor minus the POC of the |
---|
333 | current picture, therefore the deltaRPS for Frame2 is $4 -2 = 2$, for |
---|
334 | Frame3 is $2 - 1 = 1$ and for Frame4 is $1 - 3 = -2$. |
---|
335 | |
---|
336 | In Frame2, reference pictures with POC 0 and 2 are used, so the |
---|
337 | reference idcs for Frame2 are \verb|1 1| indicating that the reference |
---|
338 | picture, $-4$, in Frame1 is still a reference picture in Frame2 and |
---|
339 | Frame1 is also a reference picture in Frame2. The reference idcs for |
---|
340 | Frame3 are \verb|1 1 1|. The first and second “1”s indicating that |
---|
341 | the reference pictures "$-2$ $2$" in Frame2 are still reference pictures in |
---|
342 | Frame3 and the last “1” indicating that Frame2 is also a reference |
---|
343 | picture in Frame3. In Frame 4, the reference idcs are \verb|0 1 1 0|. |
---|
344 | The first “0” indicates that the reference pictures “-1” in Frame 3 is |
---|
345 | no longer a reference picture in Frame4. The next two “1”s indicate that |
---|
346 | the reference pictures “$1$ $3$” are now reference pictures of Frame4. |
---|
347 | The final “0” indicates that Frame3 is not a reference picture. |
---|
348 | |
---|
349 | In order to specify this to the encoder, the parameters in |
---|
350 | Table~\ref{tab:gop-example} could be used. |
---|
351 | |
---|
352 | \begin{table}[ht] |
---|
353 | \footnotesize |
---|
354 | \caption{GOP structure example} |
---|
355 | \label{tab:gop-example} |
---|
356 | \centering |
---|
357 | \begin{tabular}{lrrrr} |
---|
358 | \hline |
---|
359 | \thead{} & |
---|
360 | \thead{Frame1} & |
---|
361 | \thead{Frame2} & |
---|
362 | \thead{Frame3} & |
---|
363 | \thead{Frame4} \\ |
---|
364 | \hline |
---|
365 | Type & P & B & B & B \\ |
---|
366 | POC & 4 & 2 & 1 & 3 \\ |
---|
367 | QPoffset & 1 & 2 & 3 & 3 \\ |
---|
368 | QPfactor & 0.5 & 0.5 & 0.5 & 0.5 \\ |
---|
369 | tcOffsetDiv2 & 0 & 1 & 2 & 2 \\ |
---|
370 | betaOffsetDiv2 & 0 & 0 & 0 & 0 \\ |
---|
371 | temporal_id & 0 & 1 & 2 & 2 \\ |
---|
372 | num_ref_pics_active & 1 & 1 & 1 & 1 \\ |
---|
373 | num_ref_pics & 1 & 2 & 3 & 2 \\ |
---|
374 | reference_pictures & $-$4 & $-$2 2 & $-$1 1 3 & $-$1 1 \\ |
---|
375 | predict & 0 & 1 & 1 & 1 \\ |
---|
376 | deltaRIdx$-$1 & & 0 & 0 & 0 \\ |
---|
377 | deltaRPS & & 2 & 1 & $-$2 \\ |
---|
378 | num_ref_idcs & & 2 & 3 & 4 \\ |
---|
379 | reference_idcs & & 1 1 & 1 1 1 & 0 1 1 0 \\ |
---|
380 | \hline |
---|
381 | \end{tabular} |
---|
382 | \end{table} |
---|
383 | |
---|
384 | Here, the frames used for prediction have been given higher |
---|
385 | quality by assigning a lower QP offset. Also, the non-reference |
---|
386 | frames have been marked as belonging to a higher temporal layer, |
---|
387 | to make it possible to decode only every other frame. Note: each |
---|
388 | line should contain information for one frame, so this |
---|
389 | configuration would be specified as: |
---|
390 | |
---|
391 | \begin{verbatim} |
---|
392 | Frame1: P 4 1 0.5 0 0 0 1 1 -4 0 |
---|
393 | Frame2: B 2 2 0.5 1 0 1 1 2 -2 2 1 0 2 2 1 1 |
---|
394 | Frame3: B 1 3 0.5 2 0 2 1 3 -1 1 3 1 0 1 3 1 1 1 |
---|
395 | Frame4: B 3 3 0.5 2 0 2 1 2 -1 1 1 0 -2 4 0 1 1 0 |
---|
396 | \end{verbatim} |
---|
397 | |
---|
398 | The values of deltaRIdx$-1$, deltaRPS, num_ref_idcs and reference |
---|
399 | idcs of Frame$K$ can be derived from the POC value of Frame$_K$ and |
---|
400 | the POC, num_ref_pics and reference_pictures values of Frame$_M$, where |
---|
401 | $K$ is the index of the RPS to be inter coded and the $M$ is the |
---|
402 | index of the reference RPS, as follows. |
---|
403 | |
---|
404 | \setlength{\algomargin}{2em} |
---|
405 | \begin{algorithm}[h] |
---|
406 | \SetKwData{deltaRIdx}{deltaRIdx} |
---|
407 | \SetKwData{deltaRPS}{deltaRPS} |
---|
408 | \SetKwData{numrefidcs}{num_ref_idcs} |
---|
409 | \SetKwData{numrefpics}{num_ref_pics} |
---|
410 | \SetKwData{referencepictures}{reference_pictures} |
---|
411 | \SetKwData{referenceidcs}{reference_idcs} |
---|
412 | \SetKwData{POC}{POC} |
---|
413 | |
---|
414 | $\deltaRIdx_K - 1 \leftarrow K - M - 1$ \; |
---|
415 | $\deltaRPS_K \leftarrow \POC_M - \POC_K$ \; |
---|
416 | $\numrefidcs_K \leftarrow \numrefpics_M + 1$ \; |
---|
417 | |
---|
418 | \For{$j \leftarrow 0$ \KwTo $\numrefpics_M$}{ |
---|
419 | \For{$i \leftarrow 0$ \KwTo $\numrefidcs_K$}{ |
---|
420 | \eIf{$\referencepictures_{M,j} + \deltaRPS_K == \referencepictures_{K,i}$}{ |
---|
421 | \lIf{$\referencepictures_{K,i}$ is used by the current frame}{ |
---|
422 | $\referenceidcs_{K,j} = 1$} \; |
---|
423 | \lElse{$\referenceidcs_{K,j} = 2$} \; |
---|
424 | }{ |
---|
425 | $\referenceidcs_K[j] = 0$ \; |
---|
426 | } |
---|
427 | } |
---|
428 | } |
---|
429 | |
---|
430 | \tcc{$\referencepictures_{M,\numrefpics_M}$ does not exist and is assumed to be 0} |
---|
431 | \end{algorithm} |
---|
432 | |
---|
433 | Note: The above (automatic) generation of the inter RPS parameter |
---|
434 | values has been integrated into the encoder, and is activated by |
---|
435 | the value of predict $= 2$ followed by the value of deltaRIdx$-1$, |
---|
436 | only, as described above. |
---|
437 | |
---|
438 | |
---|
439 | |
---|
440 | %%%% |
---|
441 | %%%% |
---|
442 | %%%% |
---|
443 | \newgeometry{tmargin=1.6cm,lmargin=1cm,rmargin=1cm,bmargin=1in,nohead} |
---|
444 | \subsection{Encoder parameters} |
---|
445 | |
---|
446 | %% |
---|
447 | %% File, I/O and source parameters |
---|
448 | %% |
---|
449 | \begin{OptionTable}{File, I/O and source parameters} |
---|
450 | \Option{InputFile} & |
---|
451 | \ShortOption{-i} & |
---|
452 | \Default{\NotSet} & |
---|
453 | Specifies the input video file. |
---|
454 | |
---|
455 | Video data must be in a raw 4:2:0 planar format (Y$'$CbCr). |
---|
456 | |
---|
457 | Note: When the bit depth of samples is larger than 8, each sample is encoded in |
---|
458 | 2 bytes (little endian, LSB-justified). |
---|
459 | \\ |
---|
460 | |
---|
461 | \Option{BitstreamFile} & |
---|
462 | \ShortOption{-b} & |
---|
463 | \Default{\NotSet} & |
---|
464 | Specifies the output coded bit stream file. |
---|
465 | \\ |
---|
466 | |
---|
467 | \Option{ReconFile} & |
---|
468 | \ShortOption{-o} & |
---|
469 | \Default{\NotSet} & |
---|
470 | Specifies the output locally reconstructed video file. |
---|
471 | \\ |
---|
472 | |
---|
473 | \Option{SourceWidth}% |
---|
474 | \Option{SourceHeight} & |
---|
475 | \ShortOption{-wdt}% |
---|
476 | \ShortOption{-hgt} & |
---|
477 | \Default{0}% |
---|
478 | \Default{0} & |
---|
479 | Specifies the width and height of the input video in luma samples. |
---|
480 | \\ |
---|
481 | |
---|
482 | \Option{InputBitDepth} & |
---|
483 | \ShortOption{\None} & |
---|
484 | \Default{8} & |
---|
485 | Specifies the bit depth of the input video. |
---|
486 | \\ |
---|
487 | |
---|
488 | \Option{InternalBitDepth} & |
---|
489 | \ShortOption{\None} & |
---|
490 | \Default{0 \\ (InputBitDepth)} & |
---|
491 | Specifies the bit depth used for coding. |
---|
492 | |
---|
493 | If the input video is a different bit depth to InternalBitDepth, it is |
---|
494 | automatically converted by: |
---|
495 | \begin{displaymath} |
---|
496 | \left\lfloor |
---|
497 | \frac{\mathrm{Pel} * 2^{\mathrm{InternalBitDepth}}}{ |
---|
498 | 2^{\mathrm{InputBitDepth}}} |
---|
499 | \right\rfloor |
---|
500 | \end{displaymath} |
---|
501 | |
---|
502 | Note: The effect of this option is as if the input video is externally |
---|
503 | converted to the InternalBitDepth and then coded with this value as |
---|
504 | InputBitDepth. The codec has no notion of two different bit depths. |
---|
505 | \\ |
---|
506 | |
---|
507 | \Option{OutputBitDepth} & |
---|
508 | \ShortOption{\None} & |
---|
509 | \Default{0 \\ (InternalBitDepth)} & |
---|
510 | Specifies the bit depth of the output locally reconstructed video file. |
---|
511 | |
---|
512 | Note: This option has no effect on the decoding process. |
---|
513 | \\ |
---|
514 | |
---|
515 | \Option{InputBitDepthC}% |
---|
516 | \Option{InternalBitDepthC}% |
---|
517 | \Option{OutputBitDepthC} & |
---|
518 | \ShortOption{\None} & |
---|
519 | \Default{(InputBitDepth)}% |
---|
520 | \Default{(InternalBitDepth)}% |
---|
521 | \Default{(InternalBitDepthC)} & |
---|
522 | Specifies the various bit-depths for chroma components. These only need |
---|
523 | to be specified if non-equal luma and chroma bit-depth processing is |
---|
524 | required. |
---|
525 | \\ |
---|
526 | |
---|
527 | \Option{ConformanceMode} & |
---|
528 | \ShortOption{\None} & |
---|
529 | \Default{0} & |
---|
530 | Specifies the conformance mode (cropping/padding parameters) to be applied to the input |
---|
531 | video. The following modes are available: |
---|
532 | \par |
---|
533 | \begin{tabular}{cp{0.45\textwidth}} |
---|
534 | 0 & No cropping / padding \\ |
---|
535 | 1 & Automatic padding to the next minimum CU size \\ |
---|
536 | 2 & Padding according to parameters HorizontalPadding and VerticalPadding \\ |
---|
537 | 3 & Cropping according to parameters ConfLeft, ConfRight, ConfTop and ConfBottom \\ |
---|
538 | \end{tabular} |
---|
539 | \\ |
---|
540 | |
---|
541 | \Option{HorizontalPadding}% |
---|
542 | \Option{VerticalPadding} & |
---|
543 | \ShortOption{-pdx}% |
---|
544 | \ShortOption{-pdy} & |
---|
545 | \Default{0} & |
---|
546 | Specifies the horizontal and vertical padding to be applied to the input |
---|
547 | video in luma samples. Must be a multiple of the chroma resolution |
---|
548 | (e.g. a multiple of two for 4:2:0). |
---|
549 | \\ |
---|
550 | |
---|
551 | \Option{ConfLeft}% |
---|
552 | \Option{ConfRight}% |
---|
553 | \Option{ConfTop}% |
---|
554 | \Option{ConfBottom} & |
---|
555 | \ShortOption{\None} & |
---|
556 | \Default{0} & |
---|
557 | Specifies the horizontal and vertical cropping to be applied to the |
---|
558 | input video in luma samples. Must be a multiple of the chroma |
---|
559 | resolution (e.g. a multiple of two for 4:2:0). |
---|
560 | \\ |
---|
561 | |
---|
562 | \Option{FrameRate} & |
---|
563 | \ShortOption{-fr} & |
---|
564 | \Default{0} & |
---|
565 | Specifies the frame rate of the input video. |
---|
566 | |
---|
567 | Note: This option only affects the reported bit rates. |
---|
568 | \\ |
---|
569 | |
---|
570 | \Option{FrameSkip} & |
---|
571 | \ShortOption{-fs} & |
---|
572 | \Default{0} & |
---|
573 | Specifies a number of frames to skip at beginning of input video file. |
---|
574 | \\ |
---|
575 | |
---|
576 | \Option{FramesToBeEncoded} & |
---|
577 | \ShortOption{-f} & |
---|
578 | \Default{0 \\ (all)} & |
---|
579 | Specifies the number of frames to be encoded. |
---|
580 | \\ |
---|
581 | \end{OptionTable} |
---|
582 | |
---|
583 | %% |
---|
584 | %% profile, level and conformance options |
---|
585 | %% |
---|
586 | \begin{OptionTable}{Profile and level parameters} |
---|
587 | \Option{Profile} & |
---|
588 | \ShortOption{\None} & |
---|
589 | \Default{none} & |
---|
590 | Specifies the profile to which the encoded bitstream complies. |
---|
591 | Valid values are: none, main, main10, main-still-picture. |
---|
592 | |
---|
593 | Compatibility flags are automatically determined according to the profile. |
---|
594 | If --Profile=main, then main10 will always be signalled as compatible. |
---|
595 | If --Profile=main10, then main will be signalled as compatible if the bit-depth is 8-bit. |
---|
596 | |
---|
597 | NB: There is currently no validation that the encoder configuration complies with the profile and level constraints. |
---|
598 | \\ |
---|
599 | |
---|
600 | \Option{Level} & |
---|
601 | \ShortOption{\None} & |
---|
602 | \Default{none} & |
---|
603 | Specifies the level to which the encoded bitstream complies. |
---|
604 | Valid values are: none, 1, 2, 2.1, 3, 3.1, 4, 4.1, 5, 5.1, 5.2, 6, 6.1, 6.2. |
---|
605 | |
---|
606 | NB: There is currently no validation that the encoder configuration complies with the profile and level constraints. |
---|
607 | \\ |
---|
608 | |
---|
609 | \Option{Tier} & |
---|
610 | \ShortOption{\None} & |
---|
611 | \Default{main} & |
---|
612 | Specifies the level tier to which the encoded bitsream complies. |
---|
613 | Valid values are: main, high. |
---|
614 | |
---|
615 | NB: There is currently no validation that the encoder configuration complies with the profile and level constraints. |
---|
616 | \\ |
---|
617 | |
---|
618 | \Option{ProgressiveSource} & |
---|
619 | \ShortOption{\None} & |
---|
620 | \Default{false} & |
---|
621 | Specifies the value of general_progressive_source_flag |
---|
622 | \\ |
---|
623 | |
---|
624 | \Option{InterlacedSource} & |
---|
625 | \ShortOption{\None} & |
---|
626 | \Default{false} & |
---|
627 | Specifies the value of general_interlaced_source_flag |
---|
628 | \\ |
---|
629 | |
---|
630 | \Option{NonPackedSource} & |
---|
631 | \ShortOption{\None} & |
---|
632 | \Default{false} & |
---|
633 | Specifies the value of general_non_packed_constraint_flag |
---|
634 | \\ |
---|
635 | |
---|
636 | \Option{FrameOnly} & |
---|
637 | \ShortOption{\None} & |
---|
638 | \Default{false} & |
---|
639 | Specifies the value of general_frame_only_constraint_flag |
---|
640 | \\ |
---|
641 | |
---|
642 | \end{OptionTable} |
---|
643 | |
---|
644 | |
---|
645 | %% |
---|
646 | %% Unit definition parameters |
---|
647 | %% |
---|
648 | \begin{OptionTable}{Unit definition parameters} |
---|
649 | \Option{MaxCUWidth} & |
---|
650 | \ShortOption{\None} & |
---|
651 | \Default{64} & |
---|
652 | Defines the maximum CU width. |
---|
653 | \\ |
---|
654 | |
---|
655 | \Option{MaxCUHeight} & |
---|
656 | \ShortOption{\None} & |
---|
657 | \Default{64} & |
---|
658 | Defines the maximum CU height. |
---|
659 | \\ |
---|
660 | |
---|
661 | \Option{MaxCUSize} & |
---|
662 | \ShortOption{\None} & |
---|
663 | \Default{64} & |
---|
664 | Defines the maximum CU size. |
---|
665 | \\ |
---|
666 | |
---|
667 | \Option{MaxPartitionDepth} & |
---|
668 | \ShortOption{-h} & |
---|
669 | \Default{4} & |
---|
670 | Defines the depth of the CU tree. |
---|
671 | \\ |
---|
672 | |
---|
673 | \Option{QuadtreeTULog2MaxSize} & |
---|
674 | \ShortOption{\None} & |
---|
675 | \Default{6 \\ ($= \mathrm{log}_2(64)$)} & |
---|
676 | Defines the Maximum TU size in logarithm base 2. |
---|
677 | \\ |
---|
678 | |
---|
679 | \Option{QuadtreeTULog2MinSize} & |
---|
680 | \ShortOption{\None} & |
---|
681 | \Default{2 \\ ($= \mathrm{log}_2(4)$)} & |
---|
682 | Defines the Minimum TU size in logarithm base 2. |
---|
683 | \\ |
---|
684 | |
---|
685 | \Option{QuadtreeTUMaxDepthIntra} & |
---|
686 | \ShortOption{\None} & |
---|
687 | \Default{1} & |
---|
688 | Defines the depth of the TU tree for intra CUs. |
---|
689 | \\ |
---|
690 | |
---|
691 | \Option{QuadtreeTUMaxDepthInter} & |
---|
692 | \ShortOption{\None} & |
---|
693 | \Default{2} & |
---|
694 | Defines the depth of the TU tree for inter CUs. |
---|
695 | \\ |
---|
696 | \end{OptionTable} |
---|
697 | |
---|
698 | |
---|
699 | %% |
---|
700 | %% Coding structure parameters |
---|
701 | %% |
---|
702 | \begin{OptionTable}{Coding structure parameters} |
---|
703 | \Option{IntraPeriod} & |
---|
704 | \ShortOption{-ip} & |
---|
705 | \Default{$-1$} & |
---|
706 | Specifies the intra frame period. |
---|
707 | A value of $-1$ implies an infinite period. |
---|
708 | \\ |
---|
709 | |
---|
710 | \Option{DecodingRefreshType} & |
---|
711 | \ShortOption{-dr} & |
---|
712 | \Default{0} & |
---|
713 | Specifies the type of decoding refresh to apply at the intra frame period |
---|
714 | picture. |
---|
715 | \par |
---|
716 | \begin{tabular}{cp{0.45\textwidth}} |
---|
717 | 0 & Applies an I picture (not a clean random access point). \\ |
---|
718 | 1 & Applies a non-IDR clean random access point (open GOP). \\ |
---|
719 | 2 & Applies an IDR random access point (closed GOP). \\ |
---|
720 | \end{tabular} |
---|
721 | \\ |
---|
722 | |
---|
723 | \Option{GOPSize} & |
---|
724 | \ShortOption{-g} & |
---|
725 | \Default{1} & |
---|
726 | Specifies the size of the cyclic GOP structure. |
---|
727 | \\ |
---|
728 | |
---|
729 | \Option{Frame\emph{N}} & |
---|
730 | \ShortOption{\None} & |
---|
731 | \Default{\NotSet} & |
---|
732 | Multiple options that define the cyclic GOP structure that will be used |
---|
733 | repeatedly throughout the sequence. The table should contain GOPSize |
---|
734 | elements. |
---|
735 | \par |
---|
736 | See section~\ref{sec:gop-structure} for further details. |
---|
737 | \\ |
---|
738 | |
---|
739 | \Option{ListCombination} & |
---|
740 | \ShortOption{-lc} & |
---|
741 | \Default{true} & |
---|
742 | Enables or disables the use of the combined reference list for uni-prediction |
---|
743 | in B-slices. |
---|
744 | \par |
---|
745 | \begin{tabular}{cp{0.45\textwidth}} |
---|
746 | 0 & Reference list~0 and reference list~1 are identical and reference |
---|
747 | list~0 is used as the combined reference list. \\ |
---|
748 | 1 & The combined reference list is derived from reference list~0 and |
---|
749 | reference list~1. \\ |
---|
750 | \end{tabular} |
---|
751 | NB: LComb can only be 0 in low delay coding (more precisely, when list 0 |
---|
752 | and list 1 are the same) |
---|
753 | \\ |
---|
754 | \end{OptionTable} |
---|
755 | |
---|
756 | |
---|
757 | %% |
---|
758 | %% Motion estimation parameters |
---|
759 | %% |
---|
760 | \begin{OptionTable}{Motion estimation parameters} |
---|
761 | \Option{FastSearch} & |
---|
762 | \ShortOption{\None} & |
---|
763 | \Default{true} & |
---|
764 | Enables or disables the use of a fast motion search. |
---|
765 | \par |
---|
766 | \begin{tabular}{cp{0.45\textwidth}} |
---|
767 | 0 & Full search method \\ |
---|
768 | 1 & Fast search method \\ |
---|
769 | \end{tabular} |
---|
770 | \\ |
---|
771 | |
---|
772 | \Option{SearchRange} & |
---|
773 | \ShortOption{-sr} & |
---|
774 | \Default{96} & |
---|
775 | Specifies the search range used for motion estimation. |
---|
776 | |
---|
777 | Note: the search range is defined around a predictor. Motion vectors |
---|
778 | derived by the motion estimation may thus have values larger than the |
---|
779 | search range. |
---|
780 | \\ |
---|
781 | |
---|
782 | \Option{BipredSearchRange} & |
---|
783 | \ShortOption{\None} & |
---|
784 | \Default{4} & |
---|
785 | Specifies the search range used for bi-prediction refinement in motion |
---|
786 | estimation. |
---|
787 | \\ |
---|
788 | |
---|
789 | \Option{HadamardME} & |
---|
790 | \ShortOption{\None} & |
---|
791 | \Default{true} & |
---|
792 | Enables or disables the use of the Hadamard transform in fractional-pel motion |
---|
793 | estimation. |
---|
794 | \par |
---|
795 | \begin{tabular}{cp{0.45\textwidth}} |
---|
796 | 0 & SAD for cost estimation \\ |
---|
797 | 1 & Hadamard for cost estimation \\ |
---|
798 | \end{tabular} |
---|
799 | \\ |
---|
800 | |
---|
801 | \Option{ASR} & |
---|
802 | \ShortOption{\None} & |
---|
803 | \Default{false} & |
---|
804 | Enables or disables the use of adaptive search ranges, where the motion |
---|
805 | search range is dynamically adjusted according to the POC difference |
---|
806 | between the current and the reference pictures. |
---|
807 | \begin{displaymath} |
---|
808 | \resizebox{\hsize}{!}{$ |
---|
809 | \mathrm{SearchRange}’ = \mathrm{Round}\left( |
---|
810 | \mathrm{SearchRange} |
---|
811 | * \mathrm{ADAPT\_SR\_SCALE} |
---|
812 | * \frac{\mathrm{abs}( |
---|
813 | \mathrm{POCcur} - \mathrm{POCref} )}{ |
---|
814 | \mathrm{RateGOPSize}}\right) |
---|
815 | $} |
---|
816 | \end{displaymath} |
---|
817 | \\ |
---|
818 | \end{OptionTable} |
---|
819 | |
---|
820 | |
---|
821 | %% |
---|
822 | %% Mode decision parameters |
---|
823 | %% |
---|
824 | \begin{OptionTable}{Mode decision parameters} |
---|
825 | \Option{LambdaModifier$N$} & |
---|
826 | \ShortOption{-LM$N$} & |
---|
827 | \Default{1.0} & |
---|
828 | Specifies a value that is multiplied with the Lagrange multiplier |
---|
829 | $\lambda$, for use in the rate-distortion optimised cost calculation |
---|
830 | when encoding temporal layer~$N$. |
---|
831 | \par |
---|
832 | $N$ may be in the range 0--7. |
---|
833 | \\ |
---|
834 | |
---|
835 | \Option{FEN} & |
---|
836 | \ShortOption{\None} & |
---|
837 | \Default{false} & |
---|
838 | Enables or disables the use of fast encoder mode. When enabled, |
---|
839 | the following occurs: |
---|
840 | \begin{itemize} |
---|
841 | \item In the SAD computation for blocks having size larger than 8, only |
---|
842 | the lines of even rows in the block are considered. |
---|
843 | \item The number of iterations used in the bi-directional motion vector |
---|
844 | refinement in the motion estimation process is reduced from 4 to 1. |
---|
845 | \end{itemize} |
---|
846 | \\ |
---|
847 | |
---|
848 | \Option{FDM} & |
---|
849 | \ShortOption{\None} & |
---|
850 | \Default{true} & |
---|
851 | Enables or disables the use of fast encoder decisions for 2Nx2N merge |
---|
852 | mode. When enabled, the RD cost for the merge mode of the current |
---|
853 | candidate is not evaluated if the merge skip mode was the best merge |
---|
854 | mode for one of the previous candidates. |
---|
855 | \\ |
---|
856 | |
---|
857 | \Option{RDpenalty} & |
---|
858 | \ShortOption{\None} & |
---|
859 | \Default{0} & |
---|
860 | RD-penalty for 32x32 TU for intra in non-intra slices. |
---|
861 | Enabling this parameter can reduce the visibility of CU boundaries in the coded picture. |
---|
862 | \par |
---|
863 | \begin{tabular}{cp{0.45\textwidth}} |
---|
864 | 0 & No RD-penalty \\ |
---|
865 | 1 & RD-penalty \\ |
---|
866 | 2 & Maximum RD-penalty (no 32x32 TU)\\ |
---|
867 | \end{tabular} |
---|
868 | \\ |
---|
869 | |
---|
870 | \end{OptionTable} |
---|
871 | |
---|
872 | %% |
---|
873 | %% Quantization parameters |
---|
874 | %% |
---|
875 | \begin{OptionTable}{Quantization parameters} |
---|
876 | \Option{QP} & |
---|
877 | \ShortOption{-q} & |
---|
878 | \Default{30.0} & |
---|
879 | Specifies the base value of the quantization parameter. |
---|
880 | \\ |
---|
881 | |
---|
882 | \Option{CbQpOffset}% |
---|
883 | \Option{CrQpOffset} & |
---|
884 | \ShortOption{-cbqpofs}% |
---|
885 | \ShortOption{-crqpofs} & |
---|
886 | \Default{0}% |
---|
887 | \Default{0} & |
---|
888 | Global offset to apply to the luma QP to derive the QP of Cb and Cr |
---|
889 | respectively. These options correspond to the values of cb_qp_offset |
---|
890 | and cr_qp_offset, that are transmitted in the PPS. Valid values are in |
---|
891 | the range $[-12, 12]$. |
---|
892 | \\ |
---|
893 | |
---|
894 | \Option{MaxCuDQPDepth} & |
---|
895 | \ShortOption{\None} & |
---|
896 | \Default{0} & |
---|
897 | Defines maximum depth of a minimum CuDQP for sub-LCU-level delta QP. |
---|
898 | MaxCuDQPDepth shall be greater than or equal to SliceGranularity. |
---|
899 | \\ |
---|
900 | |
---|
901 | \Option{RDOQ} & |
---|
902 | \ShortOption{\None} & |
---|
903 | \Default{true} & |
---|
904 | Enables or disables rate-distortion-optimized quantization. |
---|
905 | \\ |
---|
906 | |
---|
907 | \Option{RDOQTS} & |
---|
908 | \ShortOption{\None} & |
---|
909 | \Default{true} & |
---|
910 | Enables or disables rate-distortion-optimized quantization for transform-skipped TUs. |
---|
911 | \\ |
---|
912 | |
---|
913 | \Option{DeltaQpRD} & |
---|
914 | \ShortOption{-dqr} & |
---|
915 | \Default{0} & |
---|
916 | Specifies the maximum QP offset at slice level for multi-pass slice |
---|
917 | encoding. When encoding, each slice is tested multiple times by using |
---|
918 | slice QP values in the range $[-\mathrm{DeltaQpRD}, \mathrm{DeptaQpRD}]$, |
---|
919 | and the best QP value is chosen as the slice QP. |
---|
920 | \\ |
---|
921 | |
---|
922 | \Option{MaxDeltaQP} & |
---|
923 | \ShortOption{-d} & |
---|
924 | \Default{0} & |
---|
925 | Specifies the maximum QP offset at the largest coding unit level for |
---|
926 | the block-level adaptive QP assignment scheme. In the encoder, each |
---|
927 | largest coding unit is tested multiple times by using the QP values in |
---|
928 | the range $[-\mathrm{MaxDeltaQP}, \mathrm{MaxDeltaQP}]$, and the best QP |
---|
929 | value is chosen as the QP value of the largest coding unit. |
---|
930 | \\ |
---|
931 | |
---|
932 | \Option{dQPFile} & |
---|
933 | \ShortOption{-m} & |
---|
934 | \Default{\NotSet} & |
---|
935 | Specifies a file containing a list of QP deltas. The $n$-th line |
---|
936 | (where $n$ is 0 for the first line) of this file corresponds to the QP |
---|
937 | value delta for the picture with POC value $n$. |
---|
938 | \\ |
---|
939 | |
---|
940 | \Option{AdaptiveQpSelection} & |
---|
941 | \ShortOption{-aqps} & |
---|
942 | \Default{false} & |
---|
943 | Specifies whether QP values for non-I frames will be calculated on the |
---|
944 | fly based on statistics of previously coded frames. |
---|
945 | \\ |
---|
946 | \Option{RecalculateQPAccordingToLambda} & |
---|
947 | \ShortOption{\None} & |
---|
948 | \Default{false} & |
---|
949 | Recalculate QP values according to lambda values. Do not suggest to be enabled in all intra case. |
---|
950 | \\ |
---|
951 | \end{OptionTable} |
---|
952 | |
---|
953 | |
---|
954 | |
---|
955 | %% |
---|
956 | %% Entropy coding parameters |
---|
957 | %% |
---|
958 | \begin{OptionTable}{Entropy coding parameters} |
---|
959 | \Option{SBACRD} & |
---|
960 | \ShortOption{\None} & |
---|
961 | \Default{true} & |
---|
962 | Enables or disables the use of bit counts from arithmetic coder in |
---|
963 | rate-distortion decisions. |
---|
964 | \\ |
---|
965 | \end{OptionTable} |
---|
966 | |
---|
967 | |
---|
968 | %% |
---|
969 | %% Slice coding parameters |
---|
970 | %% |
---|
971 | \begin{OptionTable}{Slice coding parameters} |
---|
972 | %\Option{SliceGranularity} & |
---|
973 | %\ShortOption{\None} & |
---|
974 | %\Default{0} & |
---|
975 | %Determines the depth in an LCU at which slices may begin and end. |
---|
976 | %\par |
---|
977 | %\begin{tabular}{cp{0.45\textwidth}} |
---|
978 | % 0 & Slice addresses are LCU aligned \\ |
---|
979 | % $1 \leq n \leq 3$ |
---|
980 | % & Slice start addresses are aligned to CUs at depth $n$ \\ |
---|
981 | %\end{tabular} |
---|
982 | % |
---|
983 | %Note: The smallest permissible alignment is 16x16 CUs. |
---|
984 | %Values of $n$ must satisfy this constraint, for example, with a 64x64 |
---|
985 | %LCU, $n$ must be less than or equal to 2. |
---|
986 | %\\ |
---|
987 | |
---|
988 | \Option{SliceMode} & |
---|
989 | \ShortOption{\None} & |
---|
990 | \Default{0} & |
---|
991 | Controls the slice partitioning method in conjunction with |
---|
992 | SliceArgument. |
---|
993 | \par |
---|
994 | \begin{tabular}{cp{0.45\textwidth}} |
---|
995 | 0 & Single slice \\ |
---|
996 | 1 & Maximum number of CTUs per slice \\ |
---|
997 | 2 & Maximum number of bytes per slice \\ |
---|
998 | 3 & Maximum number of tiles per slice \\ |
---|
999 | \end{tabular} |
---|
1000 | \\ |
---|
1001 | |
---|
1002 | \Option{SliceArgument} & |
---|
1003 | \ShortOption{\None} & |
---|
1004 | \Default{\NotSet} & |
---|
1005 | Specifies the maximum number of CTUs, bytes or tiles in a slice depending on the |
---|
1006 | SliceMode setting. |
---|
1007 | \\ |
---|
1008 | |
---|
1009 | \Option{SliceSegmentMode} & |
---|
1010 | \ShortOption{\None} & |
---|
1011 | \Default{0} & |
---|
1012 | Enables (dependent) slice segment coding in conjunction with |
---|
1013 | SliceSegmentArgument. |
---|
1014 | \par |
---|
1015 | \begin{tabular}{cp{0.45\textwidth}} |
---|
1016 | 0 & Single slice \\ |
---|
1017 | 1 & Maximum number of CTUs per slice segment\\ |
---|
1018 | 2 & Maximum number of bytes per slice segment\\ |
---|
1019 | 3 & Maximum number of tiles per slice segment\\ |
---|
1020 | \end{tabular} |
---|
1021 | \\ |
---|
1022 | |
---|
1023 | \Option{SliceSegmentArgument} & |
---|
1024 | \ShortOption{\None} & |
---|
1025 | \Default{\NotSet} & |
---|
1026 | Defines the maximum number of CTUs, bytes or tiles a slice segment |
---|
1027 | depending on the SliceSegmentMode setting. |
---|
1028 | \\ |
---|
1029 | |
---|
1030 | \Option{WaveFrontSynchro} & |
---|
1031 | \ShortOption{\None} & |
---|
1032 | \Default{false} & |
---|
1033 | Enables the use of specific CABAC probabilities synchronization at the |
---|
1034 | beginning of each line of CTBs in order to produce a bitstream that can |
---|
1035 | be encoded or decoded using one or more cores. |
---|
1036 | \\ |
---|
1037 | |
---|
1038 | \Option{NumTileColumnsMinus1}% |
---|
1039 | \Option{NumTileRowsMinus1} & |
---|
1040 | \ShortOption{\None} & |
---|
1041 | \Default{0} & |
---|
1042 | Specifies the tile based picture partitioning geometry as |
---|
1043 | $\mathrm{NumTileColumnsMinus1} + 1 \times \mathrm{NumTileRowsMinus1} + 1$ |
---|
1044 | columns and rows. |
---|
1045 | \\ |
---|
1046 | |
---|
1047 | \Option{UniformSpacingIdc} & |
---|
1048 | \ShortOption{\None} & |
---|
1049 | \Default{0} & |
---|
1050 | Controls the mode used to determine per row and column tile sizes. |
---|
1051 | \par |
---|
1052 | \begin{tabular}{cp{0.45\textwidth}} |
---|
1053 | 0 & Each tile column width and tile row height is explicitly set |
---|
1054 | by ColumnWidthArray and RowHeightArray respectively \\ |
---|
1055 | 1 & Tile columns and tile rows are uniformly spaced. \\ |
---|
1056 | \end{tabular} |
---|
1057 | \\ |
---|
1058 | |
---|
1059 | \Option{ColumnWidthArray}% |
---|
1060 | \Option{RowHeightArray} & |
---|
1061 | \ShortOption{\None} & |
---|
1062 | \Default{\NotSet} & |
---|
1063 | Specifies a space or comma separated list of widths and heights, |
---|
1064 | respectively, of each tile column or tile row. The first value in the |
---|
1065 | list corresponds to the leftmost tile column or topmost tile row. |
---|
1066 | \\ |
---|
1067 | \end{OptionTable} |
---|
1068 | |
---|
1069 | |
---|
1070 | |
---|
1071 | %% |
---|
1072 | %% Deblocking filter parameters |
---|
1073 | %% |
---|
1074 | \begin{OptionTable}{Deblocking filter parameters} |
---|
1075 | \Option{LoopFilterDisable} & |
---|
1076 | \ShortOption{\None} & |
---|
1077 | \Default{false} & |
---|
1078 | Enables or disables the in-loop deblocking filter. |
---|
1079 | \\ |
---|
1080 | |
---|
1081 | \Option{LFCrossSliceBoundaryFlag} & |
---|
1082 | \ShortOption{\None} & |
---|
1083 | \Default{true} & |
---|
1084 | Enables or disables the use of in-loop filtering across slice |
---|
1085 | boundaries. |
---|
1086 | \\ |
---|
1087 | |
---|
1088 | \Option{DeblockingFilterControlPresent}& |
---|
1089 | \ShortOption{\None}& |
---|
1090 | \Default{false}& |
---|
1091 | Enables or disables the presence of the deblocking filter control |
---|
1092 | parameters in the picture parameter set and in the slice segment header. |
---|
1093 | When disabled, the default deblocking filter parameters are used. |
---|
1094 | \\ |
---|
1095 | |
---|
1096 | \Option{LoopFilterOffsetInPPS}& |
---|
1097 | \ShortOption{\None}& |
---|
1098 | \Default{false}& |
---|
1099 | If enabled, the in-loop deblocking filter control parameters are sent in PPS. |
---|
1100 | Otherwise, the in-loop deblocking filter control parameters are sent in the slice segment header. |
---|
1101 | If deblocking filter parameters are sent in PPS, the same values of deblocking filter parameters |
---|
1102 | are used for all pictures in the sequence (i.e. deblocking parameter = base parameter value). |
---|
1103 | If deblocking filter parameters are sent in the slice segment header, varying deblocking filter |
---|
1104 | parameters can be specified by setting parameters tcOffsetDiv2 and betaOffsetDiv2 in the GOP structure table. |
---|
1105 | In this case, the final value of the deblocking filter parameter sent for a certain GOP picture is equal to |
---|
1106 | (base parameter + GOP parameter for this picture). Intra-pictures use the base parameters values. |
---|
1107 | \\ |
---|
1108 | |
---|
1109 | \Option{LoopFilterTcOffset_div2}& |
---|
1110 | \ShortOption{\None}& |
---|
1111 | \Default{0}& |
---|
1112 | Specifies the base value for the in-loop deblocking filter parameter tc_offset_div2. The final value of tc_offset_div2 |
---|
1113 | shall be an integer number in the range $-6..6$. |
---|
1114 | \\ |
---|
1115 | |
---|
1116 | \Option{LoopFilterBetaOffset_div2}& |
---|
1117 | \ShortOption{\None}& |
---|
1118 | \Default{0}& |
---|
1119 | Specifies the base value for the in-loop deblocking filter parameter beta_offset_div2. The final value of beta_offset_div2 |
---|
1120 | shall be an integer number in the range $-6..6$. |
---|
1121 | \\ |
---|
1122 | |
---|
1123 | \end{OptionTable} |
---|
1124 | |
---|
1125 | |
---|
1126 | |
---|
1127 | %% |
---|
1128 | %% Coding tools parameters |
---|
1129 | %% |
---|
1130 | \begin{OptionTable}{Coding tools parameters} |
---|
1131 | %\Option{ALF} & |
---|
1132 | %\ShortOption{\None} & |
---|
1133 | %\Default{true} & |
---|
1134 | %Enables or disables the adaptive loop filter. |
---|
1135 | %\\ |
---|
1136 | |
---|
1137 | %\Option{ALFLowLatencyEncode} & |
---|
1138 | %\ShortOption{\None} & |
---|
1139 | %\Default{false} & |
---|
1140 | %Specifies the operating mode (low latency or high efficiency) of the |
---|
1141 | %adaptive loop filter. |
---|
1142 | %\\ |
---|
1143 | |
---|
1144 | \Option{SAO} & |
---|
1145 | \ShortOption{\None} & |
---|
1146 | \Default{true} & |
---|
1147 | Enables or disables the sample adaptive offset (SAO) filter. |
---|
1148 | \\ |
---|
1149 | |
---|
1150 | \Option{SAOLcuBoundary} & |
---|
1151 | \ShortOption{\None} & |
---|
1152 | \Default{false} & |
---|
1153 | Enables or disables SAO parameter estimation using non-deblocked pixels |
---|
1154 | for LCU bottom and right boundary areas. |
---|
1155 | \\ |
---|
1156 | |
---|
1157 | %\Option{LMChroma} & |
---|
1158 | %\ShortOption{\None} & |
---|
1159 | %\Default{true} & |
---|
1160 | %Enables or disables the intra chroma-from-luma prediction mode. |
---|
1161 | %\\ |
---|
1162 | |
---|
1163 | %\Option{NSQT} & |
---|
1164 | %\ShortOption{\None} & |
---|
1165 | %\Default{true} & |
---|
1166 | %Enables or disables the non-square quadtree transform. |
---|
1167 | %\\ |
---|
1168 | |
---|
1169 | \Option{ConstrainedIntraPred} & |
---|
1170 | \ShortOption{\None} & |
---|
1171 | \Default{false} & |
---|
1172 | Enables or disables constrained intra prediction. Constrained intra |
---|
1173 | prediction only permits samples from intra blocks in the same slice as the |
---|
1174 | current block to be used for intra prediction. |
---|
1175 | \\ |
---|
1176 | |
---|
1177 | \Option{TransquantBypassEnableFlag} & |
---|
1178 | \ShortOption{\None} & |
---|
1179 | \Default{false} & |
---|
1180 | Enables or disables the ability to bypass the transform, |
---|
1181 | quantization and filtering stages at CU level. |
---|
1182 | This option corresponds to the value of |
---|
1183 | transquant_bypass_enable_flag that is transmitted in the PPS. |
---|
1184 | |
---|
1185 | See CUTransquantBypassFlagValue for further details. |
---|
1186 | \\ |
---|
1187 | |
---|
1188 | \Option{CUTransquantBypassFlagValue} & |
---|
1189 | \ShortOption{\None} & |
---|
1190 | \Default{0} & |
---|
1191 | Controls the per CU transformation, quantization and filtering |
---|
1192 | mode decision. |
---|
1193 | This option corresponds to the value of the per CU cu_transquant_bypass_flag. |
---|
1194 | \par |
---|
1195 | \begin{tabular}{cp{0.45\textwidth}} |
---|
1196 | 0 & Bypass is not performed on any CU \\ |
---|
1197 | 1 & Bypass is performed on all CUs \\ |
---|
1198 | \end{tabular} |
---|
1199 | |
---|
1200 | This option has no effect if TransquantBypassEnableFlag is disabled. |
---|
1201 | \\ |
---|
1202 | |
---|
1203 | \Option{PCMEnabledFlag} & |
---|
1204 | \ShortOption{\None} & |
---|
1205 | \Default{false} & |
---|
1206 | Enables or disables the use of PCM. |
---|
1207 | \\ |
---|
1208 | |
---|
1209 | \Option{PCMLog2MaxSize} & |
---|
1210 | \ShortOption{\None} & |
---|
1211 | \Default{5 \\ ($= \mathrm{log}_2(32)$)} & |
---|
1212 | Specifies log2 of the maximum PCM block size. When PCM is enabled, the |
---|
1213 | PCM mode is available for 2Nx2N intra PUs smaller than or equal to the |
---|
1214 | specified maximum PCM block size |
---|
1215 | \\ |
---|
1216 | |
---|
1217 | \Option{PCMLog2MinSize} & |
---|
1218 | \ShortOption{\None} & |
---|
1219 | \Default{3} & |
---|
1220 | Specifies log2 of the minimum PCM block size. When PCM is enabled, the |
---|
1221 | PCM mode is available for 2Nx2N intra PUs larger than or equal to the |
---|
1222 | specified minimum PCM block size. |
---|
1223 | \par |
---|
1224 | When larger than PCMLog2MaxSize, PCM mode is not used. |
---|
1225 | \\ |
---|
1226 | |
---|
1227 | \Option{PCMInputBitDepthFlag} & |
---|
1228 | \ShortOption{\None} & |
---|
1229 | \Default{1} & |
---|
1230 | If enabled specifies that PCM sample bit-depth is set equal to |
---|
1231 | InputBitDepth. Otherwise, it specifies that PCM sample bit-depth is set |
---|
1232 | equal to InternalBitDepth. |
---|
1233 | \\ |
---|
1234 | |
---|
1235 | \Option{PCMFilterDisableFlag} & |
---|
1236 | \ShortOption{\None} & |
---|
1237 | \Default{false} & |
---|
1238 | If enabled specifies that loop-filtering on reconstructed samples of PCM |
---|
1239 | blocks is skipped. Otherwise, it specifies that loop-filtering on |
---|
1240 | reconstructed samples of PCM blocks is not skipped. |
---|
1241 | % 0 = (loop-filtering is not skipped for PCM samples). |
---|
1242 | \\ |
---|
1243 | |
---|
1244 | \Option{WeightedPredP} & |
---|
1245 | \ShortOption{-wpP} & |
---|
1246 | \Default{false} & |
---|
1247 | Enables the use of weighted prediction in P slices. |
---|
1248 | \\ |
---|
1249 | |
---|
1250 | \Option{WeightedPredB} & |
---|
1251 | \ShortOption{-wpB} & |
---|
1252 | \Default{false} & |
---|
1253 | Enables the use of weighted prediction in B slices. |
---|
1254 | \\ |
---|
1255 | |
---|
1256 | \Option{SignHideFlag} & |
---|
1257 | \ShortOption{-SBH} & |
---|
1258 | \Default{true} & |
---|
1259 | If enabled specifies that for each 4x4 coefficient group for which the |
---|
1260 | number of coefficients between the first nonzero coefficient and the |
---|
1261 | last nonzero coefficient along the scanning line exceeds 4, the sign bit |
---|
1262 | of the first nonzero coefficient will not be directly transmitted in the |
---|
1263 | bitstream, but may be inferred from the parity of the sum of all nonzero |
---|
1264 | coefficients in the current coefficient group. |
---|
1265 | \\ |
---|
1266 | |
---|
1267 | \Option{StrongIntraSmoothing} & |
---|
1268 | \ShortOption{-sis} & |
---|
1269 | \Default{true} & |
---|
1270 | If enabled specifies that for 32x32 intra prediction block, the intra smoothing |
---|
1271 | when applied is either the 1:2:1 smoothing filter or a stronger bi-linear |
---|
1272 | interpolation filter. Key reference sample values are tested and if the criteria |
---|
1273 | is satisfied, the stronger intra smoothing filter is applied. |
---|
1274 | If disabled, the intra smoothing filter when applied is the 1:2:1 smoothing filter. |
---|
1275 | \\ |
---|
1276 | |
---|
1277 | \Option{TMVPMode} & |
---|
1278 | \ShortOption{\None} & |
---|
1279 | \Default{1} & |
---|
1280 | Controls the temporal motion vector prediction mode. |
---|
1281 | \par |
---|
1282 | \begin{tabular}{cp{0.45\textwidth}} |
---|
1283 | 0 & Disabled for all slices. \\ |
---|
1284 | 1 & Enabled for all slices. \\ |
---|
1285 | 2 & Disabled only for the first picture of each GOPSize. \\ |
---|
1286 | \end{tabular} |
---|
1287 | \\ |
---|
1288 | |
---|
1289 | \Option{TransformSkip} & |
---|
1290 | \ShortOption{\None} & |
---|
1291 | \Default{false} & |
---|
1292 | Enables or disables transform-skipping mode decision for 4x4 TUs |
---|
1293 | \footnote{Enables transform_skip_enabled and per 4x4 TU tests}. |
---|
1294 | \\ |
---|
1295 | |
---|
1296 | \Option{TransformSkipFast} & |
---|
1297 | \ShortOption{\None} & |
---|
1298 | \Default{false} & |
---|
1299 | Enables or disables reduced testing of the transform-skipping mode |
---|
1300 | decision for chroma TUs. When enabled, no RDO search is performed for |
---|
1301 | chroma TUs, instead they are transform-skipped if the four corresponding |
---|
1302 | luma TUs are also skipped. |
---|
1303 | \par |
---|
1304 | This option has no effect if TransformSkip is disabled. |
---|
1305 | \\ |
---|
1306 | \end{OptionTable} |
---|
1307 | |
---|
1308 | %% |
---|
1309 | %% Rate control parameters |
---|
1310 | %% |
---|
1311 | \begin{OptionTable}{Rate control parameters} |
---|
1312 | |
---|
1313 | \Option{RateControl} & |
---|
1314 | \ShortOption{\None} & |
---|
1315 | \Default{false} & |
---|
1316 | Rate control: enables rate control or not. |
---|
1317 | \\ |
---|
1318 | |
---|
1319 | \Option{TargetBitrate} & |
---|
1320 | \ShortOption{\None} & |
---|
1321 | \Default{0} & |
---|
1322 | Rate control: target bitrate, in bps. |
---|
1323 | \\ |
---|
1324 | |
---|
1325 | \Option{KeepHierarchicalBit} & |
---|
1326 | \ShortOption{\None} & |
---|
1327 | \Default{false} & |
---|
1328 | Rate control: keep hierarchical bit allocation in rate control algorithm. |
---|
1329 | It is suggested to enable hierarchical bit allocation for hierarchical-B coding structure. |
---|
1330 | \\ |
---|
1331 | |
---|
1332 | \Option{LCULevelRateControl} & |
---|
1333 | \ShortOption{\None} & |
---|
1334 | \Default{true} & |
---|
1335 | Rate control: true: LCU level RC; false: picture level RC. |
---|
1336 | \\ |
---|
1337 | |
---|
1338 | \Option{RCLCUSeparateModel} & |
---|
1339 | \ShortOption{\None} & |
---|
1340 | \Default{true} & |
---|
1341 | Rate control: use LCU level separate R-lambda model or not. |
---|
1342 | When LCULevelRateControl is equal to false, this parameter is meaningless. |
---|
1343 | \\ |
---|
1344 | |
---|
1345 | \Option{InitialQP} & |
---|
1346 | \ShortOption{\None} & |
---|
1347 | \Default{0} & |
---|
1348 | Rate control: initial QP value for the first picture. |
---|
1349 | 0 to auto determine the initial QP value. |
---|
1350 | \\ |
---|
1351 | |
---|
1352 | \Option{RCForceIntraQP} & |
---|
1353 | \ShortOption{\None} & |
---|
1354 | \Default{false} & |
---|
1355 | Rate control: force intra QP to be equal to initial QP or not. |
---|
1356 | \\ |
---|
1357 | \end{OptionTable} |
---|
1358 | |
---|
1359 | %% |
---|
1360 | %% VUI parameters |
---|
1361 | %% |
---|
1362 | \begin{OptionTable}{VUI parameters} |
---|
1363 | \Option{VuiParametersPresent} & |
---|
1364 | \ShortOption{-vui} & |
---|
1365 | \Default{false} & |
---|
1366 | Enable generation of vui_parameters(). |
---|
1367 | \\ |
---|
1368 | \Option{AspectRatioInfoPresent} & |
---|
1369 | \ShortOption{} & |
---|
1370 | \Default{false} & |
---|
1371 | Signals whether aspect_ratio_idc is present. |
---|
1372 | \\ |
---|
1373 | \Option{AspectRatioIdc} & |
---|
1374 | \ShortOption{} & |
---|
1375 | \Default{0} & |
---|
1376 | aspect_ratio_idc |
---|
1377 | \\ |
---|
1378 | \Option{SarWidth} & |
---|
1379 | \ShortOption{} & |
---|
1380 | \Default{0} & |
---|
1381 | Specifies the horizontal size of the sample aspect ratio. |
---|
1382 | \\ |
---|
1383 | \Option{SarHeight} & |
---|
1384 | \ShortOption{} & |
---|
1385 | \Default{0} & |
---|
1386 | Specifies the vertical size of the sample aspect ratio. |
---|
1387 | \\ |
---|
1388 | \Option{OverscanInfoPresent} & |
---|
1389 | \ShortOption{} & |
---|
1390 | \Default{false} & |
---|
1391 | Signals whether overscan_info_present_flag is present. |
---|
1392 | \\ |
---|
1393 | \Option{OverscanAppropriate} & |
---|
1394 | \ShortOption{} & |
---|
1395 | \Default{false} & |
---|
1396 | Indicates whether cropped decoded pictures are suitable for display using overscan. |
---|
1397 | \par |
---|
1398 | \begin{tabular}{cp{0.45\textwidth}} |
---|
1399 | 0 & Indicates that the decoded pictures should not be displayed using overscan. \\ |
---|
1400 | 1 & Indicates that the decoded pictures may be displayed using overscan. \\ |
---|
1401 | \end{tabular} |
---|
1402 | \\ |
---|
1403 | \Option{VideoSignalTypePresent} & |
---|
1404 | \ShortOption{} & |
---|
1405 | \Default{false} & |
---|
1406 | Signals whether video_format, video_full_range_flag, and colour_description_present_flag are present. |
---|
1407 | \\ |
---|
1408 | \Option{VideoFormat} & |
---|
1409 | \ShortOption{} & |
---|
1410 | \Default{5} & |
---|
1411 | Indicates representation of pictures. |
---|
1412 | \\ |
---|
1413 | \Option{VideoFullRange} & |
---|
1414 | \ShortOption{} & |
---|
1415 | \Default{false} & |
---|
1416 | Indicates the black level and range of luma and chroma signals. |
---|
1417 | \par |
---|
1418 | \begin{tabular}{cp{0.45\textwidth}} |
---|
1419 | 0 & Indicates that the luma and chroma signals are to be scaled prior to display. \\ |
---|
1420 | 1 & Indicates that the luma and chroma signals are not to be scaled prior to display. \\ |
---|
1421 | \end{tabular} |
---|
1422 | \\ |
---|
1423 | \Option{ColourDescriptionPresent} & |
---|
1424 | \ShortOption{} & |
---|
1425 | \Default{false} & |
---|
1426 | Signals whether colour_primaries, transfer_characteristics and matrix_coefficients are present. |
---|
1427 | \\ |
---|
1428 | \Option{ColourPrimaries} & |
---|
1429 | \ShortOption{} & |
---|
1430 | \Default{2} & |
---|
1431 | Indicates chromaticity coordinates of the source primaries. |
---|
1432 | \\ |
---|
1433 | \Option{TransferCharateristics} & |
---|
1434 | \ShortOption{} & |
---|
1435 | \Default{2} & |
---|
1436 | Indicates the opto-electronic transfer characteristics of the source. |
---|
1437 | \\ |
---|
1438 | \Option{MatrixCoefficients} & |
---|
1439 | \ShortOption{} & |
---|
1440 | \Default{2} & |
---|
1441 | Describes the matrix coefficients used in deriving luma and chroma from RGB primaries. |
---|
1442 | \\ |
---|
1443 | \Option{ChromaLocInfoPresent} & |
---|
1444 | \ShortOption{} & |
---|
1445 | \Default{false} & |
---|
1446 | Signals whether chroma_sample_loc_type_top_field and chroma_sample_loc_type_bottom_field are present. |
---|
1447 | \\ |
---|
1448 | \Option{ChromaSampleLocTypeTopField} & |
---|
1449 | \ShortOption{} & |
---|
1450 | \Default{0} & |
---|
1451 | Specifies the location of chroma samples for top field. |
---|
1452 | \\ |
---|
1453 | \Option{ChromaSampleLocTypeBottomField} & |
---|
1454 | \ShortOption{} & |
---|
1455 | \Default{0} & |
---|
1456 | Specifies the location of chroma samples for bottom field. |
---|
1457 | \\ |
---|
1458 | \Option{NeutralChromaIndication} & |
---|
1459 | \ShortOption{} & |
---|
1460 | \Default{false} & |
---|
1461 | Indicates that the value of all decoded chroma samples is equal to 1<<(BitDepthCr-1). |
---|
1462 | \\ |
---|
1463 | |
---|
1464 | \Option{DefaultDisplayWindowFlag} & |
---|
1465 | \ShortOption{\None} & |
---|
1466 | \Default{0} & |
---|
1467 | Indicates the presence of the Default Window parameters. |
---|
1468 | \par |
---|
1469 | \begin{tabular}{cp{0.45\textwidth}} |
---|
1470 | 0 & Disabled \\ |
---|
1471 | 1 & Enabled \\ |
---|
1472 | \end{tabular} |
---|
1473 | \\ |
---|
1474 | |
---|
1475 | \Option{DefDispWinLeftOffset}% |
---|
1476 | \Option{DefDispWinRightOffset}% |
---|
1477 | \Option{DefDispWinTopOffset}% |
---|
1478 | \Option{DefDispWinBottomOffset} & |
---|
1479 | \ShortOption{\None} & |
---|
1480 | \Default{0} & |
---|
1481 | Specifies the horizontal and vertical offset to be applied to the |
---|
1482 | input video from the conformance window in luma samples. |
---|
1483 | Must be a multiple of the chroma resolution (e.g. a multiple of two for 4:2:0). |
---|
1484 | \\ |
---|
1485 | |
---|
1486 | \Option{BitstreamRestriction} & |
---|
1487 | \ShortOption{} & |
---|
1488 | \Default{false} & |
---|
1489 | Signals whether bitstream restriction parameters are present. |
---|
1490 | \\ |
---|
1491 | \Option{TilesFixedStructure} & |
---|
1492 | \ShortOption{} & |
---|
1493 | \Default{false} & |
---|
1494 | Indicates that each active picture parameter set has the same values of the syntax elements related to tiles. |
---|
1495 | \\ |
---|
1496 | \Option{MotionVectorsOverPicBoundaries} & |
---|
1497 | \ShortOption{} & |
---|
1498 | \Default{false} & |
---|
1499 | Indicates that no samples outside the picture boundaries are used for inter prediction. |
---|
1500 | \\ |
---|
1501 | \Option{MaxBytesPerPicDenom} & |
---|
1502 | \ShortOption{} & |
---|
1503 | \Default{2} & |
---|
1504 | Indicates a number of bytes not exceeded by the sum of the sizes of the VCL NAL units associated with any coded picture. |
---|
1505 | \\ |
---|
1506 | \Option{MaxBitsPerMinCuDenom} & |
---|
1507 | \ShortOption{} & |
---|
1508 | \Default{1} & |
---|
1509 | Indicates an upper bound for the number of bits of coding_unit() data. |
---|
1510 | \\ |
---|
1511 | \Option{Log2MaxMvLengthHorizontal} & |
---|
1512 | \ShortOption{} & |
---|
1513 | \Default{15} & |
---|
1514 | Indicate the maximum absolute value of a decoded horizontal MV component in quarter-pel luma units. |
---|
1515 | \\ |
---|
1516 | \Option{Log2MaxMvLengthVertical} & |
---|
1517 | \ShortOption{} & |
---|
1518 | \Default{15} & |
---|
1519 | Indicate the maximum absolute value of a decoded vertical MV component in quarter-pel luma units. |
---|
1520 | \\ |
---|
1521 | \end{OptionTable} |
---|
1522 | |
---|
1523 | %% |
---|
1524 | %% SEI messages |
---|
1525 | %% |
---|
1526 | \begin{OptionTable}{SEI messages} |
---|
1527 | \Option{SEIDecodedPictureHash} & |
---|
1528 | \ShortOption{\None} & |
---|
1529 | \Default{0} & |
---|
1530 | Enables or disables the calculation and insertion of the Decoded picture hash |
---|
1531 | SEI messages. |
---|
1532 | \par |
---|
1533 | \begin{tabular}{cp{0.45\textwidth}} |
---|
1534 | 0 & Disabled \\ |
---|
1535 | 1 & Transmits MD5 in SEI message and writes the value to the encoder |
---|
1536 | log \\ |
---|
1537 | 2 & Transmits CRC in SEI message and writes the value to the encoder |
---|
1538 | log \\ |
---|
1539 | 3 & Transmits checksum in SEI message and writes the value to the encoder |
---|
1540 | log \\ |
---|
1541 | \end{tabular} |
---|
1542 | \\ |
---|
1543 | \Option{SEIpictureDigest} & |
---|
1544 | \ShortOption{\None} & |
---|
1545 | \Default{0} & |
---|
1546 | Deprecated alias for SEIDecodedPictureHash. |
---|
1547 | Do not use anymore. |
---|
1548 | \\ |
---|
1549 | \Option{SEIRecoveryPoint} & |
---|
1550 | \ShortOption{\None} & |
---|
1551 | \Default{0} & |
---|
1552 | Enables or disables the insertion of the Recovery point |
---|
1553 | SEI messages. |
---|
1554 | \\ |
---|
1555 | \Option{SEIActiveParameterSets} & |
---|
1556 | \ShortOption{\None} & |
---|
1557 | \Default{0} & |
---|
1558 | Enables or disables the insertion of the Active parameter sets |
---|
1559 | SEI messages. |
---|
1560 | \\ |
---|
1561 | \Option{SEIBufferingPeriod} & |
---|
1562 | \ShortOption{\None} & |
---|
1563 | \Default{0} & |
---|
1564 | Enables or disables the insertion of the Buffering period |
---|
1565 | SEI messages. This option has no effect if VuiParametersPresent is disabled. |
---|
1566 | SEIBufferingPeriod requires SEIActiveParameterSets to be enabled. |
---|
1567 | \\ |
---|
1568 | \Option{SEIPictureTiming} & |
---|
1569 | \ShortOption{\None} & |
---|
1570 | \Default{0} & |
---|
1571 | Enables or disables the insertion of the Picture timing |
---|
1572 | SEI messages. This option has no effect if VuiParametersPresent is disabled. |
---|
1573 | \\ |
---|
1574 | \Option{SEIDecodingUnitInfo} & |
---|
1575 | \ShortOption{\None} & |
---|
1576 | \Default{0} & |
---|
1577 | Enables or disables the insertion of the Decoding unit information |
---|
1578 | SEI messages. This option has no effect if VuiParametersPresent is disabled. |
---|
1579 | \\ |
---|
1580 | \Option{SEIGradualDecodingRefreshInfo} & |
---|
1581 | \ShortOption{\None} & |
---|
1582 | \Default{0} & |
---|
1583 | Enables or disables the insertion of the Gradual decoding refresh information |
---|
1584 | SEI messages. |
---|
1585 | \\ |
---|
1586 | \Option{SEITemporalLevel0Index} & |
---|
1587 | \ShortOption{\None} & |
---|
1588 | \Default{0} & |
---|
1589 | Enables or disables the insertion of the Temporal level zero index |
---|
1590 | SEI messages. |
---|
1591 | \\ |
---|
1592 | \Option{SEIDisplayOrientation} & |
---|
1593 | \ShortOption{\None} & |
---|
1594 | \Default{0} & |
---|
1595 | Enables or disables the insertion of the Display orientation |
---|
1596 | SEI messages. |
---|
1597 | \par |
---|
1598 | \begin{tabular}{cp{0.30\textwidth}} |
---|
1599 | 0 & Disabled \\ |
---|
1600 | N: $0 < N < (2^{16} - 1)$ & Enable display orientation SEI message with |
---|
1601 | \mbox{anticlockwise_rotation = N} |
---|
1602 | and \mbox{display_orientation_repetition_period = 1} \\ |
---|
1603 | \end{tabular} |
---|
1604 | \\ |
---|
1605 | \Option{SEIFramePacking} & |
---|
1606 | \ShortOption{\None} & |
---|
1607 | \Default{0} & |
---|
1608 | Enables or disables the insertion of the Frame packing arrangement SEI messages. |
---|
1609 | \\ |
---|
1610 | \Option{SEIFramePackingType} & |
---|
1611 | \ShortOption{\None} & |
---|
1612 | \Default{0} & |
---|
1613 | Indicates the arrangement type in the Frame packing arrangement SEI message. |
---|
1614 | This option has no effect if SEIFramePacking is disabled. |
---|
1615 | \par |
---|
1616 | \begin{tabular}{cp{0.45\textwidth}} |
---|
1617 | 0 & Checkerboard \\ |
---|
1618 | 1 & Line Alternate \\ |
---|
1619 | 2 & Column Alternate \\ |
---|
1620 | 3 & Side by Side \\ |
---|
1621 | 4 & Top Bottom \\ |
---|
1622 | 5 & Frame Alternate \\ |
---|
1623 | 6 & 2D Image \\ |
---|
1624 | 7 & Tile Format \\ |
---|
1625 | \end{tabular} |
---|
1626 | \\ |
---|
1627 | \Option{SEIFramePackingInterpretation} & |
---|
1628 | \ShortOption{\None} & |
---|
1629 | \Default{0} & |
---|
1630 | Indicates the constituent frames relationship in the Frame packing arrangement SEI message. |
---|
1631 | This option has no effect if SEIFramePacking is disabled. |
---|
1632 | \par |
---|
1633 | \begin{tabular}{cp{0.45\textwidth}} |
---|
1634 | 0 & Unspecified \\ |
---|
1635 | 1 & Frame 0 is associated with the left view of a stereo pair \\ |
---|
1636 | 2 & Frame 0 is associated with the right view of a stereo pair \\ |
---|
1637 | \end{tabular} |
---|
1638 | \\ |
---|
1639 | \Option{SEIFramePackingQuincunx} & |
---|
1640 | \ShortOption{\None} & |
---|
1641 | \Default{0} & |
---|
1642 | Enables or disables the quincunx_sampling signalling in the |
---|
1643 | Frame packing arrangement SEI messages. This option has no |
---|
1644 | effect if SEIFramePacking is disabled. |
---|
1645 | \\ |
---|
1646 | \Option{SEIFramePackingId} & |
---|
1647 | \ShortOption{\None} & |
---|
1648 | \Default{0} & |
---|
1649 | Indicates the session number in the Frame packing arrangement |
---|
1650 | SEI messages. This option has no effect if SEIFramePacking is |
---|
1651 | disabled. |
---|
1652 | \\ |
---|
1653 | \end{OptionTable} |
---|
1654 | |
---|
1655 | %% |
---|
1656 | %% |
---|
1657 | %% |
---|
1658 | \subsection{Hardcoded encoder parameters} |
---|
1659 | \begin{MacroTable}{CommonDef.h constants} |
---|
1660 | ADAPT_SR_SCALE & |
---|
1661 | 1 & |
---|
1662 | Defines a scaling factor used to derive the motion search range is |
---|
1663 | adaptive (see ASR configuration parameter). Default value is 1. |
---|
1664 | \\ |
---|
1665 | |
---|
1666 | MAX_GOP & |
---|
1667 | 64 & |
---|
1668 | maximum size of value of hierarchical GOP. |
---|
1669 | \\ |
---|
1670 | |
---|
1671 | MAX_NUM_REF & |
---|
1672 | 4 & |
---|
1673 | maximum number of multiple reference frames |
---|
1674 | \\ |
---|
1675 | |
---|
1676 | MAX_NUM_REF_LC & |
---|
1677 | 8 & |
---|
1678 | maximum number of combined reference frames |
---|
1679 | \\ |
---|
1680 | |
---|
1681 | AMVP_MAX_NUM_CANDS & |
---|
1682 | 2 & |
---|
1683 | maximum number of final candidates |
---|
1684 | \\ |
---|
1685 | |
---|
1686 | AMVP_MAX_NUM_CANDS_MEM & |
---|
1687 | 3 & |
---|
1688 | \\ |
---|
1689 | |
---|
1690 | MRG_MAX_NUM_CANDS & |
---|
1691 | 5 & |
---|
1692 | \\ |
---|
1693 | |
---|
1694 | DYN_REF_FREE & |
---|
1695 | off & |
---|
1696 | dynamic free of reference memories |
---|
1697 | \\ |
---|
1698 | |
---|
1699 | MAX_TLAYER & |
---|
1700 | 8 & |
---|
1701 | maximum number of temporal layers |
---|
1702 | \\ |
---|
1703 | |
---|
1704 | HB_LAMBDA_FOR_LDC & |
---|
1705 | on & |
---|
1706 | use of B-style lambda for non-key pictures in low-delay mode |
---|
1707 | \\ |
---|
1708 | |
---|
1709 | GPB_SIMPLE & |
---|
1710 | on & |
---|
1711 | Fast estimation of generalized B in low-delay mode |
---|
1712 | \\ |
---|
1713 | |
---|
1714 | GPB_SIMPLE_UNI & |
---|
1715 | on & |
---|
1716 | Fast estimation of generalized B in low-delay mode for uni-direction |
---|
1717 | \\ |
---|
1718 | |
---|
1719 | FASTME_SMOOTHER_MV & |
---|
1720 | on & |
---|
1721 | Fast ME using smoother MV assumption |
---|
1722 | \\ |
---|
1723 | |
---|
1724 | ADAPT_SR_SCALE & |
---|
1725 | on & |
---|
1726 | division factor for adaptive search range |
---|
1727 | \\ |
---|
1728 | |
---|
1729 | CLIP_TO_709_RANGE & |
---|
1730 | off & |
---|
1731 | \\ |
---|
1732 | |
---|
1733 | EARLY_SKIP_THRES & |
---|
1734 | 1.5 & |
---|
1735 | early skip if RD < EARLY_SKIP_THRES*avg[BestSkipRD] |
---|
1736 | \\ |
---|
1737 | |
---|
1738 | MAX_NUM_REF_PICS & |
---|
1739 | 16 & |
---|
1740 | \\ |
---|
1741 | |
---|
1742 | MAX_CHROMA_FORMAT_IDC & |
---|
1743 | 3 & |
---|
1744 | \\ |
---|
1745 | \end{MacroTable} |
---|
1746 | |
---|
1747 | \subsubsection*{TypeDef.h} |
---|
1748 | Numerous constants that guard individual adoptions are defined within |
---|
1749 | \url{source/Lib/TLibCommon/TypeDef.h}. |
---|
1750 | |
---|
1751 | %% |
---|
1752 | %% |
---|
1753 | %% |
---|
1754 | \clearpage |
---|
1755 | \section{Using the decoder} |
---|
1756 | \begin{verbatim} |
---|
1757 | TappDecoder -b str.bin -o dec.yuv [options] |
---|
1758 | \end{verbatim} |
---|
1759 | |
---|
1760 | \begin{OptionTable}{Decoder options} |
---|
1761 | \Option{} & |
---|
1762 | \ShortOption{-h} & |
---|
1763 | \Default{\None} & |
---|
1764 | Prints usage information. |
---|
1765 | \\ |
---|
1766 | |
---|
1767 | \Option{} & |
---|
1768 | \ShortOption{-o} & |
---|
1769 | \Default{\NotSet} & |
---|
1770 | Defines reconstructed YUV file name. |
---|
1771 | \\ |
---|
1772 | |
---|
1773 | \Option{} & |
---|
1774 | \ShortOption{-s} & |
---|
1775 | \Default{0} & |
---|
1776 | Defines the number of pictures in decoding order to skip. |
---|
1777 | \\ |
---|
1778 | |
---|
1779 | \Option{OutputBitDepth} & |
---|
1780 | \ShortOption{-d} & |
---|
1781 | \Default{0 \\ (Native)} & |
---|
1782 | Specifies the luma bit-depth of the reconstructed YUV file (the value 0 indicates |
---|
1783 | that the native bit-depth is used) |
---|
1784 | \\ |
---|
1785 | |
---|
1786 | \Option{OutputBitDepthC} & |
---|
1787 | \ShortOption{\None} & |
---|
1788 | \Default{0 \\ (Native)} & |
---|
1789 | Defines the chroma bit-depth of the reconstructed YUV file (the value 0 indicates |
---|
1790 | that the native bit-depth is used) |
---|
1791 | \\ |
---|
1792 | |
---|
1793 | \Option{SEIPictureDigest} & |
---|
1794 | \ShortOption{\None} & |
---|
1795 | \Default{1} & |
---|
1796 | Enable or disable verification of any Picture hash SEI messages. When |
---|
1797 | this parameter is set to 0, the feature is disabled and all messages are |
---|
1798 | ignored. When set to 1 (default), the feature is enabled and the decoder |
---|
1799 | has the following behaviour: |
---|
1800 | \begin{itemize} |
---|
1801 | \item |
---|
1802 | If Picture hash SEI messages are included in the bitstream, the same type |
---|
1803 | of hash is calculated for each decoded picture and written to the |
---|
1804 | log together with an indication whether the calculted value matches |
---|
1805 | the value in the SEI message. |
---|
1806 | Decoding will continue even if there is a mismatch. |
---|
1807 | |
---|
1808 | \item |
---|
1809 | After decoding is complete, if any MD5sum comparison failed, a warning |
---|
1810 | is printed and the decoder exits with the status EXIT_FAILURE |
---|
1811 | |
---|
1812 | \item |
---|
1813 | The per-picture MD5 log message has the following formats: |
---|
1814 | [MD5:d41d8cd98f00b204e9800998ecf8427e,(OK)], |
---|
1815 | [MD5:d41d8cd98f00b204e9800998ecf8427e,(unk)], |
---|
1816 | [MD5:d41d8cd98f00b204e9800998ecf8427e,(***ERROR***)] [rxMD5:b9e1...] |
---|
1817 | where, "(unk)" implies that no MD5 was signalled for this picture, |
---|
1818 | "(OK)" implies that the decoder agrees with the signalled MD5, |
---|
1819 | "(***ERROR***)" implies that the decoder disagrees with the signalled |
---|
1820 | MD5. "[rxMD5:...]" is the signalled MD5 if different. |
---|
1821 | \end{itemize} |
---|
1822 | \\ |
---|
1823 | |
---|
1824 | \Option{RespectDefDispWindow} & |
---|
1825 | \ShortOption{-w} & |
---|
1826 | \Default{0} & |
---|
1827 | Video region to be output by the decoder. |
---|
1828 | \par |
---|
1829 | \begin{tabular}{cp{0.45\textwidth}} |
---|
1830 | 0 & Output content inside the conformance window. \\ |
---|
1831 | 1 & Output content inside the default window. \\ |
---|
1832 | \end{tabular} |
---|
1833 | \\ |
---|
1834 | |
---|
1835 | \end{OptionTable} |
---|
1836 | |
---|
1837 | |
---|
1838 | \end{document} |
---|