Context navigation

← Previous revision
Latest revision
Next revision →
Blame
Revision log

software-manual.tex @ 530

Visit:

Last change on this file since 530 was 324, checked in by tech, 12 years ago
Initial development version for update to latest HM version. Includes MV-HEVC and basic extensions for 3D-HEVC.
File size: 54.3 KB

Line
1	\documentclass[a4paper,11pt]{jctvcdoc}
2
3	\usepackage{geometry}[2010/02/12]
4
5	\usepackage{hyperref}
6	\hypersetup{colorlinks=true}
7	\usepackage{color,soul}
8
9	\usepackage[position=bottom]{subfig}
10	\captionsetup[subfloat]{position=top}
11	\usepackage{multirow}
12	\usepackage{dcolumn}
13	\newcolumntype{.}{D{.}{.}{-1}}
14	\usepackage{colortbl}
15	\usepackage{makecell}
16	\usepackage{longtable}
17	\usepackage{array}
18	\usepackage{algorithm2e}
19
20	\usepackage[strings]{underscore}
21	\usepackage{csquotes}
22	\MakeOuterQuote{"}
23	\EnableQuotes
24
25	\newcommand\None{}
26	\newcommand\NotSet{}
27	\makeatletter
28	\newcommand{\Option}[1]{\ifx\optOption\@empty\gdef\optOption{#1}\else\g@addto@macro\optOption{ \\ #1}\fi}
29	\newcommand{\ShortOption}[1]{\ifx\optShortOption\@empty\gdef\optShortOption{#1}\else\g@addto@macro\optShortOption{ \\ #1}\fi}
30	\newcommand{\Default}[1]{\ifx\optDefault\@empty\gdef\optDefault{#1}\else\g@addto@macro\optDefault{ \\ #1}\fi}
31	\newcommand{\clearOptions}{\gdef\optOption{}\gdef\optShortOption{}\gdef\optDefault{}}
32	\makeatother
33	\newenvironment{OptionTable}[1]{%
34	\footnotesize
35	\def\arraystretch{1.8}
36	\clearOptions
37	\begin{longtable}{l<{\makecell[tl]{\optOption}}%
38	>{\texttt\bgroup}l<{\makecell[tl]{\optShortOption}\egroup}%
39	c<{\makecell[tc]{\optDefault}}%
40	>{\def\arraystretch{1.0}}p{0.5\textwidth}<{\clearOptions}}
41	\caption{#1} \\
42	\hspace{12em}&&\hspace{8em}&\kill
43	\hline
44	\thead{Option} &
45	\egroup\thead{Shorthand}\bgroup &
46	\thead{Default} &
47	\thead{Description} \\
48	\hline
49	\endfirsthead
50	\caption[]{#1 (Continued)} \\
51	\hspace{12em}&&\hspace{8em}&\kill
52	\hline
53	\thead{Option} &
54	\egroup\thead{Shorthand}\bgroup &
55	\thead{Default} &
56	\thead{Description} \\
57	\hline
58	\endhead
59	\multicolumn{4}{r}{Continued...}\\
60	\hline
61	\endfoot
62	\hline
63	\endlastfoot
64	}{%
65	\hline
66	\end{longtable}
67	}
68
69	\newenvironment{MacroTable}[1]{%
70	\footnotesize
71	\def\arraystretch{1.3}
72	\clearOptions
73	\begin{longtable}{lcp{0.5\textwidth}}
74	\caption{#1} \\
75	%\hspace{12em}&&\hspace{8em}&\kill
76	\hline
77	\thead{Option} &
78	\thead{Default} &
79	\thead{Description} \\
80	\hline
81	\endfirsthead
82	\caption[]{#1 (Continued)} \\
83	\hline
84	\thead{Option} &
85	\thead{Default} &
86	\thead{Description} \\
87	\hline
88	\endhead
89	\multicolumn{3}{r}{Continued...}\\
90	\hline
91	\endfoot
92	\hline
93	\endlastfoot
94	}{%
95	\end{longtable}
96	}
97
98	\title{HM Software Manual}
99	\author{%
100	Frank Bossen
101	\email{bossen@docomoinnovations.com}
102	\and
103	David Flynn
104	\email{davidf@rd.bbc.co.uk}
105	\and
106	Karsten S\"uhring
107	\email{Karsten.Suehring@hhi.fraunhofer.de}
108	}
109
110	\jctvcmeeting{}
111	\jctvcdocnum{Software Manual}
112	\jctvcdocstatus{Software AHG working document}
113	\jctvcdocpurpose{Information}
114	\jctvcdocsource{AHG chairs}
115
116	\begin{document}
117	\maketitle
118	\begin{abstract}
119	This document is a user manual describing usage of reference software
120	for the HEVC project. It applies to version 10.0
121	of the software.
122	\end{abstract}
123
124	\tableofcontents
125	\listoftables
126
127	\section{General Information}
128	Reference software is being made available to provide a reference
129	implementation of the draft HEVC standard being developed by the Joint
130	Collaborative Team on Video Coding (JCT-VC) regrouping experts from
131	ITU-T SG 16 and ISO/IEC SC29 WG11. One of the main goals of the
132	reference software is to provide a basis upon which to conduct
133	experiments in order to determine which coding tools provide desired
134	coding performance. It is not meant to be a particularly efficient
135	implementation of anything, and one may notice its apparent
136	unsuitability for a particular use. It should not be construed to be a
137	reflection of how complex a production-quality implementation of a
138	future HEVC standard would be.
139
140	This document aims to provide guidance on the usage of the reference
141	software. It is widely suspected to be incomplete and suggestions for
142	improvements are welcome. Such suggestions and general inquiries may be
143	sent to the general JCT-VC email reflector on
144	\url{jct-vc@lists.rwth-aachen.de} (registration required).
145
146	\subsection*{Bug reporting}
147	Bugs should be reported on the issue tracker set up at
148	\url{http://hevc.kw.bbc.co.uk/trac/}
149
150	\section{Installation and compilation}
151	The software may be retrieved from one of the following SVN servers
152	(mirrored):
153	\begin{itemize}
154	\item \url{https://hevc.hhi.fraunhofer.de/svn/svn_HEVCSoftware/}
155	\item \url{svn://hevc.kw.bbc.co.uk/svn/jctvc-hm/}
156	\end{itemize}
157
158	Table~\ref{tab:project-files} enumerates various project files that are
159	provided for development environments.
160
161	\begin{table}[ht]
162	\footnotesize
163	\caption{Available project files}
164	\label{tab:project-files}
165	\centering
166	\begin{tabular}{ll}
167	\hline
168	\thead{Environment} &
169	\thead{Location of project file} \\
170	% Environment & Location of project file \\
171	\hline
172	MS Visual Studio 8 & build/HM_vc8.sln \\
173	MS Visual Studio 9 & build/HM_vc9.sln \\
174	Xcode & HM.xcodeproj \\
175	Linux & build/linux/makefile \\
176	\hline
177	\end{tabular}
178	\end{table}
179
180	%%%%
181	%%%%
182	%%%%
183	\section{Using the encoder}
184	\begin{verbatim}
185	TAppEncoder [-h] [-c config.cfg] [--parameter=value]
186	\end{verbatim}
187
188	\begin{table}[ht]
189	\footnotesize
190	\centering
191	\begin{tabular}{lp{0.5\textwidth}}
192	\hline
193	\thead{Option} &
194	\thead{Description} \\
195	\hline
196	\texttt{-h} & Prints parameter usage. \\
197	\texttt{-c} & Defines configuration file to use. Multiple configuration files
198	may be used with repeated \texttt{-c} options. \\
199	\texttt{--}\emph{parameter}\texttt{=}\emph{value}
200	& Assigns value to a given parameter as further described below.
201	Some parameters are also supported by shorthand
202	"\texttt{-}\emph{opt}~\emph{value}".\\
203	\hline
204	\end{tabular}
205	\end{table}
206
207	Sample configuration files are provided in the cfg/ folder.
208
209	\subsection{GOP structure table}
210	\label{sec:gop-structure}
211	Defines the cyclic GOP structure that will be used repeatedly
212	throughout the sequence. The table should contain GOPSize lines,
213	named Frame1, Frame2, etc. The frames are listed in decoding
214	order, so Frame1 is the first frame in decoding order, Frame2 is
215	the second and so on. Among other things, the table specifies all
216	reference pictures kept by the decoder for each frame. This
217	includes pictures that are used for reference for the current
218	picture as well as pictures that will be used for reference in
219	the future. The encoder will not automatically calculate which
220	pictures have to be kept for future reference; they have to
221	be specified. Note that some specified reference frames for
222	pictures encoded in the very first GOP after an IDR frame might
223	not be available. This is handled automatically by the encoder,
224	so the reference pictures can be given in the GOP structure table
225	as if there were infinitely many identical GOPs before the
226	current one. Each line in the table contains the parameters used
227	for the corresponding frame, separated by whitespace:
228
229	\begin{itemize}
230	\item[]\textbf{Type}: Slice type, can be either I, P or B.
231
232	\item[]\textbf{POC}: Display order of the frame within a GOP, ranging
233	from 1 to GOPSize.
234
235	\item[]\textbf{QPOffset}: QP offset is added to the QP parameter to set
236	the final QP value to use for this frame.
237
238	\item[]\textbf{QPFactor}: Weight used during rate distortion
239	optimization. Higher values mean lower quality and fewer bits. Typical
240	range is between
241	0.3 and 1.
242
243	\item[]\textbf{tcOffsetDiv2}: In-loop deblocking filter parameter tcOffsetDiv2
244	is added to the base parameter LoopFilterTcOffset_div2 to set the final tc_offset_div2
245	parameter for this picture signalled in the slice segment header. The final
246	value of tc_offset_div2 shall be an integer number in the range $-6..6$.
247
248	\item[]\textbf{betaOffsetDiv2}: In-loop deblocking filter parameter betaOffsetDiv2
249	is added to the base parameter LoopFilterBetaOffset_div2 to set the final beta_offset_div2
250	parameter for this picture signalled in the slice segment header. The final
251	value of beta_offset_div2 shall be an integer number in the range $-6..6$.
252
253	\item[]\textbf{temporal_id}: Temporal layer of the frame. A frame cannot
254	predict from a frame with a higher temporal id. If a frame with a higher
255	temporal id is listed among a frame's reference pictures, it is
256	not used, but is kept for possible use in future frames.
257
258	\item[]\textbf{num_ref_pics_active}: Size of reference picture lists L0
259	and L1, indicating how many reference pictures in each direction
260	are used during coding.
261
262	\item[]\textbf{num_ref_pics}: The number of reference pictures kept for
263	this frame. This includes pictures that are used for reference for the
264	current picture as well as pictures that will be used for reference in
265	the future.
266
267	\item[]\textbf{reference_pictures}: A space-separated list of
268	num_ref_pics integers, specifying the POC of the reference pictures
269	kept, relative to the POC of the current frame. The picture list shall be
270	ordered, first with negative numbers from largest to smallest, followed
271	by positive numbers from smallest to largest (e.g. \verb|-1 -3 -5 1 3|).
272	Note that any pictures not supplied in this list will be discarded and
273	therefore not available as reference pictures later.
274
275	\item[]\textbf{predict}: Defines the value of the syntax element
276	inter_ref_pic_set_prediction_flag. A value of 0 indicates that the
277	reference picture set is encoded without inter RPS prediction and the
278	subsequent parameters deltaRIdx$-1$, deltaRPS, num_ref_idcs and
279	reference_idcs are ignored and do not need to be present. A value of 1
280	indicates that the reference picture set is encoded with inter
281	RPS prediction using the subsequent parameters deltaRIdx$-1$, deltaRPS,
282	num_ref_idcs and reference_idcs in the line. A value of 2 indicates that
283	the reference picture set is encoded with inter RPS prediction but only the
284	deltaRIdx$-1$ parameter is needed. The deltaRPS, num_ref_idcs and
285	reference_idcs values are automatically derived by the encoder based on
286	the POC and refPic values of the current line and the RPS pointed to by
287	the deltaRIdx$-1$ parameter.
288
289	\item[]\textbf{deltaRIdx$-1$}: The difference between the index of the
290	current RPS and the predictor RPS minus 1.
291
292	\item[]\textbf{deltaRPS}: The difference between the POC of the
293	predictor RPS and the POC of the current RPS.
294
295	\item[]\textbf{num_ref_idcs}: The number of ref_idcs to encode for the
296	current RPS. The value is equal to the value of num_ref_pics of the
297	predictor RPS plus 1.
298
299	\item[]\textbf{reference_idcs}: A space-separated list of num_ref_idcs
300	integers, specifying the ref idcs of the inter RPS prediction. The value
301	of ref_idcs may be 0, 1 or 2 indicating that the reference picture is a
302	reference picture used by the current picture, a reference picture used
303	for a future picture or not a reference picture anymore, respectively. The
304	first num_ref_pics of ref_idcs correspond to the reference pictures in
305	the predictor RPS. The last ref_idcs corresponds to the predictor
306	picture.
307	\end{itemize}
308
309	For example, consider the coding structure of Figure~\ref{fig:gop-example}.
310	This coding structure is of size 4. The pictures are listed in decoding
311	order. Frame1 shall therefore describe the picture with $\textrm{POC}=4$. It
312	references picture 0, and therefore has $-4$ as a reference picture.
313	Similarly, Frame2 has a POC of 2, and since it references pictures 0 and
314	4, its reference pictures are listed as \verb|-2 2|. Frame3 is a special
315	case: even though it only references pictures with POC 0 and 2, it also
316	needs to include the picture with POC 4, which must be kept in order to
317	be used as a reference picture in the future. The reference picture list
318	for Frame3 therefore becomes \verb|-1 1 3|. Frame4 has a POC of 3 and
319	its list of reference pictures is \verb|-1 1|.
320
321	\begin{figure}[h]
322	\caption{A GOP structure}
323	\label{fig:gop-example}
324	\centering
325	\includegraphics[width=0.7\textwidth]{gop-structure-example}
326	\end{figure}
327
328	Inter RPS prediction may be used for Frame2, Frame3 and Frame4, hence
329	the predict parameter is set to 1 for these frames. Frame2 uses Frame1
330	as the predictor hence the deltaRIdx$-1$ is 0. Similarly for Frame3 and
331	Frame4 which use Frame2 and Frame3 as predictors, respectively. The
332	deltaRPS is equal to the POC of the predictor minus the POC of the
333	current picture, therefore the deltaRPS for Frame2 is $4 -2 = 2$, for
334	Frame3 is $2 - 1 = 1$ and for Frame4 is $1 - 3 = -2$.
335
336	In Frame2, reference pictures with POC 0 and 4 are used, so the
337	reference idcs for Frame2 are \verb|1 1| indicating that the reference
338	picture, $-4$, in Frame1 is still a reference picture in Frame2 and
339	Frame1 is also a reference picture in Frame2. The reference idcs for
340	Frame3 are \verb|1 1 1|. The first and second "1"s indicate that
341	the reference pictures "$-2$ $2$" in Frame2 are still reference pictures in
342	Frame3 and the last "1" indicates that Frame2 is also a reference
343	picture in Frame3. In Frame4, the reference idcs are \verb|0 1 1 0|.
344	The first "0" indicates that the reference picture "$-1$" in Frame3 is
345	no longer a reference picture in Frame4. The next two "1"s indicate that
346	the reference pictures "$1$ $3$" in Frame3 are now reference pictures of Frame4.
347	The final "0" indicates that Frame3 is not a reference picture.
348
349	In order to specify this to the encoder, the parameters in
350	Table~\ref{tab:gop-example} could be used.
351
352	\begin{table}[ht]
353	\footnotesize
354	\caption{GOP structure example}
355	\label{tab:gop-example}
356	\centering
357	\begin{tabular}{lrrrr}
358	\hline
359	\thead{} &
360	\thead{Frame1} &
361	\thead{Frame2} &
362	\thead{Frame3} &
363	\thead{Frame4} \\
364	\hline
365	Type & P & B & B & B \\
366	POC & 4 & 2 & 1 & 3 \\
367	QPoffset & 1 & 2 & 3 & 3 \\
368	QPfactor & 0.5 & 0.5 & 0.5 & 0.5 \\
369	tcOffsetDiv2 & 0 & 1 & 2 & 2 \\
370	betaOffsetDiv2 & 0 & 0 & 0 & 0 \\
371	temporal_id & 0 & 1 & 2 & 2 \\
372	num_ref_pics_active & 1 & 1 & 1 & 1 \\
373	num_ref_pics & 1 & 2 & 3 & 2 \\
374	reference_pictures & $-$4 & $-$2 2 & $-$1 1 3 & $-$1 1 \\
375	predict & 0 & 1 & 1 & 1 \\
376	deltaRIdx$-$1 & & 0 & 0 & 0 \\
377	deltaRPS & & 2 & 1 & $-$2 \\
378	num_ref_idcs & & 2 & 3 & 4 \\
379	reference_idcs & & 1 1 & 1 1 1 & 0 1 1 0 \\
380	\hline
381	\end{tabular}
382	\end{table}
383
384	Here, the frames used for prediction have been given higher
385	quality by assigning a lower QP offset. Also, the non-reference
386	frames have been marked as belonging to a higher temporal layer,
387	to make it possible to decode only every other frame. Note: each
388	line should contain information for one frame, so this
389	configuration would be specified as:
390
391	\begin{verbatim}
392	Frame1: P 4 1 0.5 0 0 0 1 1 -4 0
393	Frame2: B 2 2 0.5 1 0 1 1 2 -2 2 1 0 2 2 1 1
394	Frame3: B 1 3 0.5 2 0 2 1 3 -1 1 3 1 0 1 3 1 1 1
395	Frame4: B 3 3 0.5 2 0 2 1 2 -1 1 1 0 -2 4 0 1 1 0
396	\end{verbatim}
397
398	The values of deltaRIdx$-1$, deltaRPS, num_ref_idcs and reference_idcs
399	of Frame$_K$ can be derived from the POC value of Frame$_K$ and
400	the POC, num_ref_pics and reference_pictures values of Frame$_M$, where
401	$K$ is the index of the RPS to be inter coded and the $M$ is the
402	index of the reference RPS, as follows.
403
404	\setlength{\algomargin}{2em}
405	\begin{algorithm}[h]
406	\SetKwData{deltaRIdx}{deltaRIdx}
407	\SetKwData{deltaRPS}{deltaRPS}
408	\SetKwData{numrefidcs}{num_ref_idcs}
409	\SetKwData{numrefpics}{num_ref_pics}
410	\SetKwData{referencepictures}{reference_pictures}
411	\SetKwData{referenceidcs}{reference_idcs}
412	\SetKwData{POC}{POC}
413
414	$\deltaRIdx_K - 1 \leftarrow K - M - 1$ \;
415	$\deltaRPS_K \leftarrow \POC_M - \POC_K$ \;
416	$\numrefidcs_K \leftarrow \numrefpics_M + 1$ \;
417
418	\For{$j \leftarrow 0$ \KwTo $\numrefpics_M$}{
419	\For{$i \leftarrow 0$ \KwTo $\numrefidcs_K$}{
420	\eIf{$\referencepictures_{M,j} + \deltaRPS_K == \referencepictures_{K,i}$}{
421	\lIf{$\referencepictures_{K,i}$ is used by the current frame}{
422	$\referenceidcs_{K,j} = 1$} \;
423	\lElse{$\referenceidcs_{K,j} = 2$} \;
424	}{
425	$\referenceidcs_{K,j} = 0$ \;
426	}
427	}
428	}
429
430	\tcc{$\referencepictures_{M,\numrefpics_M}$ does not exist and is assumed to be 0}
431	\end{algorithm}
432
433	Note: The above (automatic) generation of the inter RPS parameter
434	values has been integrated into the encoder, and is activated by
435	the value of predict $= 2$ followed by the value of deltaRIdx$-1$,
436	only, as described above.
437
438
439
440	%%%%
441	%%%%
442	%%%%
443	\newgeometry{tmargin=1.6cm,lmargin=1cm,rmargin=1cm,bmargin=1in,nohead}
444	\subsection{Encoder parameters}
445
446	%%
447	%% File, I/O and source parameters
448	%%
449	\begin{OptionTable}{File, I/O and source parameters}
450	\Option{InputFile} &
451	\ShortOption{-i} &
452	\Default{\NotSet} &
453	Specifies the input video file.
454
455	Video data must be in a raw 4:2:0 planar format (Y$'$CbCr).
456
457	Note: When the bit depth of samples is larger than 8, each sample is encoded in
458	2 bytes (little endian, LSB-justified).
459	\\
460
461	\Option{BitstreamFile} &
462	\ShortOption{-b} &
463	\Default{\NotSet} &
464	Specifies the output coded bit stream file.
465	\\
466
467	\Option{ReconFile} &
468	\ShortOption{-o} &
469	\Default{\NotSet} &
470	Specifies the output locally reconstructed video file.
471	\\
472
473	\Option{SourceWidth}%
474	\Option{SourceHeight} &
475	\ShortOption{-wdt}%
476	\ShortOption{-hgt} &
477	\Default{0}%
478	\Default{0} &
479	Specifies the width and height of the input video in luma samples.
480	\\
481
482	\Option{InputBitDepth} &
483	\ShortOption{\None} &
484	\Default{8} &
485	Specifies the bit depth of the input video.
486	\\
487
488	\Option{InternalBitDepth} &
489	\ShortOption{\None} &
490	\Default{0 \\ (InputBitDepth)} &
491	Specifies the bit depth used for coding.
492
493	If the input video is a different bit depth to InternalBitDepth, it is
494	automatically converted by:
495	\begin{displaymath}
496	\left\lfloor
497	\frac{\mathrm{Pel} * 2^{\mathrm{InternalBitDepth}}}{
498	2^{\mathrm{InputBitDepth}}}
499	\right\rfloor
500	\end{displaymath}
501
502	Note: The effect of this option is as if the input video is externally
503	converted to the InternalBitDepth and then coded with this value as
504	InputBitDepth. The codec has no notion of two different bit depths.
505	\\
506
507	\Option{OutputBitDepth} &
508	\ShortOption{\None} &
509	\Default{0 \\ (InternalBitDepth)} &
510	Specifies the bit depth of the output locally reconstructed video file.
511
512	Note: This option has no effect on the decoding process.
513	\\
514
515	\Option{InputBitDepthC}%
516	\Option{InternalBitDepthC}%
517	\Option{OutputBitDepthC} &
518	\ShortOption{\None} &
519	\Default{(InputBitDepth)}%
520	\Default{(InternalBitDepth)}%
521	\Default{(InternalBitDepthC)} &
522	Specifies the various bit-depths for chroma components. These only need
523	to be specified if non-equal luma and chroma bit-depth processing is
524	required.
525	\\
526
527	\Option{ConformanceMode} &
528	\ShortOption{\None} &
529	\Default{0} &
530	Specifies the conformance mode (cropping/padding parameters) to be applied to the input
531	video. The following modes are available:
532	\par
533	\begin{tabular}{cp{0.45\textwidth}}
534	0 & No cropping / padding \\
535	1 & Automatic padding to the next minimum CU size \\
536	2 & Padding according to parameters HorizontalPadding and VerticalPadding \\
537	3 & Cropping according to parameters ConfLeft, ConfRight, ConfTop and ConfBottom \\
538	\end{tabular}
539	\\
540
541	\Option{HorizontalPadding}%
542	\Option{VerticalPadding} &
543	\ShortOption{-pdx}%
544	\ShortOption{-pdy} &
545	\Default{0} &
546	Specifies the horizontal and vertical padding to be applied to the input
547	video in luma samples. Must be a multiple of the chroma resolution
548	(e.g. a multiple of two for 4:2:0).
549	\\
550
551	\Option{ConfLeft}%
552	\Option{ConfRight}%
553	\Option{ConfTop}%
554	\Option{ConfBottom} &
555	\ShortOption{\None} &
556	\Default{0} &
557	Specifies the horizontal and vertical cropping to be applied to the
558	input video in luma samples. Must be a multiple of the chroma
559	resolution (e.g. a multiple of two for 4:2:0).
560	\\
561
562	\Option{FrameRate} &
563	\ShortOption{-fr} &
564	\Default{0} &
565	Specifies the frame rate of the input video.
566
567	Note: This option only affects the reported bit rates.
568	\\
569
570	\Option{FrameSkip} &
571	\ShortOption{-fs} &
572	\Default{0} &
573	Specifies a number of frames to skip at the beginning of the input video file.
574	\\
575
576	\Option{FramesToBeEncoded} &
577	\ShortOption{-f} &
578	\Default{0 \\ (all)} &
579	Specifies the number of frames to be encoded.
580	\\
581	\end{OptionTable}
582
583	%%
584	%% profile, level and conformance options
585	%%
586	\begin{OptionTable}{Profile and level parameters}
587	\Option{Profile} &
588	\ShortOption{\None} &
589	\Default{none} &
590	Specifies the profile to which the encoded bitstream complies.
591	Valid values are: none, main, main10, main-still-picture.
592
593	Compatibility flags are automatically determined according to the profile.
594	If --Profile=main, then main10 will always be signalled as compatible.
595	If --Profile=main10, then main will be signalled as compatible if the bit-depth is 8-bit.
596
597	NB: There is currently no validation that the encoder configuration complies with the profile and level constraints.
598	\\
599
600	\Option{Level} &
601	\ShortOption{\None} &
602	\Default{none} &
603	Specifies the level to which the encoded bitstream complies.
604	Valid values are: none, 1, 2, 2.1, 3, 3.1, 4, 4.1, 5, 5.1, 5.2, 6, 6.1, 6.2.
605
606	NB: There is currently no validation that the encoder configuration complies with the profile and level constraints.
607	\\
608
609	\Option{Tier} &
610	\ShortOption{\None} &
611	\Default{main} &
612	Specifies the level tier to which the encoded bitstream complies.
613	Valid values are: main, high.
614
615	NB: There is currently no validation that the encoder configuration complies with the profile and level constraints.
616	\\
617
618	\Option{ProgressiveSource} &
619	\ShortOption{\None} &
620	\Default{false} &
621	Specifies the value of general_progressive_source_flag
622	\\
623
624	\Option{InterlacedSource} &
625	\ShortOption{\None} &
626	\Default{false} &
627	Specifies the value of general_interlaced_source_flag
628	\\
629
630	\Option{NonPackedSource} &
631	\ShortOption{\None} &
632	\Default{false} &
633	Specifies the value of general_non_packed_constraint_flag
634	\\
635
636	\Option{FrameOnly} &
637	\ShortOption{\None} &
638	\Default{false} &
639	Specifies the value of general_frame_only_constraint_flag
640	\\
641
642	\end{OptionTable}
643
644
645	%%
646	%% Unit definition parameters
647	%%
648	\begin{OptionTable}{Unit definition parameters}
649	\Option{MaxCUWidth} &
650	\ShortOption{\None} &
651	\Default{64} &
652	Defines the maximum CU width.
653	\\
654
655	\Option{MaxCUHeight} &
656	\ShortOption{\None} &
657	\Default{64} &
658	Defines the maximum CU height.
659	\\
660
661	\Option{MaxCUSize} &
662	\ShortOption{\None} &
663	\Default{64} &
664	Defines the maximum CU size.
665	\\
666
667	\Option{MaxPartitionDepth} &
668	\ShortOption{-h} &
669	\Default{4} &
670	Defines the depth of the CU tree.
671	\\
672
673	\Option{QuadtreeTULog2MaxSize} &
674	\ShortOption{\None} &
675	\Default{6 \\ ($= \mathrm{log}_2(64)$)} &
676	Defines the Maximum TU size in logarithm base 2.
677	\\
678
679	\Option{QuadtreeTULog2MinSize} &
680	\ShortOption{\None} &
681	\Default{2 \\ ($= \mathrm{log}_2(4)$)} &
682	Defines the Minimum TU size in logarithm base 2.
683	\\
684
685	\Option{QuadtreeTUMaxDepthIntra} &
686	\ShortOption{\None} &
687	\Default{1} &
688	Defines the depth of the TU tree for intra CUs.
689	\\
690
691	\Option{QuadtreeTUMaxDepthInter} &
692	\ShortOption{\None} &
693	\Default{2} &
694	Defines the depth of the TU tree for inter CUs.
695	\\
696	\end{OptionTable}
697
698
699	%%
700	%% Coding structure parameters
701	%%
702	\begin{OptionTable}{Coding structure parameters}
703	\Option{IntraPeriod} &
704	\ShortOption{-ip} &
705	\Default{$-1$} &
706	Specifies the intra frame period.
707	A value of $-1$ implies an infinite period.
708	\\
709
710	\Option{DecodingRefreshType} &
711	\ShortOption{-dr} &
712	\Default{0} &
713	Specifies the type of decoding refresh to apply at the intra frame period
714	picture.
715	\par
716	\begin{tabular}{cp{0.45\textwidth}}
717	0 & Applies an I picture (not a clean random access point). \\
718	1 & Applies a non-IDR clean random access point (open GOP). \\
719	2 & Applies an IDR random access point (closed GOP). \\
720	\end{tabular}
721	\\
722
723	\Option{GOPSize} &
724	\ShortOption{-g} &
725	\Default{1} &
726	Specifies the size of the cyclic GOP structure.
727	\\
728
729	\Option{Frame\emph{N}} &
730	\ShortOption{\None} &
731	\Default{\NotSet} &
732	Multiple options that define the cyclic GOP structure that will be used
733	repeatedly throughout the sequence. The table should contain GOPSize
734	elements.
735	\par
736	See section~\ref{sec:gop-structure} for further details.
737	\\
738
739	\Option{ListCombination} &
740	\ShortOption{-lc} &
741	\Default{true} &
742	Enables or disables the use of the combined reference list for uni-prediction
743	in B-slices.
744	\par
745	\begin{tabular}{cp{0.45\textwidth}}
746	0 & Reference list~0 and reference list~1 are identical and reference
747	list~0 is used as the combined reference list. \\
748	1 & The combined reference list is derived from reference list~0 and
749	reference list~1. \\
750	\end{tabular}
751	NB: LComb can only be 0 in low delay coding (more precisely, when list 0
752	and list 1 are the same)
753	\\
754	\end{OptionTable}
755
756
757	%%
758	%% Motion estimation parameters
759	%%
760	\begin{OptionTable}{Motion estimation parameters}
761	\Option{FastSearch} &
762	\ShortOption{\None} &
763	\Default{true} &
764	Enables or disables the use of a fast motion search.
765	\par
766	\begin{tabular}{cp{0.45\textwidth}}
767	0 & Full search method \\
768	1 & Fast search method \\
769	\end{tabular}
770	\\
771
772	\Option{SearchRange} &
773	\ShortOption{-sr} &
774	\Default{96} &
775	Specifies the search range used for motion estimation.
776
777	Note: the search range is defined around a predictor. Motion vectors
778	derived by the motion estimation may thus have values larger than the
779	search range.
780	\\
781
782	\Option{BipredSearchRange} &
783	\ShortOption{\None} &
784	\Default{4} &
785	Specifies the search range used for bi-prediction refinement in motion
786	estimation.
787	\\
788
789	\Option{HadamardME} &
790	\ShortOption{\None} &
791	\Default{true} &
792	Enables or disables the use of the Hadamard transform in fractional-pel motion
793	estimation.
794	\par
795	\begin{tabular}{cp{0.45\textwidth}}
796	0 & SAD for cost estimation \\
797	1 & Hadamard for cost estimation \\
798	\end{tabular}
799	\\
800
801	\Option{ASR} &
802	\ShortOption{\None} &
803	\Default{false} &
804	Enables or disables the use of adaptive search ranges, where the motion
805	search range is dynamically adjusted according to the POC difference
806	between the current and the reference pictures.
807	\begin{displaymath}
808	\resizebox{\hsize}{!}{$
809	\mathrm{SearchRange}' = \mathrm{Round}\left(
810	\mathrm{SearchRange}
811	* \mathrm{ADAPT\_SR\_SCALE}
812	* \frac{\mathrm{abs}(
813	\mathrm{POCcur} - \mathrm{POCref} )}{
814	\mathrm{RateGOPSize}}\right)
815	$}
816	\end{displaymath}
817	\\
818	\end{OptionTable}
819
820
821	%%
822	%% Mode decision parameters
823	%%
824	\begin{OptionTable}{Mode decision parameters}
825	\Option{LambdaModifier$N$} &
826	\ShortOption{-LM$N$} &
827	\Default{1.0} &
828	Specifies a value that is multiplied with the Lagrange multiplier
829	$\lambda$, for use in the rate-distortion optimised cost calculation
830	when encoding temporal layer~$N$.
831	\par
832	$N$ may be in the range 0--7.
833	\\
834
835	\Option{FEN} &
836	\ShortOption{\None} &
837	\Default{false} &
838	Enables or disables the use of fast encoder mode. When enabled,
839	the following occurs:
840	\begin{itemize}
841	\item In the SAD computation for blocks having size larger than 8, only
842	the lines of even rows in the block are considered.
843	\item The number of iterations used in the bi-directional motion vector
844	refinement in the motion estimation process is reduced from 4 to 1.
845	\end{itemize}
846	\\
847
848	\Option{FDM} &
849	\ShortOption{\None} &
850	\Default{true} &
851	Enables or disables the use of fast encoder decisions for 2Nx2N merge
852	mode. When enabled, the RD cost for the merge mode of the current
853	candidate is not evaluated if the merge skip mode was the best merge
854	mode for one of the previous candidates.
855	\\
856
857	\Option{RDpenalty} &
858	\ShortOption{\None} &
859	\Default{0} &
860	RD-penalty for 32x32 TU for intra in non-intra slices.
861	Enabling this parameter can reduce the visibility of CU boundaries in the coded picture.
862	\par
863	\begin{tabular}{cp{0.45\textwidth}}
864	0 & No RD-penalty \\
865	1 & RD-penalty \\
866	2 & Maximum RD-penalty (no 32x32 TU)\\
867	\end{tabular}
868	\\
869
870	\end{OptionTable}
871
872	%%
873	%% Quantization parameters
874	%%
875	\begin{OptionTable}{Quantization parameters}
876	\Option{QP} &
877	\ShortOption{-q} &
878	\Default{30.0} &
879	Specifies the base value of the quantization parameter.
880	\\
881
882	\Option{CbQpOffset}%
883	\Option{CrQpOffset} &
884	\ShortOption{-cbqpofs}%
885	\ShortOption{-crqpofs} &
886	\Default{0}%
887	\Default{0} &
888	Global offset to apply to the luma QP to derive the QP of Cb and Cr
889	respectively. These options correspond to the values of cb_qp_offset
890	and cr_qp_offset, that are transmitted in the PPS. Valid values are in
891	the range $[-12, 12]$.
892	\\
893
894	\Option{MaxCuDQPDepth} &
895	\ShortOption{\None} &
896	\Default{0} &
897	Defines maximum depth of a minimum CuDQP for sub-LCU-level delta QP.
898	MaxCuDQPDepth shall be greater than or equal to SliceGranularity.
899	\\
900
901	\Option{RDOQ} &
902	\ShortOption{\None} &
903	\Default{true} &
904	Enables or disables rate-distortion-optimized quantization.
905	\\
906
907	\Option{RDOQTS} &
908	\ShortOption{\None} &
909	\Default{true} &
910	Enables or disables rate-distortion-optimized quantization for transform-skipped TUs.
911	\\
912
913	\Option{DeltaQpRD} &
914	\ShortOption{-dqr} &
915	\Default{0} &
916	Specifies the maximum QP offset at slice level for multi-pass slice
917	encoding. When encoding, each slice is tested multiple times by using
918	slice QP values in the range $[-\mathrm{DeltaQpRD}, \mathrm{DeltaQpRD}]$,
919	and the best QP value is chosen as the slice QP.
920	\\
921
922	\Option{MaxDeltaQP} &
923	\ShortOption{-d} &
924	\Default{0} &
925	Specifies the maximum QP offset at the largest coding unit level for
926	the block-level adaptive QP assignment scheme. In the encoder, each
927	largest coding unit is tested multiple times by using the QP values in
928	the range $[-\mathrm{MaxDeltaQP}, \mathrm{MaxDeltaQP}]$, and the best QP
929	value is chosen as the QP value of the largest coding unit.
930	\\
931
932	\Option{dQPFile} &
933	\ShortOption{-m} &
934	\Default{\NotSet} &
935	Specifies a file containing a list of QP deltas. The $n$-th line
936	(where $n$ is 0 for the first line) of this file corresponds to the QP
937	value delta for the picture with POC value $n$.
938	\\
939
940	\Option{AdaptiveQpSelection} &
941	\ShortOption{-aqps} &
942	\Default{false} &
943	Specifies whether QP values for non-I frames will be calculated on the
944	fly based on statistics of previously coded frames.
945	\\
946	\Option{RecalculateQPAccordingToLambda} &
947	\ShortOption{\None} &
948	\Default{false} &
949	Recalculates QP values according to lambda values. Enabling this option is not recommended in the all-intra case.
950	\\
951	\end{OptionTable}
952
953
954
955	%%
956	%% Entropy coding parameters
957	%%
958	\begin{OptionTable}{Entropy coding parameters}
959	\Option{SBACRD} &
960	\ShortOption{\None} &
961	\Default{true} &
962	Enables or disables the use of bit counts from arithmetic coder in
963	rate-distortion decisions.
964	\\
965	\end{OptionTable}
966
967
968	%%
969	%% Slice coding parameters
970	%%
971	\begin{OptionTable}{Slice coding parameters}
972	%\Option{SliceGranularity} &
973	%\ShortOption{\None} &
974	%\Default{0} &
975	%Determines the depth in an LCU at which slices may begin and end.
976	%\par
977	%\begin{tabular}{cp{0.45\textwidth}}
978	% 0 & Slice addresses are LCU aligned \\
979	% $1 \leq n \leq 3$
980	% & Slice start addresses are aligned to CUs at depth $n$ \\
981	%\end{tabular}
982	%
983	%Note: The smallest permissible alignment is 16x16 CUs.
984	%Values of $n$ must satisfy this constraint, for example, with a 64x64
985	%LCU, $n$ must be less than or equal to 2.
986	%\\
987
988	\Option{SliceMode} &
989	\ShortOption{\None} &
990	\Default{0} &
991	Controls the slice partitioning method in conjunction with
992	SliceArgument.
993	\par
994	\begin{tabular}{cp{0.45\textwidth}}
995	0 & Single slice \\
996	1 & Maximum number of CTUs per slice \\
997	2 & Maximum number of bytes per slice \\
998	3 & Maximum number of tiles per slice \\
999	\end{tabular}
1000	\\
1001
1002	\Option{SliceArgument} &
1003	\ShortOption{\None} &
1004	\Default{\NotSet} &
1005	Specifies the maximum number of CTUs, bytes or tiles in a slice depending on the
1006	SliceMode setting.
1007	\\
1008
1009	\Option{SliceSegmentMode} &
1010	\ShortOption{\None} &
1011	\Default{0} &
1012	Enables (dependent) slice segment coding in conjunction with
1013	SliceSegmentArgument.
1014	\par
1015	\begin{tabular}{cp{0.45\textwidth}}
1016	0 & Single slice \\
1017	1 & Maximum number of CTUs per slice segment\\
1018	2 & Maximum number of bytes per slice segment\\
1019	3 & Maximum number of tiles per slice segment\\
1020	\end{tabular}
1021	\\
1022
1023	\Option{SliceSegmentArgument} &
1024	\ShortOption{\None} &
1025	\Default{\NotSet} &
1026	Defines the maximum number of CTUs, bytes or tiles in a slice segment
1027	depending on the SliceSegmentMode setting.
1028	\\
1029
1030	\Option{WaveFrontSynchro} &
1031	\ShortOption{\None} &
1032	\Default{false} &
1033	Enables the use of specific CABAC probabilities synchronization at the
1034	beginning of each line of CTBs in order to produce a bitstream that can
1035	be encoded or decoded using one or more cores.
1036	\\
1037
1038	\Option{NumTileColumnsMinus1}%
1039	\Option{NumTileRowsMinus1} &
1040	\ShortOption{\None} &
1041	\Default{0} &
1042	Specifies the tile based picture partitioning geometry as
1043	$(\mathrm{NumTileColumnsMinus1} + 1) \times (\mathrm{NumTileRowsMinus1} + 1)$
1044	columns and rows.
1045	\\
1046
1047	\Option{UniformSpacingIdc} &
1048	\ShortOption{\None} &
1049	\Default{0} &
1050	Controls the mode used to determine per row and column tile sizes.
1051	\par
1052	\begin{tabular}{cp{0.45\textwidth}}
1053	0 & Each tile column width and tile row height is explicitly set
1054	by ColumnWidthArray and RowHeightArray respectively \\
1055	1 & Tile columns and tile rows are uniformly spaced. \\
1056	\end{tabular}
1057	\\
1058
1059	\Option{ColumnWidthArray}%
1060	\Option{RowHeightArray} &
1061	\ShortOption{\None} &
1062	\Default{\NotSet} &
1063	Specifies a space or comma separated list of widths and heights,
1064	respectively, of each tile column or tile row. The first value in the
1065	list corresponds to the leftmost tile column or topmost tile row.
1066	\\
1067	\end{OptionTable}
1068
1069
1070
1071	%%
1072	%% Deblocking filter parameters
1073	%%
1074	\begin{OptionTable}{Deblocking filter parameters}
1075	\Option{LoopFilterDisable} &
1076	\ShortOption{\None} &
1077	\Default{false} &
1078	Enables or disables the in-loop deblocking filter.
1079	\\
1080
1081	\Option{LFCrossSliceBoundaryFlag} &
1082	\ShortOption{\None} &
1083	\Default{true} &
1084	Enables or disables the use of in-loop filtering across slice
1085	boundaries.
1086	\\
1087
1088	\Option{DeblockingFilterControlPresent}&
1089	\ShortOption{\None}&
1090	\Default{false}&
1091	Enables or disables the presence of the deblocking filter control
1092	parameters in the picture parameter set and in the slice segment header.
1093	When disabled, the default deblocking filter parameters are used.
1094	\\
1095
1096	\Option{LoopFilterOffsetInPPS}&
1097	\ShortOption{\None}&
1098	\Default{false}&
1099	If enabled, the in-loop deblocking filter control parameters are sent in PPS.
1100	Otherwise, the in-loop deblocking filter control parameters are sent in the slice segment header.
1101	If deblocking filter parameters are sent in PPS, the same values of deblocking filter parameters
1102	are used for all pictures in the sequence (i.e. deblocking parameter = base parameter value).
1103	If deblocking filter parameters are sent in the slice segment header, varying deblocking filter
1104	parameters can be specified by setting parameters tcOffsetDiv2 and betaOffsetDiv2 in the GOP structure table.
1105	In this case, the final value of the deblocking filter parameter sent for a certain GOP picture is equal to
1106	(base parameter + GOP parameter for this picture). Intra-pictures use the base parameters values.
1107	\\
1108
1109	\Option{LoopFilterTcOffset_div2}&
1110	\ShortOption{\None}&
1111	\Default{0}&
1112	Specifies the base value for the in-loop deblocking filter parameter tc_offset_div2. The final value of tc_offset_div2
1113	shall be an integer number in the range $[-6, 6]$.
1114	\\
1115
1116	\Option{LoopFilterBetaOffset_div2}&
1117	\ShortOption{\None}&
1118	\Default{0}&
1119	Specifies the base value for the in-loop deblocking filter parameter beta_offset_div2. The final value of beta_offset_div2
1120	shall be an integer number in the range $[-6, 6]$.
1121	\\
1122
1123	\end{OptionTable}
1124
1125
1126
1127	%%
1128	%% Coding tools parameters
1129	%%
1130	\begin{OptionTable}{Coding tools parameters}
1131	%\Option{ALF} &
1132	%\ShortOption{\None} &
1133	%\Default{true} &
1134	%Enables or disables the adaptive loop filter.
1135	%\\
1136
1137	%\Option{ALFLowLatencyEncode} &
1138	%\ShortOption{\None} &
1139	%\Default{false} &
1140	%Specifies the operating mode (low latency or high efficiency) of the
1141	%adaptive loop filter.
1142	%\\
1143
1144	\Option{SAO} &
1145	\ShortOption{\None} &
1146	\Default{true} &
1147	Enables or disables the sample adaptive offset (SAO) filter.
1148	\\
1149
1150	\Option{SAOLcuBoundary} &
1151	\ShortOption{\None} &
1152	\Default{false} &
1153	Enables or disables SAO parameter estimation using non-deblocked pixels
1154	for LCU bottom and right boundary areas.
1155	\\
1156
1157	%\Option{LMChroma} &
1158	%\ShortOption{\None} &
1159	%\Default{true} &
1160	%Enables or disables the intra chroma-from-luma prediction mode.
1161	%\\
1162
1163	%\Option{NSQT} &
1164	%\ShortOption{\None} &
1165	%\Default{true} &
1166	%Enables or disables the non-square quadtree transform.
1167	%\\
1168
1169	\Option{ConstrainedIntraPred} &
1170	\ShortOption{\None} &
1171	\Default{false} &
1172	Enables or disables constrained intra prediction. Constrained intra
1173	prediction only permits samples from intra blocks in the same slice as the
1174	current block to be used for intra prediction.
1175	\\
1176
1177	\Option{TransquantBypassEnableFlag} &
1178	\ShortOption{\None} &
1179	\Default{false} &
1180	Enables or disables the ability to bypass the transform,
1181	quantization and filtering stages at CU level.
1182	This option corresponds to the value of
1183	transquant_bypass_enable_flag that is transmitted in the PPS.
1184
1185	See CUTransquantBypassFlagValue for further details.
1186	\\
1187
1188	\Option{CUTransquantBypassFlagValue} &
1189	\ShortOption{\None} &
1190	\Default{0} &
1191	Controls the per CU transformation, quantization and filtering
1192	mode decision.
1193	This option corresponds to the value of the per CU cu_transquant_bypass_flag.
1194	\par
1195	\begin{tabular}{cp{0.45\textwidth}}
1196	0 & Bypass is not performed on any CU \\
1197	1 & Bypass is performed on all CUs \\
1198	\end{tabular}
1199
1200	This option has no effect if TransquantBypassEnableFlag is disabled.
1201	\\
1202
1203	\Option{PCMEnabledFlag} &
1204	\ShortOption{\None} &
1205	\Default{false} &
1206	Enables or disables the use of PCM.
1207	\\
1208
1209	\Option{PCMLog2MaxSize} &
1210	\ShortOption{\None} &
1211	\Default{5 \\ ($= \mathrm{log}_2(32)$)} &
1212	Specifies log2 of the maximum PCM block size. When PCM is enabled, the
1213	PCM mode is available for 2Nx2N intra PUs smaller than or equal to the
1214	specified maximum PCM block size.
1215	\\
1216
1217	\Option{PCMLog2MinSize} &
1218	\ShortOption{\None} &
1219	\Default{3} &
1220	Specifies log2 of the minimum PCM block size. When PCM is enabled, the
1221	PCM mode is available for 2Nx2N intra PUs larger than or equal to the
1222	specified minimum PCM block size.
1223	\par
1224	When larger than PCMLog2MaxSize, PCM mode is not used.
1225	\\
1226
1227	\Option{PCMInputBitDepthFlag} &
1228	\ShortOption{\None} &
1229	\Default{1} &
1230	If enabled specifies that PCM sample bit-depth is set equal to
1231	InputBitDepth. Otherwise, it specifies that PCM sample bit-depth is set
1232	equal to InternalBitDepth.
1233	\\
1234
1235	\Option{PCMFilterDisableFlag} &
1236	\ShortOption{\None} &
1237	\Default{false} &
1238	If enabled specifies that loop-filtering on reconstructed samples of PCM
1239	blocks is skipped. Otherwise, it specifies that loop-filtering on
1240	reconstructed samples of PCM blocks is not skipped.
1241	% 0 = (loop-filtering is not skipped for PCM samples).
1242	\\
1243
1244	\Option{WeightedPredP} &
1245	\ShortOption{-wpP} &
1246	\Default{false} &
1247	Enables the use of weighted prediction in P slices.
1248	\\
1249
1250	\Option{WeightedPredB} &
1251	\ShortOption{-wpB} &
1252	\Default{false} &
1253	Enables the use of weighted prediction in B slices.
1254	\\
1255
1256	\Option{SignHideFlag} &
1257	\ShortOption{-SBH} &
1258	\Default{true} &
1259	If enabled specifies that for each 4x4 coefficient group for which the
1260	number of coefficients between the first nonzero coefficient and the
1261	last nonzero coefficient along the scanning line exceeds 4, the sign bit
1262	of the first nonzero coefficient will not be directly transmitted in the
1263	bitstream, but may be inferred from the parity of the sum of all nonzero
1264	coefficients in the current coefficient group.
1265	\\
1266
1267	\Option{StrongIntraSmoothing} &
1268	\ShortOption{-sis} &
1269	\Default{true} &
1270	If enabled specifies that for 32x32 intra prediction block, the intra smoothing
1271	when applied is either the 1:2:1 smoothing filter or a stronger bi-linear
1272	interpolation filter. Key reference sample values are tested and if the criteria
1273	are satisfied, the stronger intra smoothing filter is applied.
1274	If disabled, the intra smoothing filter when applied is the 1:2:1 smoothing filter.
1275	\\
1276
1277	\Option{TMVPMode} &
1278	\ShortOption{\None} &
1279	\Default{1} &
1280	Controls the temporal motion vector prediction mode.
1281	\par
1282	\begin{tabular}{cp{0.45\textwidth}}
1283	0 & Disabled for all slices. \\
1284	1 & Enabled for all slices. \\
1285	2 & Disabled only for the first picture of each GOPSize. \\
1286	\end{tabular}
1287	\\
1288
1289	\Option{TransformSkip} &
1290	\ShortOption{\None} &
1291	\Default{false} &
1292	Enables or disables transform-skipping mode decision for 4x4 TUs
1293	\footnote{Enables transform_skip_enabled and per 4x4 TU tests}.
1294	\\
1295
1296	\Option{TransformSkipFast} &
1297	\ShortOption{\None} &
1298	\Default{false} &
1299	Enables or disables reduced testing of the transform-skipping mode
1300	decision for chroma TUs. When enabled, no RDO search is performed for
1301	chroma TUs, instead they are transform-skipped if the four corresponding
1302	luma TUs are also skipped.
1303	\par
1304	This option has no effect if TransformSkip is disabled.
1305	\\
1306	\end{OptionTable}
1307
1308	%%
1309	%% Rate control parameters
1310	%%
1311	\begin{OptionTable}{Rate control parameters}
1312
1313	\Option{RateControl} &
1314	\ShortOption{\None} &
1315	\Default{false} &
1316	Rate control: enables rate control or not.
1317	\\
1318
1319	\Option{TargetBitrate} &
1320	\ShortOption{\None} &
1321	\Default{0} &
1322	Rate control: target bitrate, in bps.
1323	\\
1324
1325	\Option{KeepHierarchicalBit} &
1326	\ShortOption{\None} &
1327	\Default{false} &
1328	Rate control: keep hierarchical bit allocation in rate control algorithm.
1329	It is suggested to enable hierarchical bit allocation for hierarchical-B coding structure.
1330	\\
1331
1332	\Option{LCULevelRateControl} &
1333	\ShortOption{\None} &
1334	\Default{true} &
1335	Rate control: true: LCU level RC; false: picture level RC.
1336	\\
1337
1338	\Option{RCLCUSeparateModel} &
1339	\ShortOption{\None} &
1340	\Default{true} &
1341	Rate control: use LCU level separate R-lambda model or not.
1342	When LCULevelRateControl is equal to false, this parameter is meaningless.
1343	\\
1344
1345	\Option{InitialQP} &
1346	\ShortOption{\None} &
1347	\Default{0} &
1348	Rate control: initial QP value for the first picture.
1349	0 to auto determine the initial QP value.
1350	\\
1351
1352	\Option{RCForceIntraQP} &
1353	\ShortOption{\None} &
1354	\Default{false} &
1355	Rate control: force intra QP to be equal to initial QP or not.
1356	\\
1357	\end{OptionTable}
1358
1359	%%
1360	%% VUI parameters
1361	%%
1362	\begin{OptionTable}{VUI parameters}
1363	\Option{VuiParametersPresent} &
1364	\ShortOption{-vui} &
1365	\Default{false} &
1366	Enable generation of vui_parameters().
1367	\\
1368	\Option{AspectRatioInfoPresent} &
1369	\ShortOption{} &
1370	\Default{false} &
1371	Signals whether aspect_ratio_idc is present.
1372	\\
1373	\Option{AspectRatioIdc} &
1374	\ShortOption{} &
1375	\Default{0} &
1376	aspect_ratio_idc
1377	\\
1378	\Option{SarWidth} &
1379	\ShortOption{} &
1380	\Default{0} &
1381	Specifies the horizontal size of the sample aspect ratio.
1382	\\
1383	\Option{SarHeight} &
1384	\ShortOption{} &
1385	\Default{0} &
1386	Specifies the vertical size of the sample aspect ratio.
1387	\\
1388	\Option{OverscanInfoPresent} &
1389	\ShortOption{} &
1390	\Default{false} &
1391	Signals whether overscan_info_present_flag is present.
1392	\\
1393	\Option{OverscanAppropriate} &
1394	\ShortOption{} &
1395	\Default{false} &
1396	Indicates whether cropped decoded pictures are suitable for display using overscan.
1397	\par
1398	\begin{tabular}{cp{0.45\textwidth}}
1399	0 & Indicates that the decoded pictures should not be displayed using overscan. \\
1400	1 & Indicates that the decoded pictures may be displayed using overscan. \\
1401	\end{tabular}
1402	\\
1403	\Option{VideoSignalTypePresent} &
1404	\ShortOption{} &
1405	\Default{false} &
1406	Signals whether video_format, video_full_range_flag, and colour_description_present_flag are present.
1407	\\
1408	\Option{VideoFormat} &
1409	\ShortOption{} &
1410	\Default{5} &
1411	Indicates representation of pictures.
1412	\\
1413	\Option{VideoFullRange} &
1414	\ShortOption{} &
1415	\Default{false} &
1416	Indicates the black level and range of luma and chroma signals.
1417	\par
1418	\begin{tabular}{cp{0.45\textwidth}}
1419	0 & Indicates that the luma and chroma signals are to be scaled prior to display. \\
1420	1 & Indicates that the luma and chroma signals are not to be scaled prior to display. \\
1421	\end{tabular}
1422	\\
1423	\Option{ColourDescriptionPresent} &
1424	\ShortOption{} &
1425	\Default{false} &
1426	Signals whether colour_primaries, transfer_characteristics and matrix_coefficients are present.
1427	\\
1428	\Option{ColourPrimaries} &
1429	\ShortOption{} &
1430	\Default{2} &
1431	Indicates chromaticity coordinates of the source primaries.
1432	\\
1433	\Option{TransferCharateristics} &
1434	\ShortOption{} &
1435	\Default{2} &
1436	Indicates the opto-electronic transfer characteristics of the source.
1437	\\
1438	\Option{MatrixCoefficients} &
1439	\ShortOption{} &
1440	\Default{2} &
1441	Describes the matrix coefficients used in deriving luma and chroma from RGB primaries.
1442	\\
1443	\Option{ChromaLocInfoPresent} &
1444	\ShortOption{} &
1445	\Default{false} &
1446	Signals whether chroma_sample_loc_type_top_field and chroma_sample_loc_type_bottom_field are present.
1447	\\
1448	\Option{ChromaSampleLocTypeTopField} &
1449	\ShortOption{} &
1450	\Default{0} &
1451	Specifies the location of chroma samples for top field.
1452	\\
1453	\Option{ChromaSampleLocTypeBottomField} &
1454	\ShortOption{} &
1455	\Default{0} &
1456	Specifies the location of chroma samples for bottom field.
1457	\\
1458	\Option{NeutralChromaIndication} &
1459	\ShortOption{} &
1460	\Default{false} &
1461	Indicates that the value of all decoded chroma samples is equal to $1 << (\mathrm{BitDepthCr} - 1)$.
1462	\\
1463
1464	\Option{DefaultDisplayWindowFlag} &
1465	\ShortOption{\None} &
1466	\Default{0} &
1467	Indicates the presence of the Default Window parameters.
1468	\par
1469	\begin{tabular}{cp{0.45\textwidth}}
1470	0 & Disabled \\
1471	1 & Enabled \\
1472	\end{tabular}
1473	\\
1474
1475	\Option{DefDispWinLeftOffset}%
1476	\Option{DefDispWinRightOffset}%
1477	\Option{DefDispWinTopOffset}%
1478	\Option{DefDispWinBottomOffset} &
1479	\ShortOption{\None} &
1480	\Default{0} &
1481	Specifies the horizontal and vertical offset to be applied to the
1482	input video from the conformance window in luma samples.
1483	Must be a multiple of the chroma resolution (e.g. a multiple of two for 4:2:0).
1484	\\
1485
1486	\Option{BitstreamRestriction} &
1487	\ShortOption{} &
1488	\Default{false} &
1489	Signals whether bitstream restriction parameters are present.
1490	\\
1491	\Option{TilesFixedStructure} &
1492	\ShortOption{} &
1493	\Default{false} &
1494	Indicates that each active picture parameter set has the same values of the syntax elements related to tiles.
1495	\\
1496	\Option{MotionVectorsOverPicBoundaries} &
1497	\ShortOption{} &
1498	\Default{false} &
1499	Indicates that no samples outside the picture boundaries are used for inter prediction.
1500	\\
1501	\Option{MaxBytesPerPicDenom} &
1502	\ShortOption{} &
1503	\Default{2} &
1504	Indicates a number of bytes not exceeded by the sum of the sizes of the VCL NAL units associated with any coded picture.
1505	\\
1506	\Option{MaxBitsPerMinCuDenom} &
1507	\ShortOption{} &
1508	\Default{1} &
1509	Indicates an upper bound for the number of bits of coding_unit() data.
1510	\\
1511	\Option{Log2MaxMvLengthHorizontal} &
1512	\ShortOption{} &
1513	\Default{15} &
1514	Indicates the maximum absolute value of a decoded horizontal MV component in quarter-pel luma units.
1515	\\
1516	\Option{Log2MaxMvLengthVertical} &
1517	\ShortOption{} &
1518	\Default{15} &
1519	Indicates the maximum absolute value of a decoded vertical MV component in quarter-pel luma units.
1520	\\
1521	\end{OptionTable}
1522
1523	%%
1524	%% SEI messages
1525	%%
1526	\begin{OptionTable}{SEI messages}
1527	\Option{SEIDecodedPictureHash} &
1528	\ShortOption{\None} &
1529	\Default{0} &
1530	Enables or disables the calculation and insertion of the Decoded picture hash
1531	SEI messages.
1532	\par
1533	\begin{tabular}{cp{0.45\textwidth}}
1534	0 & Disabled \\
1535	1 & Transmits MD5 in SEI message and writes the value to the encoder
1536	log \\
1537	2 & Transmits CRC in SEI message and writes the value to the encoder
1538	log \\
1539	3 & Transmits checksum in SEI message and writes the value to the encoder
1540	log \\
1541	\end{tabular}
1542	\\
1543	\Option{SEIpictureDigest} &
1544	\ShortOption{\None} &
1545	\Default{0} &
1546	Deprecated alias for SEIDecodedPictureHash.
1547	Do not use anymore.
1548	\\
1549	\Option{SEIRecoveryPoint} &
1550	\ShortOption{\None} &
1551	\Default{0} &
1552	Enables or disables the insertion of the Recovery point
1553	SEI messages.
1554	\\
1555	\Option{SEIActiveParameterSets} &
1556	\ShortOption{\None} &
1557	\Default{0} &
1558	Enables or disables the insertion of the Active parameter sets
1559	SEI messages.
1560	\\
1561	\Option{SEIBufferingPeriod} &
1562	\ShortOption{\None} &
1563	\Default{0} &
1564	Enables or disables the insertion of the Buffering period
1565	SEI messages. This option has no effect if VuiParametersPresent is disabled.
1566	SEIBufferingPeriod requires SEIActiveParameterSets to be enabled.
1567	\\
1568	\Option{SEIPictureTiming} &
1569	\ShortOption{\None} &
1570	\Default{0} &
1571	Enables or disables the insertion of the Picture timing
1572	SEI messages. This option has no effect if VuiParametersPresent is disabled.
1573	\\
1574	\Option{SEIDecodingUnitInfo} &
1575	\ShortOption{\None} &
1576	\Default{0} &
1577	Enables or disables the insertion of the Decoding unit information
1578	SEI messages. This option has no effect if VuiParametersPresent is disabled.
1579	\\
1580	\Option{SEIGradualDecodingRefreshInfo} &
1581	\ShortOption{\None} &
1582	\Default{0} &
1583	Enables or disables the insertion of the Gradual decoding refresh information
1584	SEI messages.
1585	\\
1586	\Option{SEITemporalLevel0Index} &
1587	\ShortOption{\None} &
1588	\Default{0} &
1589	Enables or disables the insertion of the Temporal level zero index
1590	SEI messages.
1591	\\
1592	\Option{SEIDisplayOrientation} &
1593	\ShortOption{\None} &
1594	\Default{0} &
1595	Enables or disables the insertion of the Display orientation
1596	SEI messages.
1597	\par
1598	\begin{tabular}{cp{0.30\textwidth}}
1599	0 & Disabled \\
1600	N: $0 < N < (2^{16} - 1)$ & Enable display orientation SEI message with
1601	\mbox{anticlockwise_rotation = N}
1602	and \mbox{display_orientation_repetition_period = 1} \\
1603	\end{tabular}
1604	\\
1605	\Option{SEIFramePacking} &
1606	\ShortOption{\None} &
1607	\Default{0} &
1608	Enables or disables the insertion of the Frame packing arrangement SEI messages.
1609	\\
1610	\Option{SEIFramePackingType} &
1611	\ShortOption{\None} &
1612	\Default{0} &
1613	Indicates the arrangement type in the Frame packing arrangement SEI message.
1614	This option has no effect if SEIFramePacking is disabled.
1615	\par
1616	\begin{tabular}{cp{0.45\textwidth}}
1617	0 & Checkerboard \\
1618	1 & Line Alternate \\
1619	2 & Column Alternate \\
1620	3 & Side by Side \\
1621	4 & Top Bottom \\
1622	5 & Frame Alternate \\
1623	6 & 2D Image \\
1624	7 & Tile Format \\
1625	\end{tabular}
1626	\\
1627	\Option{SEIFramePackingInterpretation} &
1628	\ShortOption{\None} &
1629	\Default{0} &
1630	Indicates the constituent frames relationship in the Frame packing arrangement SEI message.
1631	This option has no effect if SEIFramePacking is disabled.
1632	\par
1633	\begin{tabular}{cp{0.45\textwidth}}
1634	0 & Unspecified \\
1635	1 & Frame 0 is associated with the left view of a stereo pair \\
1636	2 & Frame 0 is associated with the right view of a stereo pair \\
1637	\end{tabular}
1638	\\
1639	\Option{SEIFramePackingQuincunx} &
1640	\ShortOption{\None} &
1641	\Default{0} &
1642	Enables or disables the quincunx_sampling signalling in the
1643	Frame packing arrangement SEI messages. This option has no
1644	effect if SEIFramePacking is disabled.
1645	\\
1646	\Option{SEIFramePackingId} &
1647	\ShortOption{\None} &
1648	\Default{0} &
1649	Indicates the session number in the Frame packing arrangement
1650	SEI messages. This option has no effect if SEIFramePacking is
1651	disabled.
1652	\\
1653	\end{OptionTable}
1654
1655	%%
1656	%%
1657	%%
1658	\subsection{Hardcoded encoder parameters}
1659	\begin{MacroTable}{CommonDef.h constants}
1660	ADAPT_SR_SCALE &
1661	1 &
1662	Defines a scaling factor used to derive the motion search range when it is
1663	adaptive (see ASR configuration parameter). Default value is 1.
1664	\\
1665
1666	MAX_GOP &
1667	64 &
1668	maximum value of the hierarchical GOP size.
1669	\\
1670
1671	MAX_NUM_REF &
1672	4 &
1673	maximum number of multiple reference frames
1674	\\
1675
1676	MAX_NUM_REF_LC &
1677	8 &
1678	maximum number of combined reference frames
1679	\\
1680
1681	AMVP_MAX_NUM_CANDS &
1682	2 &
1683	maximum number of final candidates
1684	\\
1685
1686	AMVP_MAX_NUM_CANDS_MEM &
1687	3 &
1688	\\
1689
1690	MRG_MAX_NUM_CANDS &
1691	5 &
1692	\\
1693
1694	DYN_REF_FREE &
1695	off &
1696	dynamic free of reference memories
1697	\\
1698
1699	MAX_TLAYER &
1700	8 &
1701	maximum number of temporal layers
1702	\\
1703
1704	HB_LAMBDA_FOR_LDC &
1705	on &
1706	use of B-style lambda for non-key pictures in low-delay mode
1707	\\
1708
1709	GPB_SIMPLE &
1710	on &
1711	Fast estimation of generalized B in low-delay mode
1712	\\
1713
1714	GPB_SIMPLE_UNI &
1715	on &
1716	Fast estimation of generalized B in low-delay mode for uni-direction
1717	\\
1718
1719	FASTME_SMOOTHER_MV &
1720	on &
1721	Fast ME using smoother MV assumption
1722	\\
1723
1724	ADAPT_SR_SCALE &
1725	on &
1726	division factor for adaptive search range
1727	\\
1728
1729	CLIP_TO_709_RANGE &
1730	off &
1731	\\
1732
1733	EARLY_SKIP_THRES &
1734	1.5 &
1735	early skip if RD $<$ EARLY_SKIP_THRES*avg[BestSkipRD]
1736	\\
1737
1738	MAX_NUM_REF_PICS &
1739	16 &
1740	\\
1741
1742	MAX_CHROMA_FORMAT_IDC &
1743	3 &
1744	\\
1745	\end{MacroTable}
1746
1747	\subsubsection*{TypeDef.h}
1748	Numerous constants that guard individual adoptions are defined within
1749	\url{source/Lib/TLibCommon/TypeDef.h}.
1750
1751	%%
1752	%%
1753	%%
1754	\clearpage
1755	\section{Using the decoder}
1756	\begin{verbatim}
1757	TAppDecoder -b str.bin -o dec.yuv [options]
1758	\end{verbatim}
1759
1760	\begin{OptionTable}{Decoder options}
1761	\Option{} &
1762	\ShortOption{-h} &
1763	\Default{\None} &
1764	Prints usage information.
1765	\\
1766
1767	\Option{} &
1768	\ShortOption{-o} &
1769	\Default{\NotSet} &
1770	Defines reconstructed YUV file name.
1771	\\
1772
1773	\Option{} &
1774	\ShortOption{-s} &
1775	\Default{0} &
1776	Defines the number of pictures in decoding order to skip.
1777	\\
1778
1779	\Option{OutputBitDepth} &
1780	\ShortOption{-d} &
1781	\Default{0 \\ (Native)} &
1782	Specifies the luma bit-depth of the reconstructed YUV file (the value 0 indicates
1783	that the native bit-depth is used)
1784	\\
1785
1786	\Option{OutputBitDepthC} &
1787	\ShortOption{\None} &
1788	\Default{0 \\ (Native)} &
1789	Defines the chroma bit-depth of the reconstructed YUV file (the value 0 indicates
1790	that the native bit-depth is used)
1791	\\
1792
1793	\Option{SEIPictureDigest} &
1794	\ShortOption{\None} &
1795	\Default{1} &
1796	Enable or disable verification of any Picture hash SEI messages. When
1797	this parameter is set to 0, the feature is disabled and all messages are
1798	ignored. When set to 1 (default), the feature is enabled and the decoder
1799	has the following behaviour:
1800	\begin{itemize}
1801	\item
1802	If Picture hash SEI messages are included in the bitstream, the same type
1803	of hash is calculated for each decoded picture and written to the
1804	log together with an indication whether the calculated value matches
1805	the value in the SEI message.
1806	Decoding will continue even if there is a mismatch.
1807
1808	\item
1809	After decoding is complete, if any MD5sum comparison failed, a warning
1810	is printed and the decoder exits with the status EXIT_FAILURE.
1811
1812	\item
1813	The per-picture MD5 log message has the following formats:
1814	[MD5:d41d8cd98f00b204e9800998ecf8427e,(OK)],
1815	[MD5:d41d8cd98f00b204e9800998ecf8427e,(unk)],
1816	[MD5:d41d8cd98f00b204e9800998ecf8427e,(*ERROR*)] [rxMD5:b9e1...]
1817	where, "(unk)" implies that no MD5 was signalled for this picture,
1818	"(OK)" implies that the decoder agrees with the signalled MD5,
1819	"(*ERROR*)" implies that the decoder disagrees with the signalled
1820	MD5. "[rxMD5:...]" is the signalled MD5 if different.
1821	\end{itemize}
1822	\\
1823
1824	\Option{RespectDefDispWindow} &
1825	\ShortOption{-w} &
1826	\Default{0} &
1827	Video region to be output by the decoder.
1828	\par
1829	\begin{tabular}{cp{0.45\textwidth}}
1830	0 & Output content inside the conformance window. \\
1831	1 & Output content inside the default window. \\
1832	\end{tabular}
1833	\\
1834
1835	\end{OptionTable}
1836
1837
1838	\end{document}

Note: See TracBrowser for help on using the repository browser.

JCT-3V 3D-HEVC

Context navigation

source: 3DVCSoftware/branches/HTM-DEV-0.3-dev2/doc/software-manual.tex @ 530

Download in other formats: