<?xml version="1.0" encoding="UTF-8"?><toc><section id="sec_foreword"><title>Foreword</title></section><section id="sec_intro"><title>Introduction</title></section><section id="sec_1"><label>1</label><title>Scope</title></section><section id="sec_2"><label>2</label><title>Normative references</title></section><section id="sec_3"><label>3</label><title>Terms, definitions, abbreviated terms and symbols</title><section id="sec_3.1"><label>3.1</label><title>Terms and definitions</title></section><section id="sec_3.2"><label>3.2</label><title>Abbreviated terms</title></section><section id="sec_3.3"><label>3.3</label><title>Symbols</title><section id="sec_3.3.1"><label>3.3.1</label><title>Arithmetic operators and mathematical functions</title></section><section id="sec_3.3.2"><label>3.3.2</label><title>Order of operation precedence</title></section><section id="sec_3.3.3"><label>3.3.3</label><title>Range notation</title></section><section id="sec_3.3.4"><label>3.3.4</label><title>Variables</title></section><section id="sec_3.3.5"><label>3.3.5</label><title>Processes</title></section><section id="sec_3.3.6"><label>3.3.6</label><title>Syntax structures</title></section><section id="sec_3.3.7"><label>3.3.7</label><title>Conventions for indicating the number of boxes in tables</title></section></section></section><section id="sec_4"><label>4</label><title>Overview</title><section id="sec_4.1"><label>4.1</label><title>Overall architecture</title></section><section id="sec_4.2"><label>4.2</label><title>Projected omnidirectional video/images</title><section id="sec_4.2.1"><label>4.2.1</label><title>General</title></section><section id="sec_4.2.2"><label>4.2.2</label><title>Stitching, rotation, projection, and region-wise packing</title></section></section><section id="sec_4.3"><label>4.3</label><title>Fisheye omnidirectional video/images</title></section><section id="sec_4.4"><label>4.4</label><title>Mesh omnidirectional video</title></section><section 
id="sec_4.5"><label>4.5</label><title>Streaming methods for omnidirectional video</title><section id="sec_4.5.1"><label>4.5.1</label><title>Overview</title></section><section id="sec_4.5.2"><label>4.5.2</label><title>Tile-based streaming with viewport-specific author-driven binding</title></section><section id="sec_4.5.3"><label>4.5.3</label><title>Tile-based streaming with free-viewport author-driven binding</title></section><section id="sec_4.5.4"><label>4.5.4</label><title>Tile-based streaming with late binding</title><section id="sec_4.5.4.1"><label>4.5.4.1</label><title>Strategy</title></section><section id="sec_4.5.4.2"><label>4.5.4.2</label><title>Bitstream rewriting</title><section id="sec_4.5.4.2.1"><label>4.5.4.2.1</label><title>General</title></section><section id="sec_4.5.4.2.2"><label>4.5.4.2.2</label><title>HEVC bitstream rewriting</title></section><section id="sec_4.5.4.2.3"><label>4.5.4.2.3</label><title>VVC bitstream rewriting</title></section></section></section></section><section id="sec_4.6"><label>4.6</label><title>Additional functionalities</title></section><section id="sec_4.7"><label>4.7</label><title>Conformance and interoperability</title><section id="sec_4.7.1"><label>4.7.1</label><title>General</title></section><section id="sec_4.7.2"><label>4.7.2</label><title>Media profiles</title><section id="sec_4.7.2.1"><label>4.7.2.1</label><title>General</title></section><section id="sec_4.7.2.2"><label>4.7.2.2</label><title>File decoding process and file decoder requirements for video and image media profiles</title></section><section id="sec_4.7.2.3"><label>4.7.2.3</label><title>File decoding process and file decoder requirements for audio media profiles</title></section></section><section id="sec_4.7.3"><label>4.7.3</label><title>Presentation profiles</title></section><section id="sec_4.7.4"><label>4.7.4</label><title>Toolset brands</title></section><section id="sec_4.7.5"><label>4.7.5</label><title>Summary of referenceable code 
points</title><section id="sec_4.7.5.1"><label>4.7.5.1</label><title>Brands</title></section><section id="sec_4.7.5.2"><label>4.7.5.2</label><title>Uniform resource names</title></section><section id="sec_4.7.5.3"><label>4.7.5.3</label><title>Restricted scheme types</title></section><section id="sec_4.7.5.4"><label>4.7.5.4</label><title>Sample entry types</title></section><section id="sec_4.7.5.5"><label>4.7.5.5</label><title>Box types</title></section><section id="sec_4.7.5.6"><label>4.7.5.6</label><title>Track grouping types</title></section><section id="sec_4.7.5.7"><label>4.7.5.7</label><title>Entity grouping types</title></section><section id="sec_4.7.5.8"><label>4.7.5.8</label><title>Sample grouping types</title></section></section></section></section><section id="sec_5"><label>5</label><title>Omnidirectional video projection and region-wise packing</title><section id="sec_5.1"><label>5.1</label><title>Coordinate system</title></section><section id="sec_5.2"><label>5.2</label><title>Omnidirectional projection formats</title><section id="sec_5.2.1"><label>5.2.1</label><title>General</title></section><section id="sec_5.2.2"><label>5.2.2</label><title>Equirectangular projection for one sample location</title></section><section id="sec_5.2.3"><label>5.2.3</label><title>Cubemap projection for one sample location</title></section></section><section id="sec_5.3"><label>5.3</label><title>Conversion from the local coordinate axes to the global coordinate axes</title></section><section id="sec_5.4"><label>5.4</label><title>Region-wise packing formats</title><section id="sec_5.4.1"><label>5.4.1</label><title>General</title></section><section id="sec_5.4.2"><label>5.4.2</label><title>Conversion of one sample location for rectangular region-wise packing</title></section></section></section><section id="sec_6"><label>6</label><title>Fisheye omnidirectional video</title><section id="sec_6.1"><label>6.1</label><title>General</title></section><section 
id="sec_6.2"><label>6.2</label><title>The FisheyeVideoEssentialInfoStruct() syntax structure</title><section id="sec_6.2.1"><label>6.2.1</label><title>Syntax</title></section><section id="sec_6.2.2"><label>6.2.2</label><title>Semantics</title></section></section><section id="sec_6.3"><label>6.3</label><title>The FisheyeVideoSupplementalInfoStruct() syntax structure</title><section id="sec_6.3.1"><label>6.3.1</label><title>Syntax</title></section><section id="sec_6.3.2"><label>6.3.2</label><title>Semantics</title></section></section></section><section id="sec_7"><label>7</label><title>Omnidirectional media storage and metadata signalling in the ISOBMFF</title><section id="sec_7.1"><label>7.1</label><title>Generic extensions to the ISOBMFF</title><section id="sec_7.1.1"><label>7.1.1</label><title>Indication of a track not intended to be presented alone</title></section><section id="sec_7.1.2"><label>7.1.2</label><title>Clarifications on the stereo video box</title></section><section id="sec_7.1.3"><label>7.1.3</label><title>Generic sub-picture track grouping extensions</title><section id="sec_7.1.3.1"><label>7.1.3.1</label><title>Updated semantics of track_group_type</title></section><section id="sec_7.1.3.2"><label>7.1.3.2</label><title>Two dimensional spatial relationship</title><section id="sec_7.1.3.2.1"><label>7.1.3.2.1</label><title>Definition</title></section><section id="sec_7.1.3.2.2"><label>7.1.3.2.2</label><title>Syntax</title></section><section id="sec_7.1.3.2.3"><label>7.1.3.2.3</label><title>Semantics</title></section></section><section id="sec_7.1.3.3"><label>7.1.3.3</label><title>Spatial relationship 2D sample group</title><section id="sec_7.1.3.3.1"><label>7.1.3.3.1</label><title>Definition</title></section><section id="sec_7.1.3.3.2"><label>7.1.3.3.2</label><title>Syntax</title></section><section id="sec_7.1.3.3.3"><label>7.1.3.3.3</label><title>Semantics</title></section></section></section><section id="sec_7.1.4"><label>7.1.4</label><title>Media 
offset box</title><section id="sec_7.1.4.1"><label>7.1.4.1</label><title>Definition</title></section><section id="sec_7.1.4.2"><label>7.1.4.2</label><title>Syntax</title></section><section id="sec_7.1.4.3"><label>7.1.4.3</label><title>Semantics</title></section></section></section><section id="sec_7.2"><label>7.2</label><title>Generic extensions to ISO/IEC 14496-15</title><section id="sec_7.2.1"><label>7.2.1</label><title>Containing of SpatialRelationship2DDescriptionBox for HEVC tile base track and HEVC tile tracks</title></section></section><section id="sec_7.3"><label>7.3</label><title>OMAF-specific extensions to the ISOBMFF</title><section id="sec_7.3.1"><label>7.3.1</label><title>Sync samples in timed metadata tracks</title></section></section><section id="sec_7.4"><label>7.4</label><title>OMAF-specific extensions to ISO/IEC 14496-15</title><section id="sec_7.4.1"><label>7.4.1</label><title>Coverage information box in an HEVC tile base track</title></section></section><section id="sec_7.5"><label>7.5</label><title>Structures and semantics that are common for video tracks and image items</title><section id="sec_7.5.1"><label>7.5.1</label><title>Semantics of sample locations within a decoded picture</title><section id="sec_7.5.1.1"><label>7.5.1.1</label><title>Relation of decoded pictures to global coordinate axes</title></section><section id="sec_7.5.1.2"><label>7.5.1.2</label><title>Mapping of luma sample locations within a decoded picture to sphere coordinates relative to the global coordinate axes</title></section><section id="sec_7.5.1.3"><label>7.5.1.3</label><title>Conversion from a sample location in a projected picture to sphere coordinates relative to the global coordinate axes</title></section></section><section id="sec_7.5.2"><label>7.5.2</label><title>Projection format structure</title><section id="sec_7.5.2.1"><label>7.5.2.1</label><title>Syntax</title></section><section 
id="sec_7.5.2.2"><label>7.5.2.2</label><title>Semantics</title></section></section><section id="sec_7.5.3"><label>7.5.3</label><title>Region-wise packing structure</title><section id="sec_7.5.3.1"><label>7.5.3.1</label><title>Definition</title></section><section id="sec_7.5.3.2"><label>7.5.3.2</label><title>Syntax of the rectangular region packing structure</title></section><section id="sec_7.5.3.3"><label>7.5.3.3</label><title>Semantics of the rectangular region packing structure</title></section><section id="sec_7.5.3.4"><label>7.5.3.4</label><title>Syntax of the guard band structure</title></section><section id="sec_7.5.3.5"><label>7.5.3.5</label><title>Semantics of the guard band structure</title></section><section id="sec_7.5.3.6"><label>7.5.3.6</label><title>Syntax of the region-wise packing structure</title></section><section id="sec_7.5.3.7"><label>7.5.3.7</label><title>Semantics of the region-wise packing structure</title></section><section id="sec_7.5.3.8"><label>7.5.3.8</label><title>Derivation of region-wise packing variables and constraints for the syntax elements of the region-wise packing structure</title></section></section><section id="sec_7.5.4"><label>7.5.4</label><title>Rotation structure</title><section id="sec_7.5.4.1"><label>7.5.4.1</label><title>Definition</title></section><section id="sec_7.5.4.2"><label>7.5.4.2</label><title>Syntax</title></section><section id="sec_7.5.4.3"><label>7.5.4.3</label><title>Semantics</title></section></section><section id="sec_7.5.5"><label>7.5.5</label><title>Content coverage structure</title><section id="sec_7.5.5.1"><label>7.5.5.1</label><title>Definition</title></section><section id="sec_7.5.5.2"><label>7.5.5.2</label><title>Syntax</title></section><section id="sec_7.5.5.3"><label>7.5.5.3</label><title>Semantics</title></section></section><section id="sec_7.5.6"><label>7.5.6</label><title>Sphere region structure</title><section id="sec_7.5.6.1"><label>7.5.6.1</label><title>Definition</title></section><section 
id="sec_7.5.6.2"><label>7.5.6.2</label><title>Syntax</title></section><section id="sec_7.5.6.3"><label>7.5.6.3</label><title>Semantics</title></section></section></section><section id="sec_7.6"><label>7.6</label><title>Restricted video schemes for omnidirectional video</title><section id="sec_7.6.1"><label>7.6.1</label><title>Scheme types</title><section id="sec_7.6.1.1"><label>7.6.1.1</label><title>Open-ended and closed scheme types</title></section><section id="sec_7.6.1.2"><label>7.6.1.2</label><title>Projected omnidirectional video ('podv')</title></section><section id="sec_7.6.1.3"><label>7.6.1.3</label><title>Equirectangular projected video ('erpv')</title></section><section id="sec_7.6.1.4"><label>7.6.1.4</label><title>Packed equirectangular or cubemap projected video ('ercm')</title></section><section id="sec_7.6.1.5"><label>7.6.1.5</label><title>Fisheye omnidirectional video ('fodv')</title></section><section id="sec_7.6.1.6"><label>7.6.1.6</label><title>Equirectangular or cubemap projected video with overlays ('ecov')</title></section><section id="sec_7.6.1.7"><label>7.6.1.7</label><title>Packed equirectangular or cubemap projected video with derived region-wise packing ('erc2')</title></section><section id="sec_7.6.1.8"><label>7.6.1.8</label><title>Open-ended scheme type for mesh omnidirectional video ('modv')</title></section><section id="sec_7.6.1.9"><label>7.6.1.9</label><title>Closed scheme type for mesh omnidirectional video ('meov')</title></section></section><section id="sec_7.6.2"><label>7.6.2</label><title>Projected omnidirectional video box</title><section id="sec_7.6.2.1"><label>7.6.2.1</label><title>Definition</title></section><section id="sec_7.6.2.2"><label>7.6.2.2</label><title>Syntax</title></section></section><section id="sec_7.6.3"><label>7.6.3</label><title>Fisheye omnidirectional video box</title><section id="sec_7.6.3.1"><label>7.6.3.1</label><title>Definition</title></section><section 
id="sec_7.6.3.2"><label>7.6.3.2</label><title>Syntax</title></section></section><section id="sec_7.6.4"><label>7.6.4</label><title>Region-wise packing box</title><section id="sec_7.6.4.1"><label>7.6.4.1</label><title>Definition</title></section><section id="sec_7.6.4.2"><label>7.6.4.2</label><title>Syntax</title></section><section id="sec_7.6.4.3"><label>7.6.4.3</label><title>Semantics</title></section></section><section id="sec_7.6.5"><label>7.6.5</label><title>Rotation box</title><section id="sec_7.6.5.1"><label>7.6.5.1</label><title>Definition</title></section><section id="sec_7.6.5.2"><label>7.6.5.2</label><title>Syntax</title></section></section><section id="sec_7.6.6"><label>7.6.6</label><title>Coverage information box</title><section id="sec_7.6.6.1"><label>7.6.6.1</label><title>Definition</title></section><section id="sec_7.6.6.2"><label>7.6.6.2</label><title>Syntax</title></section></section><section id="sec_7.6.7"><label>7.6.7</label><title>Mesh omnidirectional video box</title><section id="sec_7.6.7.1"><label>7.6.7.1</label><title>Definition</title></section><section id="sec_7.6.7.2"><label>7.6.7.2</label><title>Syntax</title></section></section><section id="sec_7.6.8"><label>7.6.8</label><title>Mesh box</title><section id="sec_7.6.8.1"><label>7.6.8.1</label><title>Definition</title></section><section id="sec_7.6.8.2"><label>7.6.8.2</label><title>Syntax</title></section><section id="sec_7.6.8.3"><label>7.6.8.3</label><title>Semantics</title></section><section id="sec_7.6.8.4"><label>7.6.8.4</label><title>3D parallelogram structure</title></section><section id="sec_7.6.8.5"><label>7.6.8.5</label><title>3D vector structure</title></section></section></section><section id="sec_7.7"><label>7.7</label><title>Timed metadata for sphere regions</title><section id="sec_7.7.1"><label>7.7.1</label><title>General</title></section><section id="sec_7.7.2"><label>7.7.2</label><title>Sample entry</title><section 
id="sec_7.7.2.1"><label>7.7.2.1</label><title>Definition</title></section><section id="sec_7.7.2.2"><label>7.7.2.2</label><title>Syntax</title></section><section id="sec_7.7.2.3"><label>7.7.2.3</label><title>Semantics</title></section></section><section id="sec_7.7.3"><label>7.7.3</label><title>Sample format</title><section id="sec_7.7.3.1"><label>7.7.3.1</label><title>Definition</title></section><section id="sec_7.7.3.2"><label>7.7.3.2</label><title>Syntax</title></section><section id="sec_7.7.3.3"><label>7.7.3.3</label><title>Semantics</title></section></section><section id="sec_7.7.4"><label>7.7.4</label><title>Initial viewing orientation</title><section id="sec_7.7.4.1"><label>7.7.4.1</label><title>Definition</title></section><section id="sec_7.7.4.2"><label>7.7.4.2</label><title>Sample syntax</title></section><section id="sec_7.7.4.3"><label>7.7.4.3</label><title>Sample semantics</title></section></section><section id="sec_7.7.5"><label>7.7.5</label><title>Recommended viewport</title><section id="sec_7.7.5.1"><label>7.7.5.1</label><title>Definition</title></section><section id="sec_7.7.5.2"><label>7.7.5.2</label><title>Sample entry syntax</title></section><section id="sec_7.7.5.3"><label>7.7.5.3</label><title>Sample entry semantics</title></section><section id="sec_7.7.5.4"><label>7.7.5.4</label><title>Sample syntax</title></section><section id="sec_7.7.5.5"><label>7.7.5.5</label><title>Sample semantics</title></section></section><section id="sec_7.7.6"><label>7.7.6</label><title>Timed text sphere location metadata</title><section id="sec_7.7.6.1"><label>7.7.6.1</label><title>General</title></section><section id="sec_7.7.6.2"><label>7.7.6.2</label><title>Sample entry format</title></section><section id="sec_7.7.6.3"><label>7.7.6.3</label><title>Sample format</title></section></section></section><section id="sec_7.8"><label>7.8</label><title>Signalling of region-wise quality ranking</title><section 
id="sec_7.8.1"><label>7.8.1</label><title>General</title></section><section id="sec_7.8.2"><label>7.8.2</label><title>Spherical region-wise quality ranking</title><section id="sec_7.8.2.1"><label>7.8.2.1</label><title>Definition</title></section><section id="sec_7.8.2.2"><label>7.8.2.2</label><title>Syntax</title></section><section id="sec_7.8.2.3"><label>7.8.2.3</label><title>Semantics</title></section></section><section id="sec_7.8.3"><label>7.8.3</label><title>2D region-wise quality ranking</title><section id="sec_7.8.3.1"><label>7.8.3.1</label><title>Definition</title></section><section id="sec_7.8.3.2"><label>7.8.3.2</label><title>Syntax</title></section><section id="sec_7.8.3.3"><label>7.8.3.3</label><title>Semantics</title></section></section></section><section id="sec_7.9"><label>7.9</label><title>Storage of omnidirectional images</title><section id="sec_7.9.1"><label>7.9.1</label><title>General</title></section><section id="sec_7.9.2"><label>7.9.2</label><title>Frame packing item property</title><section id="sec_7.9.2.1"><label>7.9.2.1</label><title>Definition</title></section><section id="sec_7.9.2.2"><label>7.9.2.2</label><title>Syntax</title></section><section id="sec_7.9.2.3"><label>7.9.2.3</label><title>Semantics</title></section></section><section id="sec_7.9.3"><label>7.9.3</label><title>Projection format item property</title><section id="sec_7.9.3.1"><label>7.9.3.1</label><title>Definition</title></section><section id="sec_7.9.3.2"><label>7.9.3.2</label><title>Syntax</title></section></section><section id="sec_7.9.4"><label>7.9.4</label><title>Essential fisheye image item property</title><section id="sec_7.9.4.1"><label>7.9.4.1</label><title>General</title></section><section id="sec_7.9.4.2"><label>7.9.4.2</label><title>Definition</title></section><section id="sec_7.9.4.3"><label>7.9.4.3</label><title>Syntax</title></section><section id="sec_7.9.4.4"><label>7.9.4.4</label><title>Semantics</title></section></section><section 
id="sec_7.9.5"><label>7.9.5</label><title>Supplemental fisheye image item property</title><section id="sec_7.9.5.1"><label>7.9.5.1</label><title>Definition</title></section><section id="sec_7.9.5.2"><label>7.9.5.2</label><title>Syntax</title></section><section id="sec_7.9.5.3"><label>7.9.5.3</label><title>Semantics</title></section></section><section id="sec_7.9.6"><label>7.9.6</label><title>Region-wise packing item property</title><section id="sec_7.9.6.1"><label>7.9.6.1</label><title>Definition</title></section><section id="sec_7.9.6.2"><label>7.9.6.2</label><title>Syntax</title></section><section id="sec_7.9.6.3"><label>7.9.6.3</label><title>Semantics</title></section></section><section id="sec_7.9.7"><label>7.9.7</label><title>Rotation item property</title><section id="sec_7.9.7.1"><label>7.9.7.1</label><title>General</title></section><section id="sec_7.9.7.2"><label>7.9.7.2</label><title>Definition</title></section><section id="sec_7.9.7.3"><label>7.9.7.3</label><title>Syntax</title></section></section><section id="sec_7.9.8"><label>7.9.8</label><title>Coverage information item property</title><section id="sec_7.9.8.1"><label>7.9.8.1</label><title>General</title></section><section id="sec_7.9.8.2"><label>7.9.8.2</label><title>Definition</title></section><section id="sec_7.9.8.3"><label>7.9.8.3</label><title>Syntax</title></section></section><section id="sec_7.9.9"><label>7.9.9</label><title>Initial viewing orientation item property</title><section id="sec_7.9.9.1"><label>7.9.9.1</label><title>Definition</title></section><section id="sec_7.9.9.2"><label>7.9.9.2</label><title>Syntax</title></section><section id="sec_7.9.9.3"><label>7.9.9.3</label><title>Semantics</title></section></section></section><section id="sec_7.10"><label>7.10</label><title>Storage of timed text for omnidirectional video</title><section id="sec_7.10.1"><label>7.10.1</label><title>General</title></section><section id="sec_7.10.2"><label>7.10.2</label><title>OMAF timed text configuration 
box</title><section id="sec_7.10.2.1"><label>7.10.2.1</label><title>Definition</title></section><section id="sec_7.10.2.2"><label>7.10.2.2</label><title>Syntax</title></section><section id="sec_7.10.2.3"><label>7.10.2.3</label><title>Semantics</title></section></section><section id="sec_7.10.3"><label>7.10.3</label><title>IMSC1 tracks</title></section><section id="sec_7.10.4"><label>7.10.4</label><title>WebVTT tracks</title></section></section><section id="sec_7.11"><label>7.11</label><title>ERP region timed metadata</title><section id="sec_7.11.1"><label>7.11.1</label><title>General</title></section><section id="sec_7.11.2"><label>7.11.2</label><title>Sample entry format</title></section><section id="sec_7.11.3"><label>7.11.3</label><title>Semantics</title></section><section id="sec_7.11.4"><label>7.11.4</label><title>Sample format</title><section id="sec_7.11.4.1"><label>7.11.4.1</label><title>Definition</title></section><section id="sec_7.11.4.2"><label>7.11.4.2</label><title>Syntax</title></section><section id="sec_7.11.4.3"><label>7.11.4.3</label><title>Semantics</title></section></section><section id="sec_7.11.5"><label>7.11.5</label><title>Generating ERP region metadata</title></section></section><section id="sec_7.12"><label>7.12</label><title>Storage and signalling of viewpoints for omnidirectional video and images</title><section id="sec_7.12.1"><label>7.12.1</label><title>Viewpoint information structures</title><section id="sec_7.12.1.1"><label>7.12.1.1</label><title>Definition</title></section><section id="sec_7.12.1.2"><label>7.12.1.2</label><title>Viewpoint position structure</title></section><section id="sec_7.12.1.3"><label>7.12.1.3</label><title>Viewpoint GPS position structure</title></section><section id="sec_7.12.1.4"><label>7.12.1.4</label><title>Viewpoint geomagnetic information structure</title></section><section id="sec_7.12.1.5"><label>7.12.1.5</label><title>Viewpoint global coordinate system rotation structure</title></section><section 
id="sec_7.12.1.6"><label>7.12.1.6</label><title>Viewpoint group structure</title></section><section id="sec_7.12.1.7"><label>7.12.1.7</label><title>Viewpoint switching list structure</title><section id="sec_7.12.1.7.1"><label>7.12.1.7.1</label><title>Definition</title></section><section id="sec_7.12.1.7.2"><label>7.12.1.7.2</label><title>Syntax</title></section><section id="sec_7.12.1.7.3"><label>7.12.1.7.3</label><title>Semantics</title></section><section id="sec_7.12.1.7.4"><label>7.12.1.7.4</label><title>Viewpoint timeline switch structure</title></section><section id="sec_7.12.1.7.5"><label>7.12.1.7.5</label><title>Viewpoint switch region structure</title></section></section><section id="sec_7.12.1.8"><label>7.12.1.8</label><title>Viewpoint looping structure</title></section></section><section id="sec_7.12.2"><label>7.12.2</label><title>Viewpoint entity grouping</title><section id="sec_7.12.2.1"><label>7.12.2.1</label><title>Definition</title></section><section id="sec_7.12.2.2"><label>7.12.2.2</label><title>Syntax</title></section><section id="sec_7.12.2.3"><label>7.12.2.3</label><title>Semantics</title></section></section><section id="sec_7.12.3"><label>7.12.3</label><title>Timed metadata for viewpoints</title><section id="sec_7.12.3.1"><label>7.12.3.1</label><title>Dynamic viewpoint information</title><section id="sec_7.12.3.1.1"><label>7.12.3.1.1</label><title>General</title></section><section id="sec_7.12.3.1.2"><label>7.12.3.1.2</label><title>Sample entry</title></section><section id="sec_7.12.3.1.3"><label>7.12.3.1.3</label><title>Sample format</title></section></section><section id="sec_7.12.3.2"><label>7.12.3.2</label><title>Initial viewpoint</title><section id="sec_7.12.3.2.1"><label>7.12.3.2.1</label><title>General</title></section><section id="sec_7.12.3.2.2"><label>7.12.3.2.2</label><title>Sample entry</title></section><section id="sec_7.12.3.2.3"><label>7.12.3.2.3</label><title>Sample format</title></section></section><section 
id="sec_7.12.3.3"><label>7.12.3.3</label><title>Object centre points correspondence between viewpoints</title><section id="sec_7.12.3.3.1"><label>7.12.3.3.1</label><title>General</title></section><section id="sec_7.12.3.3.2"><label>7.12.3.3.2</label><title>Sample entry</title></section><section id="sec_7.12.3.3.3"><label>7.12.3.3.3</label><title>Sample format</title></section><section id="sec_7.12.3.3.4"><label>7.12.3.3.4</label><title>Information derivation and OMAF player behaviour</title></section></section></section></section><section id="sec_7.13"><label>7.13</label><title>Storage of omnidirectional video in sub-picture tracks</title><section id="sec_7.13.1"><label>7.13.1</label><title>General</title></section><section id="sec_7.13.2"><label>7.13.2</label><title>Projected omnidirectional video</title></section><section id="sec_7.13.3"><label>7.13.3</label><title>Indication of composition pictures being packed pictures or projected pictures</title></section><section id="sec_7.13.4"><label>7.13.4</label><title>Fisheye omnidirectional video</title></section></section><section id="sec_7.14"><label>7.14</label><title>Storage and signalling of overlays for omnidirectional video and images</title><section id="sec_7.14.1"><label>7.14.1</label><title>General</title></section><section id="sec_7.14.2"><label>7.14.2</label><title>Overlay structure</title><section id="sec_7.14.2.1"><label>7.14.2.1</label><title>Definition</title></section><section id="sec_7.14.2.2"><label>7.14.2.2</label><title>Syntax</title></section><section id="sec_7.14.2.3"><label>7.14.2.3</label><title>Semantics</title></section></section><section id="sec_7.14.3"><label>7.14.3</label><title>Overlay control structures</title><section id="sec_7.14.3.1"><label>7.14.3.1</label><title>Definition</title></section><section id="sec_7.14.3.2"><label>7.14.3.2</label><title>Viewport-relative overlay</title></section><section id="sec_7.14.3.3"><label>7.14.3.3</label><title>Sphere-relative projected 
omnidirectional overlay</title></section><section id="sec_7.14.3.4"><label>7.14.3.4</label><title>Sphere-relative two-dimensional overlay</title></section><section id="sec_7.14.3.5"><label>7.14.3.5</label><title>3D mesh overlay</title></section><section id="sec_7.14.3.6"><label>7.14.3.6</label><title>Source region for the overlay</title></section><section id="sec_7.14.3.7"><label>7.14.3.7</label><title>Overlay layering order</title></section><section id="sec_7.14.3.8"><label>7.14.3.8</label><title>Overlay opacity</title></section><section id="sec_7.14.3.9"><label>7.14.3.9</label><title>Controls for user interaction</title></section><section id="sec_7.14.3.10"><label>7.14.3.10</label><title>Overlay label</title></section><section id="sec_7.14.3.11"><label>7.14.3.11</label><title>Overlay priority</title></section><section id="sec_7.14.3.12"><label>7.14.3.12</label><title>Associated sphere region</title></section><section id="sec_7.14.3.13"><label>7.14.3.13</label><title>Overlay alpha composition</title></section><section id="sec_7.14.3.14"><label>7.14.3.14</label><title>Externally specified overlay information</title></section></section><section id="sec_7.14.4"><label>7.14.4</label><title>Overlay configuration box</title></section><section id="sec_7.14.5"><label>7.14.5</label><title>Overlay item property</title></section><section id="sec_7.14.6"><label>7.14.6</label><title>Overlay timed metadata track</title><section id="sec_7.14.6.1"><label>7.14.6.1</label><title>Definition</title></section><section id="sec_7.14.6.2"><label>7.14.6.2</label><title>Sample entry</title></section><section id="sec_7.14.6.3"><label>7.14.6.3</label><title>Sample</title></section></section><section id="sec_7.14.7"><label>7.14.7</label><title>Entity groups</title><section id="sec_7.14.7.1"><label>7.14.7.1</label><title>Grouping of overlays that are alternatives for switching</title><section id="sec_7.14.7.1.1"><label>7.14.7.1.1</label><title>Definition</title></section><section 
id="sec_7.14.7.1.2"><label>7.14.7.1.2</label><title>Syntax</title></section><section id="sec_7.14.7.1.3"><label>7.14.7.1.3</label><title>Semantics</title></section></section><section id="sec_7.14.7.2"><label>7.14.7.2</label><title>Grouping of overlays and background visual media that are intended to be presented together</title><section id="sec_7.14.7.2.1"><label>7.14.7.2.1</label><title>Definition</title></section><section id="sec_7.14.7.2.2"><label>7.14.7.2.2</label><title>Syntax</title></section><section id="sec_7.14.7.2.3"><label>7.14.7.2.3</label><title>Semantics</title></section></section></section><section id="sec_7.14.8"><label>7.14.8</label><title>Overlay alpha auxiliary image</title><section id="sec_7.14.8.1"><label>7.14.8.1</label><title>General</title></section><section id="sec_7.14.8.2"><label>7.14.8.2</label><title>Alpha auxiliary image constraints</title></section><section id="sec_7.14.8.3"><label>7.14.8.3</label><title>Alpha auxiliary video track constraints</title></section><section id="sec_7.14.8.4"><label>7.14.8.4</label><title>Alpha auxiliary image/image sequence encoding</title></section></section></section><section id="sec_7.15"><label>7.15</label><title>Signalling of viewing space information</title><section id="sec_7.15.1"><label>7.15.1</label><title>General</title></section><section id="sec_7.15.2"><label>7.15.2</label><title>Viewing space structure</title><section id="sec_7.15.2.1"><label>7.15.2.1</label><title>Definition</title></section><section id="sec_7.15.2.2"><label>7.15.2.2</label><title>Syntax</title></section><section id="sec_7.15.2.3"><label>7.15.2.3</label><title>Semantics</title></section></section><section id="sec_7.15.3"><label>7.15.3</label><title>Viewing space box</title><section id="sec_7.15.3.1"><label>7.15.3.1</label><title>Definition</title></section><section id="sec_7.15.3.2"><label>7.15.3.2</label><title>Syntax</title></section></section><section id="sec_7.15.4"><label>7.15.4</label><title>Viewing space item 
property</title><section id="sec_7.15.4.1"><label>7.15.4.1</label><title>Definition</title></section><section id="sec_7.15.4.2"><label>7.15.4.2</label><title>Syntax</title></section></section><section id="sec_7.15.5"><label>7.15.5</label><title>Time varying immersive viewing space signalling</title><section id="sec_7.15.5.1"><label>7.15.5.1</label><title>Definition</title></section><section id="sec_7.15.5.2"><label>7.15.5.2</label><title>Syntax and Semantics</title></section></section></section><section id="sec_7.16"><label>7.16</label><title>Mapping of rectangular regions to the 3D mesh</title><section id="sec_7.16.1"><label>7.16.1</label><title>General</title></section><section id="sec_7.16.2"><label>7.16.2</label><title>Tile mesh sample grouping</title><section id="sec_7.16.2.1"><label>7.16.2.1</label><title>Definition</title></section><section id="sec_7.16.2.2"><label>7.16.2.2</label><title>Syntax</title></section><section id="sec_7.16.2.3"><label>7.16.2.3</label><title>Semantics</title></section></section><section id="sec_7.16.3"><label>7.16.3</label><title>Rectangular region structure</title><section id="sec_7.16.3.1"><label>7.16.3.1</label><title>Definition</title></section><section id="sec_7.16.3.2"><label>7.16.3.2</label><title>Syntax</title></section><section id="sec_7.16.3.3"><label>7.16.3.3</label><title>Semantics</title></section></section><section id="sec_7.16.4"><label>7.16.4</label><title>Projection of a sample location onto the 3D mesh</title></section></section></section><section id="sec_8"><label>8</label><title>Omnidirectional media encapsulation and signalling in DASH</title><section id="sec_8.1"><label>8.1</label><title>Architecture of DASH delivery in OMAF</title></section><section id="sec_8.2"><label>8.2</label><title>Usage of DASH in OMAF</title><section id="sec_8.2.1"><label>8.2.1</label><title>General</title></section><section id="sec_8.2.2"><label>8.2.2</label><title>Signalling of stereoscopic frame packing</title></section><section 
id="sec_8.2.3"><label>8.2.3</label><title>Carriage of timed metadata</title><section id="sec_8.2.3.1"><label>8.2.3.1</label><title>General</title></section><section id="sec_8.2.3.2"><label>8.2.3.2</label><title>Carriage of ERP region timed metadata in DASH</title><section id="sec_8.2.3.2.1"><label>8.2.3.2.1</label><title>Constraints</title></section><section id="sec_8.2.3.2.2"><label>8.2.3.2.2</label><title>OMAF player behaviour to process ERP region metadata</title></section></section></section><section id="sec_8.2.4"><label>8.2.4</label><title>Associating Adaptation Sets or Representations with each other</title><section id="sec_8.2.4.1"><label>8.2.4.1</label><title>Individual association</title></section><section id="sec_8.2.4.2"><label>8.2.4.2</label><title>Collective association</title></section><section id="sec_8.2.4.3"><label>8.2.4.3</label><title>Overlay DASH association</title></section></section></section><section id="sec_8.3"><label>8.3</label><title>DASH MPD descriptors for omnidirectional media in the namespace "urn:mpeg:mpegI:omaf:2017"</title><section id="sec_8.3.1"><label>8.3.1</label><title>XML namespace and schema</title></section><section id="sec_8.3.2"><label>8.3.2</label><title>Signalling of projection type information</title></section><section id="sec_8.3.3"><label>8.3.3</label><title>Signalling of region-wise packing type</title></section><section id="sec_8.3.4"><label>8.3.4</label><title>Signalling of content coverage</title></section><section id="sec_8.3.5"><label>8.3.5</label><title>Signalling of spherical region-wise quality ranking</title></section><section id="sec_8.3.6"><label>8.3.6</label><title>Signalling of 2D region-wise quality ranking</title></section><section id="sec_8.3.7"><label>8.3.7</label><title>Signalling of fisheye omnidirectional video</title></section></section><section id="sec_8.4"><label>8.4</label><title>Carriage of images</title><section id="sec_8.4.1"><label>8.4.1</label><title>General</title></section><section 
id="sec_8.4.2"><label>8.4.2</label><title>Format and constraints for Segments</title></section></section><section id="sec_8.5"><label>8.5</label><title>DASH MPD descriptors for omnidirectional media in the namespace "urn:mpeg:mpegI:omaf:2020"</title><section id="sec_8.5.1"><label>8.5.1</label><title>XML namespace and schema</title></section><section id="sec_8.5.2"><label>8.5.2</label><title>Signalling of association</title></section><section id="sec_8.5.3"><label>8.5.3</label><title>Signalling of viewpoints</title></section><section id="sec_8.5.4"><label>8.5.4</label><title>Signalling of sub-picture composition identifier and its attributes</title></section><section id="sec_8.5.5"><label>8.5.5</label><title>Signalling of overlays</title></section><section id="sec_8.5.6"><label>8.5.6</label><title>Entity to group descriptor</title></section><section id="sec_8.5.7"><label>8.5.7</label><title>Content component attribute for Representation</title></section></section><section id="sec_8.6"><label>8.6</label><title>Segment formats</title><section id="sec_8.6.1"><label>8.6.1</label><title>Initialization Segment for OMAF base track</title><section id="sec_8.6.1.1"><label>8.6.1.1</label><title>General</title></section><section id="sec_8.6.1.2"><label>8.6.1.2</label><title>Stream header</title></section><section id="sec_8.6.1.3"><label>8.6.1.3</label><title>Track box format for OMAF base track</title></section><section id="sec_8.6.1.4"><label>8.6.1.4</label><title>Track box format for OMAF tile track</title></section></section><section id="sec_8.6.2"><label>8.6.2</label><title>Tile Index Segment</title></section><section id="sec_8.6.3"><label>8.6.3</label><title>Tile Data Segment</title></section></section></section><section id="sec_9"><label>9</label><title>Omnidirectional media encapsulation and signalling in MMT</title><section id="sec_9.1"><label>9.1</label><title>Architecture of MMT delivery in OMAF</title></section><section id="sec_9.2"><label>9.2</label><title>OMAF 
signalling in MPEG composition information</title></section><section id="sec_9.3"><label>9.3</label><title>VR application-specific MMT signalling</title><section id="sec_9.3.1"><label>9.3.1</label><title>General</title></section><section id="sec_9.3.2"><label>9.3.2</label><title>MMT signalling</title><section id="sec_9.3.2.1"><label>9.3.2.1</label><title>VRInformation asset descriptor</title><section id="sec_9.3.2.1.1"><label>9.3.2.1.1</label><title>General</title></section><section id="sec_9.3.2.1.2"><label>9.3.2.1.2</label><title>Syntax</title></section><section id="sec_9.3.2.1.3"><label>9.3.2.1.3</label><title>Semantics</title></section></section><section id="sec_9.3.2.2"><label>9.3.2.2</label><title>VRViewDependentSupportQuery</title><section id="sec_9.3.2.2.1"><label>9.3.2.2.1</label><title>Syntax</title></section><section id="sec_9.3.2.2.2"><label>9.3.2.2.2</label><title>Semantics</title></section></section><section id="sec_9.3.2.3"><label>9.3.2.3</label><title>VRViewDependentSupportResponse</title><section id="sec_9.3.2.3.1"><label>9.3.2.3.1</label><title>Syntax</title></section><section id="sec_9.3.2.3.2"><label>9.3.2.3.2</label><title>Semantics</title></section></section><section id="sec_9.3.2.4"><label>9.3.2.4</label><title>VRViewportChangeFeedback</title><section id="sec_9.3.2.4.1"><label>9.3.2.4.1</label><title>General</title></section><section id="sec_9.3.2.4.2"><label>9.3.2.4.2</label><title>Syntax</title></section><section id="sec_9.3.2.4.3"><label>9.3.2.4.3</label><title>Semantics</title></section></section><section id="sec_9.3.2.5"><label>9.3.2.5</label><title>VRViewDependentAssetInformation</title><section id="sec_9.3.2.5.1"><label>9.3.2.5.1</label><title>General</title></section><section id="sec_9.3.2.5.2"><label>9.3.2.5.2</label><title>Syntax</title></section><section id="sec_9.3.2.5.3"><label>9.3.2.5.3</label><title>Semantics</title></section></section><section id="sec_9.3.2.6"><label>9.3.2.6</label><title>VRROIGuide</title><section 
id="sec_9.3.2.6.1"><label>9.3.2.6.1</label><title>General</title></section><section id="sec_9.3.2.6.2"><label>9.3.2.6.2</label><title>Syntax</title></section><section id="sec_9.3.2.6.3"><label>9.3.2.6.3</label><title>Semantics</title></section></section><section id="sec_9.3.2.7"><label>9.3.2.7</label><title>Stereo video asset descriptor</title><section id="sec_9.3.2.7.1"><label>9.3.2.7.1</label><title>Syntax</title></section><section id="sec_9.3.2.7.2"><label>9.3.2.7.2</label><title>Semantics</title></section></section><section id="sec_9.3.2.8"><label>9.3.2.8</label><title>VR3DAudioAssetInformation</title><section id="sec_9.3.2.8.1"><label>9.3.2.8.1</label><title>General</title></section><section id="sec_9.3.2.8.2"><label>9.3.2.8.2</label><title>Syntax</title></section><section id="sec_9.3.2.8.3"><label>9.3.2.8.3</label><title>Semantics</title></section></section><section id="sec_9.3.2.9"><label>9.3.2.9</label><title>VR fisheye information asset descriptor</title><section id="sec_9.3.2.9.1"><label>9.3.2.9.1</label><title>General</title></section><section id="sec_9.3.2.9.2"><label>9.3.2.9.2</label><title>Syntax</title></section><section id="sec_9.3.2.9.3"><label>9.3.2.9.3</label><title>Semantics</title></section></section></section></section></section><section id="sec_10"><label>10</label><title>Media profiles</title><section id="sec_10.1"><label>10.1</label><title>Video profiles</title><section id="sec_10.1.1"><label>10.1.1</label><title>Overview</title></section><section id="sec_10.1.2"><label>10.1.2</label><title>HEVC-based viewport-independent OMAF video profile</title><section id="sec_10.1.2.1"><label>10.1.2.1</label><title>General</title></section><section id="sec_10.1.2.2"><label>10.1.2.2</label><title>Elementary stream constraints</title></section><section id="sec_10.1.2.3"><label>10.1.2.3</label><title>SEI message related ISO Base Media File Format constraints</title></section><section id="sec_10.1.2.4"><label>10.1.2.4</label><title>ISO Base Media File 
Format constraints</title></section><section id="sec_10.1.2.5"><label>10.1.2.5</label><title>File decoding process</title></section><section id="sec_10.1.2.6"><label>10.1.2.6</label><title>Expected OMAF player operation</title></section></section><section id="sec_10.1.3"><label>10.1.3</label><title>HEVC-based viewport-dependent OMAF video profile</title><section id="sec_10.1.3.1"><label>10.1.3.1</label><title>General</title></section><section id="sec_10.1.3.2"><label>10.1.3.2</label><title>Elementary stream constraints</title></section><section id="sec_10.1.3.3"><label>10.1.3.3</label><title>ISO Base Media File Format constraints</title></section><section id="sec_10.1.3.4"><label>10.1.3.4</label><title>File decoding process</title></section><section id="sec_10.1.3.5"><label>10.1.3.5</label><title>Expected OMAF player operation</title></section></section><section id="sec_10.1.4"><label>10.1.4</label><title>AVC-based viewport-dependent OMAF video profile</title><section id="sec_10.1.4.1"><label>10.1.4.1</label><title>General</title></section><section id="sec_10.1.4.2"><label>10.1.4.2</label><title>Elementary stream constraints</title></section><section id="sec_10.1.4.3"><label>10.1.4.3</label><title>ISO Base Media File Format constraints</title></section><section id="sec_10.1.4.4"><label>10.1.4.4</label><title>File decoding process</title></section><section id="sec_10.1.4.5"><label>10.1.4.5</label><title>Expected OMAF player operation</title></section></section><section id="sec_10.1.5"><label>10.1.5</label><title>Unconstrained HEVC-based viewport-independent OMAF video profile</title><section id="sec_10.1.5.1"><label>10.1.5.1</label><title>General</title></section><section id="sec_10.1.5.2"><label>10.1.5.2</label><title>Elementary stream constraints</title></section><section id="sec_10.1.5.3"><label>10.1.5.3</label><title>ISO Base Media File Format constraints</title></section><section id="sec_10.1.5.4"><label>10.1.5.4</label><title>File decoding 
process</title></section><section id="sec_10.1.5.5"><label>10.1.5.5</label><title>Expected OMAF player operation</title></section></section><section id="sec_10.1.6"><label>10.1.6</label><title>Advanced tiling OMAF video profile</title><section id="sec_10.1.6.1"><label>10.1.6.1</label><title>General</title></section><section id="sec_10.1.6.2"><label>10.1.6.2</label><title>Elementary stream constraints</title><section id="sec_10.1.6.2.1"><label>10.1.6.2.1</label><title>Bitstream constraints at the decoder</title></section><section id="sec_10.1.6.2.2"><label>10.1.6.2.2</label><title>Encoding constraints</title></section></section><section id="sec_10.1.6.3"><label>10.1.6.3</label><title>ISO base media file format constraints</title><section id="sec_10.1.6.3.1"><label>10.1.6.3.1</label><title>Stream header</title></section><section id="sec_10.1.6.3.2"><label>10.1.6.3.2</label><title>Track box format for OMAF base track and OMAF tile tracks</title></section></section><section id="sec_10.1.6.4"><label>10.1.6.4</label><title>Bitstream rewriting</title><section id="sec_10.1.6.4.1"><label>10.1.6.4.1</label><title>General</title></section><section id="sec_10.1.6.4.2"><label>10.1.6.4.2</label><title>Rewriting parameter sets</title></section><section id="sec_10.1.6.4.3"><label>10.1.6.4.3</label><title>Rewriting slice segment header and possibly NAL unit header for each VCL NAL unit</title></section></section><section id="sec_10.1.6.5"><label>10.1.6.5</label><title>Expected OMAF player operation</title></section></section><section id="sec_10.1.7"><label>10.1.7</label><title>Simple tiling OMAF video profiles</title><section id="sec_10.1.7.1"><label>10.1.7.1</label><title>General</title></section><section id="sec_10.1.7.2"><label>10.1.7.2</label><title>Elementary stream constraints</title><section id="sec_10.1.7.2.1"><label>10.1.7.2.1</label><title>HEVC elementary stream constraints</title></section><section id="sec_10.1.7.2.2"><label>10.1.7.2.2</label><title>VVC elementary stream 
constraints</title></section></section><section id="sec_10.1.7.3"><label>10.1.7.3</label><title>ISO Base Media File Format constraints</title><section id="sec_10.1.7.3.1"><label>10.1.7.3.1</label><title>Stream header</title></section><section id="sec_10.1.7.3.2"><label>10.1.7.3.2</label><title>Track box format for OMAF base track and OMAF tile tracks</title></section><section id="sec_10.1.7.3.3"><label>10.1.7.3.3</label><title>Other constraints</title></section></section><section id="sec_10.1.7.4"><label>10.1.7.4</label><title>File decoding process</title></section><section id="sec_10.1.7.5"><label>10.1.7.5</label><title>Expected OMAF player operation</title></section></section><section id="sec_10.1.8"><label>10.1.8</label><title>VVC-based viewport-independent OMAF video profile</title><section id="sec_10.1.8.1"><label>10.1.8.1</label><title>General</title></section><section id="sec_10.1.8.2"><label>10.1.8.2</label><title>Elementary stream constraints</title></section><section id="sec_10.1.8.3"><label>10.1.8.3</label><title>SEI message related ISO Base Media File Format constraints</title></section><section id="sec_10.1.8.4"><label>10.1.8.4</label><title>ISO Base Media File Format constraints</title></section><section id="sec_10.1.8.5"><label>10.1.8.5</label><title>File decoding process</title></section><section id="sec_10.1.8.6"><label>10.1.8.6</label><title>Expected OMAF player operation</title></section></section></section><section id="sec_10.2"><label>10.2</label><title>Audio profiles</title><section id="sec_10.2.1"><label>10.2.1</label><title>Overview</title></section><section id="sec_10.2.2"><label>10.2.2</label><title>OMAF 3D audio baseline profile</title><section id="sec_10.2.2.1"><label>10.2.2.1</label><title>General</title></section><section id="sec_10.2.2.2"><label>10.2.2.2</label><title>Elementary stream constraints</title></section><section id="sec_10.2.2.3"><label>10.2.2.3</label><title>ISO Base Media File Format constraints</title><section 
id="sec_10.2.2.3.1"><label>10.2.2.3.1</label><title>General constraints</title></section><section id="sec_10.2.2.3.2"><label>10.2.2.3.2</label><title>Configuration change constraints</title></section><section id="sec_10.2.2.3.3"><label>10.2.2.3.3</label><title>Multi-stream constraints</title></section><section id="sec_10.2.2.3.4"><label>10.2.2.3.4</label><title>Loudness and dynamic range control</title></section></section></section><section id="sec_10.2.3"><label>10.2.3</label><title>OMAF 2D audio legacy profile</title><section id="sec_10.2.3.1"><label>10.2.3.1</label><title>General</title></section><section id="sec_10.2.3.2"><label>10.2.3.2</label><title>Elementary stream constraints</title><section id="sec_10.2.3.2.1"><label>10.2.3.2.1</label><title>General encoding constraints</title></section><section id="sec_10.2.3.2.2"><label>10.2.3.2.2</label><title>Syntax and values of syntactic elements</title></section><section id="sec_10.2.3.2.3"><label>10.2.3.2.3</label><title>AAC presentation timing</title></section><section id="sec_10.2.3.2.4"><label>10.2.3.2.4</label><title>Loudness and dynamic range control</title></section><section id="sec_10.2.3.2.5"><label>10.2.3.2.5</label><title>Maximum bitrate</title></section></section><section id="sec_10.2.3.3"><label>10.2.3.3</label><title>ISO Base Media File Format constraints</title><section id="sec_10.2.3.3.1"><label>10.2.3.3.1</label><title>Storage of AAC media samples</title></section><section id="sec_10.2.3.3.2"><label>10.2.3.3.2</label><title>AAC audio sample entry</title><section id="sec_10.2.3.3.2.1"><label>10.2.3.3.2.1</label><title>ES_Descriptor</title></section><section id="sec_10.2.3.3.2.2"><label>10.2.3.3.2.2</label><title>DecoderConfigDescriptor</title></section><section id="sec_10.2.3.3.2.3"><label>10.2.3.3.2.3</label><title>AudioSpecificConfig</title></section><section id="sec_10.2.3.3.2.4"><label>10.2.3.3.2.4</label><title>GASpecificConfig</title></section></section></section></section></section><section 
id="sec_10.3"><label>10.3</label><title>Image profiles</title><section id="sec_10.3.1"><label>10.3.1</label><title>Overview</title></section><section id="sec_10.3.2"><label>10.3.2</label><title>Common specifications for image profiles</title><section id="sec_10.3.2.1"><label>10.3.2.1</label><title>General</title></section><section id="sec_10.3.2.2"><label>10.3.2.2</label><title>ISO Base Media File Format constraints for an image item conforming to an OMAF image profile</title></section><section id="sec_10.3.2.3"><label>10.3.2.3</label><title>ISO Base Media File Format constraints for a file conforming to an OMAF image profile</title></section></section><section id="sec_10.3.3"><label>10.3.3</label><title>OMAF HEVC image profile</title><section id="sec_10.3.3.1"><label>10.3.3.1</label><title>General</title></section><section id="sec_10.3.3.2"><label>10.3.3.2</label><title>Elementary stream constraints</title></section><section id="sec_10.3.3.3"><label>10.3.3.3</label><title>ISO Base Media File Format constraints</title></section><section id="sec_10.3.3.4"><label>10.3.3.4</label><title>File decoding process</title></section><section id="sec_10.3.3.5"><label>10.3.3.5</label><title>Recommendations and requirements for OMAF player</title></section></section><section id="sec_10.3.4"><label>10.3.4</label><title>OMAF legacy image profile</title><section id="sec_10.3.4.1"><label>10.3.4.1</label><title>General</title></section><section id="sec_10.3.4.2"><label>10.3.4.2</label><title>Elementary stream constraints</title></section><section id="sec_10.3.4.3"><label>10.3.4.3</label><title>ISO Base Media File Format constraints</title></section><section id="sec_10.3.4.4"><label>10.3.4.4</label><title>File decoding process</title></section><section id="sec_10.3.4.5"><label>10.3.4.5</label><title>Recommendations and requirements for OMAF player</title></section></section><section id="sec_10.3.5"><label>10.3.5</label><title>OMAF VVC image profile</title><section 
id="sec_10.3.5.1"><label>10.3.5.1</label><title>General</title></section><section id="sec_10.3.5.2"><label>10.3.5.2</label><title>Elementary stream constraints</title></section><section id="sec_10.3.5.3"><label>10.3.5.3</label><title>ISO Base Media File Format constraints</title></section><section id="sec_10.3.5.4"><label>10.3.5.4</label><title>File decoding process</title></section><section id="sec_10.3.5.5"><label>10.3.5.5</label><title>Recommendations and requirements for OMAF player</title></section></section></section><section id="sec_10.4"><label>10.4</label><title>Timed text profiles</title><section id="sec_10.4.1"><label>10.4.1</label><title>Overview</title></section><section id="sec_10.4.2"><label>10.4.2</label><title>OMAF IMSC1 timed text profile</title><section id="sec_10.4.2.1"><label>10.4.2.1</label><title>Elementary stream constraints</title></section><section id="sec_10.4.2.2"><label>10.4.2.2</label><title>ISO Base Media File Format constraints</title></section></section><section id="sec_10.4.3"><label>10.4.3</label><title>OMAF WebVTT timed text profile</title><section id="sec_10.4.3.1"><label>10.4.3.1</label><title>Elementary stream constraints</title></section><section id="sec_10.4.3.2"><label>10.4.3.2</label><title>ISO Base Media File Format constraints</title></section></section></section></section><section id="sec_11"><label>11</label><title>Presentation profiles</title><section id="sec_11.1"><label>11.1</label><title>OMAF viewport-independent baseline presentation profile</title><section id="sec_11.1.1"><label>11.1.1</label><title>General</title></section><section id="sec_11.1.2"><label>11.1.2</label><title>ISO Base Media File Format constraints</title></section></section><section id="sec_11.2"><label>11.2</label><title>OMAF viewport-dependent baseline presentation profile</title><section id="sec_11.2.1"><label>11.2.1</label><title>General</title></section><section id="sec_11.2.2"><label>11.2.2</label><title>ISO Base Media File Format 
constraints</title></section></section></section><section id="sec_12"><label>12</label><title>OMAF toolset brands</title><section id="sec_12.1"><label>12.1</label><title>Overlay toolset brand</title><section id="sec_12.1.1"><label>12.1.1</label><title>Overview</title></section><section id="sec_12.1.2"><label>12.1.2</label><title>ISO Base Media File Format constraints</title></section><section id="sec_12.1.3"><label>12.1.3</label><title>OMAF player operation</title></section></section><section id="sec_12.2"><label>12.2</label><title>Viewpoint toolset brand</title><section id="sec_12.2.1"><label>12.2.1</label><title>Overview</title></section><section id="sec_12.2.2"><label>12.2.2</label><title>ISO Base Media File Format constraints</title></section><section id="sec_12.2.3"><label>12.2.3</label><title>OMAF player operation</title></section></section><section id="sec_12.3"><label>12.3</label><title>Non-linear storyline toolset brand</title><section id="sec_12.3.1"><label>12.3.1</label><title>Overview</title></section><section id="sec_12.3.2"><label>12.3.2</label><title>ISO Base Media File Format constraints</title></section><section id="sec_12.3.3"><label>12.3.3</label><title>OMAF player operation</title></section></section></section><section id="sec_A"><label>Annex A</label><title>OMAF DASH schema (normative)</title></section><section id="sec_B"><label>Annex B</label><title>DASH integration of media profiles (normative)</title><section id="sec_B.1"><label>B.1</label><title>Video profiles</title><section id="sec_B.1.1"><label>B.1.1</label><title>HEVC-based viewport-independent OMAF video profile</title></section><section id="sec_B.1.2"><label>B.1.2</label><title>Viewport-dependent delivery of AVC, HEVC, and VVC without Index Segments</title><section id="sec_B.1.2.1"><label>B.1.2.1</label><title>General</title></section><section id="sec_B.1.2.2"><label>B.1.2.2</label><title>Specifications for 'hvc2', 'avc2', and 'avc4' sample entry types and for 'vvc1' merge base 
tracks</title></section></section><section id="sec_B.1.3"><label>B.1.3</label><title>Unconstrained HEVC-based viewport-independent OMAF video profile</title></section><section id="sec_B.1.4"><label>B.1.4</label><title>OMAF tiling video profiles</title><section id="sec_B.1.4.1"><label>B.1.4.1</label><title>General</title></section><section id="sec_B.1.4.2"><label>B.1.4.2</label><title>Specifications for the advanced tiling OMAF video profile</title></section><section id="sec_B.1.4.3"><label>B.1.4.3</label><title>Specifications for the simple tiling OMAF video profiles</title></section><section id="sec_B.1.4.4"><label>B.1.4.4</label><title>Tile Index Segment</title></section><section id="sec_B.1.4.5"><label>B.1.4.5</label><title>Expected player operation</title></section></section></section><section id="sec_B.2"><label>B.2</label><title>Audio profiles</title><section id="sec_B.2.1"><label>B.2.1</label><title>OMAF 3D audio baseline profile</title><section id="sec_B.2.1.1"><label>B.2.1.1</label><title>General</title></section><section id="sec_B.2.1.2"><label>B.2.1.2</label><title>Element and attribute settings</title></section></section><section id="sec_B.2.2"><label>B.2.2</label><title>OMAF 2D audio legacy profile</title></section></section><section id="sec_B.3"><label>B.3</label><title>Timed text profiles</title><section id="sec_B.3.1"><label>B.3.1</label><title>OMAF IMSC1 timed text profile</title></section><section id="sec_B.3.2"><label>B.3.2</label><title>OMAF WebVTT timed text profile</title></section></section></section><section id="sec_C"><label>Annex C</label><title>CMAF integration of media profiles (normative)</title><section id="sec_C.1"><label>C.1</label><title>Video profiles</title><section id="sec_C.1.1"><label>C.1.1</label><title>HEVC-based viewport-independent OMAF video profile</title></section><section id="sec_C.1.2"><label>C.1.2</label><title>HEVC-based viewport-dependent OMAF video profile</title></section><section 
id="sec_C.1.3"><label>C.1.3</label><title>Unconstrained HEVC-based viewport-independent OMAF video profile</title></section><section id="sec_C.1.4"><label>C.1.4</label><title>VVC-based viewport-independent OMAF video profile</title></section></section><section id="sec_C.2"><label>C.2</label><title>Audio profiles</title><section id="sec_C.2.1"><label>C.2.1</label><title>OMAF 3D audio baseline profile</title></section></section></section><section id="sec_D"><label>Annex D</label><title>Viewport-dependent omnidirectional video processing (informative)</title><section id="sec_D.1"><label>D.1</label><title>General</title></section><section id="sec_D.2"><label>D.2</label><title>Region-wise quality ranked encoding of omnidirectional content</title></section><section id="sec_D.3"><label>D.3</label><title>Sub-picture bitstreams</title></section><section id="sec_D.4"><label>D.4</label><title>Equal-resolution OMAF tile bitstreams merged to one bitstream</title><section id="sec_D.4.1"><label>D.4.1</label><title>General</title></section><section id="sec_D.4.2"><label>D.4.2</label><title>MCTS-based approach for HEVC</title></section><section id="sec_D.4.3"><label>D.4.3</label><title>Slice-based approach for AVC</title></section><section id="sec_D.4.4"><label>D.4.4</label><title>Approach based on independent VVC subpictures</title></section></section><section id="sec_D.5"><label>D.5</label><title>OMAF tile bitstreams merged resolution-wise</title><section id="sec_D.5.1"><label>D.5.1</label><title>General</title></section><section id="sec_D.5.2"><label>D.5.2</label><title>HEVC MCTS sub-picture bitstreams merged resolution-wise</title></section><section id="sec_D.5.3"><label>D.5.3</label><title>Independent VVC subpictures merged resolution-wise</title></section></section><section id="sec_D.6"><label>D.6</label><title>OMAF tile bitstreams with several resolutions merged to one bitstream</title><section id="sec_D.6.1"><label>D.6.1</label><title>General</title></section><section 
id="sec_D.6.2"><label>D.6.2</label><title>MCTS-based approach for achieving 5K effective ERP resolution with HEVC-based viewport-dependent OMAF video profile</title></section><section id="sec_D.6.3"><label>D.6.3</label><title>MCTS-based approach for achieving 6K effective ERP resolution with HEVC-based viewport-dependent OMAF video profile</title></section><section id="sec_D.6.4"><label>D.6.4</label><title>MCTS-based approach for achieving 6K effective cubemap resolution with HEVC-based viewport-dependent OMAF video profile</title></section><section id="sec_D.6.5"><label>D.6.5</label><title>Slice-based approach for achieving 5K effective ERP resolution with AVC-based viewport-dependent OMAF video profile</title></section><section id="sec_D.6.6"><label>D.6.6</label><title>MCTS-based approach for the use of ERP with the HEVC-based simple tiling OMAF video profile</title></section><section id="sec_D.6.7"><label>D.6.7</label><title>MCTS-based approach for the use of cubemap with the HEVC-based simple tiling OMAF video profile</title></section><section id="sec_D.6.8"><label>D.6.8</label><title>MCTS-based approach for the use of cubemap with the advanced tiling OMAF video profile</title></section><section id="sec_D.6.9"><label>D.6.9</label><title>Subpicture-based approach for the use of ERP with the VVC-based simple tiling OMAF video profile</title></section><section id="sec_D.6.10"><label>D.6.10</label><title>Approach based on the use of independent VVC subpictures and cubemap with the VVC-based simple tiling OMAF video profile</title></section></section><section id="sec_D.7"><label>D.7</label><title>Omnidirectional single-layer content and OMAF tile bitstreams</title></section><section id="sec_D.8"><label>D.8</label><title>Spatial merging of omnidirectional picture(s) and content for viewports</title></section><section id="sec_D.9"><label>D.9</label><title>Single stream delivery of spatially packed viewport-dependent content</title><section 
id="sec_D.9.1"><label>D.9.1</label><title>General</title></section><section id="sec_D.9.2"><label>D.9.2</label><title>Omnidirectional picture(s) and content for viewports</title></section></section><section id="sec_D.10"><label>D.10</label><title>Representations with different stream access point intervals</title><section id="sec_D.10.1"><label>D.10.1</label><title>Overview</title></section><section id="sec_D.10.2"><label>D.10.2</label><title>Using stream access points for viewport switching</title></section><section id="sec_D.10.3"><label>D.10.3</label><title>Using switching points for viewport switching</title></section><section id="sec_D.10.4"><label>D.10.4</label><title>Using VVC subpictures for viewport switching</title></section></section><section id="sec_D.11"><label>D.11</label><title>Viewport-dependent omnidirectional video streaming based on massively overlapping and greater-than-FOV sub-pictures and picture-by-picture shifting RAPs</title></section><section id="sec_D.12"><label>D.12</label><title>Comparison of different omnidirectional video coding schemes</title></section></section><section id="sec_E"><label>Annex E</label><title>DASH MPD examples (informative)</title><section id="sec_E.1"><label>E.1</label><title>General</title></section><section id="sec_E.2"><label>E.2</label><title>Single bitstream delivery</title></section><section id="sec_E.3"><label>E.3</label><title>Sub-picture bitstreams delivery</title></section><section id="sec_E.4"><label>E.4</label><title>Timed metadata delivery</title></section><section id="sec_E.5"><label>E.5</label><title>Region-based playback of omnidirectional media</title></section></section><section id="sec_F"><label>Annex F</label><title>MMT signalling examples (informative)</title><section id="sec_F.1"><label>F.1</label><title>General</title></section><section id="sec_F.2"><label>F.2</label><title>Single packed stream delivery</title></section></section><section id="sec_G"><label>Annex G</label><title>Expected 
behaviour of OMAF player (normative)</title><section id="sec_G.1"><label>G.1</label><title>General</title></section><section id="sec_G.2"><label>G.2</label><title>Rendering procedure for timed text</title></section><section id="sec_G.3"><label>G.3</label><title>Processing of overlay control structure</title></section><section id="sec_G.4"><label>G.4</label><title>Sphere-relative overlay rendering procedure</title></section><section id="sec_G.5"><label>G.5</label><title>Viewport-relative overlay rendering procedure</title></section><section id="sec_G.6"><label>G.6</label><title>Overlay source region access procedure</title></section><section id="sec_G.7"><label>G.7</label><title>Procedure for handling user interactions with overlays</title></section><section id="sec_G.8"><label>G.8</label><title>Expected player behaviour for handling viewpoints</title><section id="sec_G.8.1"><label>G.8.1</label><title>Expected player behaviour based on signalling in DASH MPD</title></section><section id="sec_G.8.2"><label>G.8.2</label><title>Expected player behaviour based on signalling in ISOBMFF</title><section id="sec_G.8.2.1"><label>G.8.2.1</label><title>General</title></section><section id="sec_G.8.2.2"><label>G.8.2.2</label><title>Viewpoint positioning</title></section><section id="sec_G.8.2.3"><label>G.8.2.3</label><title>Viewpoint switching</title></section><section id="sec_G.8.2.4"><label>G.8.2.4</label><title>Viewpoint looping</title></section></section></section></section><section id="sec_bibl"><title>Bibliography</title></section></toc>