Home | History | Annotate | Download | only in media
      1 /*
      2  * Copyright (C) 2012 The Android Open Source Project
      3  *
      4  * Licensed under the Apache License, Version 2.0 (the "License");
      5  * you may not use this file except in compliance with the License.
      6  * You may obtain a copy of the License at
      7  *
      8  *      http://www.apache.org/licenses/LICENSE-2.0
      9  *
     10  * Unless required by applicable law or agreed to in writing, software
     11  * distributed under the License is distributed on an "AS IS" BASIS,
     12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
     13  * See the License for the specific language governing permissions and
     14  * limitations under the License.
     15  */
     16 
     17 package android.media;
     18 
     19 import android.annotation.IntDef;
     20 
     21 import java.lang.annotation.Retention;
     22 import java.lang.annotation.RetentionPolicy;
     23 import java.nio.ByteBuffer;
     24 import java.util.HashMap;
     25 import java.util.Map;
     26 
     27 /**
     28  * Encapsulates the information describing the format of media data,
     29  * be it audio or video.
     30  *
     31  * The format of the media data is specified as string/value pairs.
     32  *
     33  * Keys common to all audio/video formats, <b>all keys not marked optional are mandatory</b>:
     34  *
     35  * <table>
     36  * <tr><th>Name</th><th>Value Type</th><th>Description</th></tr>
     37  * <tr><td>{@link #KEY_MIME}</td><td>String</td><td>The type of the format.</td></tr>
     38  * <tr><td>{@link #KEY_MAX_INPUT_SIZE}</td><td>Integer</td><td>optional, maximum size of a buffer of input data</td></tr>
     39  * <tr><td>{@link #KEY_BIT_RATE}</td><td>Integer</td><td><b>encoder-only</b>, desired bitrate in bits/second</td></tr>
     40  * </table>
     41  *
     42  * Video formats have the following keys:
     43  * <table>
     44  * <tr><th>Name</th><th>Value Type</th><th>Description</th></tr>
     45  * <tr><td>{@link #KEY_WIDTH}</td><td>Integer</td><td></td></tr>
     46  * <tr><td>{@link #KEY_HEIGHT}</td><td>Integer</td><td></td></tr>
     47  * <tr><td>{@link #KEY_COLOR_FORMAT}</td><td>Integer</td><td>set by the user
     48  *         for encoders, readable in the output format of decoders</td></tr>
     49  * <tr><td>{@link #KEY_FRAME_RATE}</td><td>Integer or Float</td><td>required for <b>encoders</b>,
     50  *         optional for <b>decoders</b></td></tr>
     51  * <tr><td>{@link #KEY_CAPTURE_RATE}</td><td>Integer or Float</td><td></td></tr>
     52  * <tr><td>{@link #KEY_I_FRAME_INTERVAL}</td><td>Integer (or Float)</td><td><b>encoder-only</b>,
     53  *         time-interval between key frames.
     54  *         Float support added in {@link android.os.Build.VERSION_CODES#N_MR1}</td></tr>
     55  * <tr><td>{@link #KEY_INTRA_REFRESH_PERIOD}</td><td>Integer</td><td><b>encoder-only</b>, optional</td></tr>
     56  * <tr><td>{@link #KEY_MAX_WIDTH}</td><td>Integer</td><td><b>decoder-only</b>, optional, max-resolution width</td></tr>
     57  * <tr><td>{@link #KEY_MAX_HEIGHT}</td><td>Integer</td><td><b>decoder-only</b>, optional, max-resolution height</td></tr>
     58  * <tr><td>{@link #KEY_REPEAT_PREVIOUS_FRAME_AFTER}</td><td>Long</td><td><b>encoder in surface-mode
     59  *         only</b>, optional</td></tr>
     60  * <tr><td>{@link #KEY_PUSH_BLANK_BUFFERS_ON_STOP}</td><td>Integer(1)</td><td><b>decoder rendering
     61  *         to a surface only</b>, optional</td></tr>
     62  * <tr><td>{@link #KEY_TEMPORAL_LAYERING}</td><td>String</td><td><b>encoder only</b>, optional,
     63  *         temporal-layering schema</td></tr>
     64  * </table>
     65  * Specify both {@link #KEY_MAX_WIDTH} and {@link #KEY_MAX_HEIGHT} to enable
     66  * adaptive playback (seamless resolution change) for a video decoder that
     67  * supports it ({@link MediaCodecInfo.CodecCapabilities#FEATURE_AdaptivePlayback}).
     68  * The values are used as hints for the codec: they are the maximum expected
     69  * resolution to prepare for.  Depending on codec support, preparing for larger
     70  * maximum resolution may require more memory even if that resolution is never
     71  * reached.  These fields have no effect for codecs that do not support adaptive
     72  * playback.<br /><br />
     73  *
     74  * Audio formats have the following keys:
     75  * <table>
     76  * <tr><th>Name</th><th>Value Type</th><th>Description</th></tr>
     77  * <tr><td>{@link #KEY_CHANNEL_COUNT}</td><td>Integer</td><td></td></tr>
     78  * <tr><td>{@link #KEY_SAMPLE_RATE}</td><td>Integer</td><td></td></tr>
     79  * <tr><td>{@link #KEY_PCM_ENCODING}</td><td>Integer</td><td>optional</td></tr>
     80  * <tr><td>{@link #KEY_IS_ADTS}</td><td>Integer</td><td>optional, if <em>decoding</em> AAC audio content, setting this key to 1 indicates that each audio frame is prefixed by the ADTS header.</td></tr>
     81  * <tr><td>{@link #KEY_AAC_PROFILE}</td><td>Integer</td><td><b>encoder-only</b>, optional, if content is AAC audio, specifies the desired profile.</td></tr>
     82  * <tr><td>{@link #KEY_AAC_SBR_MODE}</td><td>Integer</td><td><b>encoder-only</b>, optional, if content is AAC audio, specifies the desired SBR mode.</td></tr>
     83  * <tr><td>{@link #KEY_AAC_DRC_TARGET_REFERENCE_LEVEL}</td><td>Integer</td><td><b>decoder-only</b>, optional, if content is AAC audio, specifies the target reference level.</td></tr>
     84  * <tr><td>{@link #KEY_AAC_ENCODED_TARGET_LEVEL}</td><td>Integer</td><td><b>decoder-only</b>, optional, if content is AAC audio, specifies the target reference level used at encoder.</td></tr>
     85  * <tr><td>{@link #KEY_AAC_DRC_BOOST_FACTOR}</td><td>Integer</td><td><b>decoder-only</b>, optional, if content is AAC audio, specifies the DRC boost factor.</td></tr>
     86  * <tr><td>{@link #KEY_AAC_DRC_ATTENUATION_FACTOR}</td><td>Integer</td><td><b>decoder-only</b>, optional, if content is AAC audio, specifies the DRC attenuation factor.</td></tr>
     87  * <tr><td>{@link #KEY_AAC_DRC_HEAVY_COMPRESSION}</td><td>Integer</td><td><b>decoder-only</b>, optional, if content is AAC audio, specifies whether to use heavy compression.</td></tr>
     88  * <tr><td>{@link #KEY_AAC_MAX_OUTPUT_CHANNEL_COUNT}</td><td>Integer</td><td><b>decoder-only</b>, optional, if content is AAC audio, specifies the maximum number of channels the decoder outputs.</td></tr>
     89  * <tr><td>{@link #KEY_CHANNEL_MASK}</td><td>Integer</td><td>optional, a mask of audio channel assignments</td></tr>
     90  * <tr><td>{@link #KEY_FLAC_COMPRESSION_LEVEL}</td><td>Integer</td><td><b>encoder-only</b>, optional, if content is FLAC audio, specifies the desired compression level.</td></tr>
     91  * </table>
     92  *
     93  * Subtitle formats have the following keys:
     94  * <table>
     95  * <tr><td>{@link #KEY_MIME}</td><td>String</td><td>The type of the format.</td></tr>
     96  * <tr><td>{@link #KEY_LANGUAGE}</td><td>String</td><td>The language of the content.</td></tr>
     97  * </table>
     98  */
     99 public final class MediaFormat {
    100     public static final String MIMETYPE_VIDEO_VP8 = "video/x-vnd.on2.vp8";
    101     public static final String MIMETYPE_VIDEO_VP9 = "video/x-vnd.on2.vp9";
    102     public static final String MIMETYPE_VIDEO_AVC = "video/avc";
    103     public static final String MIMETYPE_VIDEO_HEVC = "video/hevc";
    104     public static final String MIMETYPE_VIDEO_MPEG4 = "video/mp4v-es";
    105     public static final String MIMETYPE_VIDEO_H263 = "video/3gpp";
    106     public static final String MIMETYPE_VIDEO_MPEG2 = "video/mpeg2";
    107     public static final String MIMETYPE_VIDEO_RAW = "video/raw";
    108 
    109     public static final String MIMETYPE_AUDIO_AMR_NB = "audio/3gpp";
    110     public static final String MIMETYPE_AUDIO_AMR_WB = "audio/amr-wb";
    111     public static final String MIMETYPE_AUDIO_MPEG = "audio/mpeg";
    112     public static final String MIMETYPE_AUDIO_AAC = "audio/mp4a-latm";
    113     public static final String MIMETYPE_AUDIO_QCELP = "audio/qcelp";
    114     public static final String MIMETYPE_AUDIO_VORBIS = "audio/vorbis";
    115     public static final String MIMETYPE_AUDIO_OPUS = "audio/opus";
    116     public static final String MIMETYPE_AUDIO_G711_ALAW = "audio/g711-alaw";
    117     public static final String MIMETYPE_AUDIO_G711_MLAW = "audio/g711-mlaw";
    118     public static final String MIMETYPE_AUDIO_RAW = "audio/raw";
    119     public static final String MIMETYPE_AUDIO_FLAC = "audio/flac";
    120     public static final String MIMETYPE_AUDIO_MSGSM = "audio/gsm";
    121     public static final String MIMETYPE_AUDIO_AC3 = "audio/ac3";
    122     public static final String MIMETYPE_AUDIO_EAC3 = "audio/eac3";
    123     public static final String MIMETYPE_VIDEO_DOLBY_VISION = "video/dolby-vision";
    124 
    125     /**
    126      * MIME type for WebVTT subtitle data.
    127      */
    128     public static final String MIMETYPE_TEXT_VTT = "text/vtt";
    129 
    130     /**
    131      * MIME type for CEA-608 closed caption data.
    132      */
    133     public static final String MIMETYPE_TEXT_CEA_608 = "text/cea-608";
    134 
    135     private Map<String, Object> mMap;
    136 
    137     /**
    138      * A key describing the mime type of the MediaFormat.
    139      * The associated value is a string.
    140      */
    141     public static final String KEY_MIME = "mime";
    142 
    143     /**
    144      * A key describing the language of the content, using either ISO 639-1
    145      * or 639-2/T codes.  The associated value is a string.
    146      */
    147     public static final String KEY_LANGUAGE = "language";
    148 
    149     /**
    150      * A key describing the sample rate of an audio format.
    151      * The associated value is an integer
    152      */
    153     public static final String KEY_SAMPLE_RATE = "sample-rate";
    154 
    155     /**
    156      * A key describing the number of channels in an audio format.
    157      * The associated value is an integer
    158      */
    159     public static final String KEY_CHANNEL_COUNT = "channel-count";
    160 
    161     /**
    162      * A key describing the width of the content in a video format.
    163      * The associated value is an integer
    164      */
    165     public static final String KEY_WIDTH = "width";
    166 
    167     /**
    168      * A key describing the height of the content in a video format.
    169      * The associated value is an integer
    170      */
    171     public static final String KEY_HEIGHT = "height";
    172 
    173     /**
    174      * A key describing the maximum expected width of the content in a video
    175      * decoder format, in case there are resolution changes in the video content.
    176      * The associated value is an integer
    177      */
    178     public static final String KEY_MAX_WIDTH = "max-width";
    179 
    180     /**
    181      * A key describing the maximum expected height of the content in a video
    182      * decoder format, in case there are resolution changes in the video content.
    183      * The associated value is an integer
    184      */
    185     public static final String KEY_MAX_HEIGHT = "max-height";
    186 
    187     /** A key describing the maximum size in bytes of a buffer of data
    188      * described by this MediaFormat.
    189      * The associated value is an integer
    190      */
    191     public static final String KEY_MAX_INPUT_SIZE = "max-input-size";
    192 
    193     /**
    194      * A key describing the average bitrate in bits/sec.
    195      * The associated value is an integer
    196      */
    197     public static final String KEY_BIT_RATE = "bitrate";
    198 
    199     /**
    200      * A key describing the max bitrate in bits/sec.
    201      * This is usually over a one-second sliding window (i.e. over any window of one second).
    202      * The associated value is an integer
    203      * @hide
    204      */
    205     public static final String KEY_MAX_BIT_RATE = "max-bitrate";
    206 
    207     /**
    208      * A key describing the color format of the content in a video format.
    209      * Constants are declared in {@link android.media.MediaCodecInfo.CodecCapabilities}.
    210      */
    211     public static final String KEY_COLOR_FORMAT = "color-format";
    212 
    213     /**
    214      * A key describing the frame rate of a video format in frames/sec.
    215      * The associated value is normally an integer when the value is used by the platform,
    216      * but video codecs also accept float configuration values.
    217      * Specifically, {@link MediaExtractor#getTrackFormat MediaExtractor} provides an integer
    218      * value corresponding to the frame rate information of the track if specified and non-zero.
    219      * Otherwise, this key is not present. {@link MediaCodec#configure MediaCodec} accepts both
    220      * float and integer values. This represents the desired operating frame rate if the
    221      * {@link #KEY_OPERATING_RATE} is not present and {@link #KEY_PRIORITY} is {@code 0}
    222      * (realtime). For video encoders this value corresponds to the intended frame rate,
    223      * although encoders are expected
    224      * to support variable frame rate based on {@link MediaCodec.BufferInfo#presentationTimeUs
    225      * buffer timestamp}. This key is not used in the {@code MediaCodec}
    226      * {@link MediaCodec#getInputFormat input}/{@link MediaCodec#getOutputFormat output} formats,
    227      * nor by {@link MediaMuxer#addTrack MediaMuxer}.
    228      */
    229     public static final String KEY_FRAME_RATE = "frame-rate";
    230 
    231     /**
    232      * A key describing the raw audio sample encoding/format.
    233      *
    234      * <p>The associated value is an integer, using one of the
    235      * {@link AudioFormat}.ENCODING_PCM_ values.</p>
    236      *
    237      * <p>This is an optional key for audio decoders and encoders specifying the
    238      * desired raw audio sample format during {@link MediaCodec#configure
    239      * MediaCodec.configure(&hellip;)} call. Use {@link MediaCodec#getInputFormat
    240      * MediaCodec.getInput}/{@link MediaCodec#getOutputFormat OutputFormat(&hellip;)}
    241      * to confirm the actual format. For the PCM decoder this key specifies both
    242      * input and output sample encodings.</p>
    243      *
    244      * <p>This key is also used by {@link MediaExtractor} to specify the sample
    245      * format of audio data, if it is specified.</p>
    246      *
    247      * <p>If this key is missing, the raw audio sample format is signed 16-bit short.</p>
    248      */
    249     public static final String KEY_PCM_ENCODING = "pcm-encoding";
    250 
    251     /**
    252      * A key describing the capture rate of a video format in frames/sec.
    253      * <p>
    254      * When capture rate is different than the frame rate, it means that the
    255      * video is acquired at a different rate than the playback, which produces
    256      * slow motion or timelapse effect during playback. Application can use the
    257      * value of this key to tell the relative speed ratio between capture and
    258      * playback rates when the video was recorded.
    259      * </p>
    260      * <p>
    261      * The associated value is an integer or a float.
    262      * </p>
    263      */
    264     public static final String KEY_CAPTURE_RATE = "capture-rate";
    265 
    266     /**
    267      * A key describing the frequency of key frames expressed in seconds between key frames.
    268      * <p>
    269      * This key is used by video encoders.
    270      * A negative value means no key frames are requested after the first frame.
    271      * A zero value means a stream containing all key frames is requested.
    272      * <p class=note>
    273      * Most video encoders will convert this value to the number of non-key-frames between
    274      * key-frames, using the {@linkplain #KEY_FRAME_RATE frame rate} information; therefore,
    275      * if the actual frame rate differs (e.g. input frames are dropped or the frame rate
    276      * changes), the <strong>time interval</strong> between key frames will not be the
    277      * configured value.
    278      * <p>
    279      * The associated value is an integer (or float since
    280      * {@link android.os.Build.VERSION_CODES#N_MR1}).
    281      */
    282     public static final String KEY_I_FRAME_INTERVAL = "i-frame-interval";
    283 
    284     /**
    285     * An optional key describing the period of intra refresh in frames. This is an
    286     * optional parameter that applies only to video encoders. If encoder supports it
    287     * ({@link MediaCodecInfo.CodecCapabilities#FEATURE_IntraRefresh}), the whole
    288     * frame is completely refreshed after the specified period. Also for each frame,
    289     * a fixed subset of macroblocks must be intra coded which leads to more constant bitrate
    290     * than inserting a key frame. This key is recommended for video streaming applications
    291     * as it provides low-delay and good error-resilience. This key is ignored if the
    292     * video encoder does not support the intra refresh feature. Use the output format to
    293     * verify that this feature was enabled.
    294     * The associated value is an integer.
    295     */
    296     public static final String KEY_INTRA_REFRESH_PERIOD = "intra-refresh-period";
    297 
    298    /**
    299      * A key describing the temporal layering schema.  This is an optional parameter
    300      * that applies only to video encoders.  Use {@link MediaCodec#getOutputFormat}
    301      * after {@link MediaCodec#configure configure} to query if the encoder supports
    302      * the desired schema. Supported values are {@code webrtc.vp8.N-layer},
    303      * {@code android.generic.N}, {@code android.generic.N+M} and {@code none}, where
    304      * {@code N} denotes the total number of non-bidirectional layers (which must be at least 1)
    305      * and {@code M} denotes the total number of bidirectional layers (which must be non-negative).
    306      * <p class=note>{@code android.generic.*} schemas have been added in {@link
    307      * android.os.Build.VERSION_CODES#N_MR1}.
    308      * <p>
    309      * The encoder may support fewer temporal layers, in which case the output format
    310      * will contain the configured schema. If the encoder does not support temporal
    311      * layering, the output format will not have an entry with this key.
    312      * The associated value is a string.
    313      */
    314     public static final String KEY_TEMPORAL_LAYERING = "ts-schema";
    315 
    316     /**
    317      * A key describing the stride of the video bytebuffer layout.
    318      * Stride (or row increment) is the difference between the index of a pixel
    319      * and that of the pixel directly underneath. For YUV 420 formats, the
    320      * stride corresponds to the Y plane; the stride of the U and V planes can
    321      * be calculated based on the color format, though it is generally undefined
    322      * and depends on the device and release.
    323      * The associated value is an integer, representing number of bytes.
    324      */
    325     public static final String KEY_STRIDE = "stride";
    326 
    327     /**
    328      * A key describing the plane height of a multi-planar (YUV) video bytebuffer layout.
    329      * Slice height (or plane height/vertical stride) is the number of rows that must be skipped
    330      * to get from the top of the Y plane to the top of the U plane in the bytebuffer. In essence
    331      * the offset of the U plane is sliceHeight * stride. The height of the U/V planes
    332      * can be calculated based on the color format, though it is generally undefined
    333      * and depends on the device and release.
    334      * The associated value is an integer, representing number of rows.
    335      */
    336     public static final String KEY_SLICE_HEIGHT = "slice-height";
    337 
    338     /**
    339      * Applies only when configuring a video encoder in "surface-input" mode.
    340      * The associated value is a long and gives the time in microseconds
    341      * after which the frame previously submitted to the encoder will be
    342      * repeated (once) if no new frame became available since.
    343      */
    344     public static final String KEY_REPEAT_PREVIOUS_FRAME_AFTER
    345         = "repeat-previous-frame-after";
    346 
    347     /**
    348      * If specified when configuring a video decoder rendering to a surface,
    349      * causes the decoder to output "blank", i.e. black frames to the surface
    350      * when stopped to clear out any previously displayed contents.
    351      * The associated value is an integer of value 1.
    352      */
    353     public static final String KEY_PUSH_BLANK_BUFFERS_ON_STOP
    354         = "push-blank-buffers-on-shutdown";
    355 
    356     /**
    357      * A key describing the duration (in microseconds) of the content.
    358      * The associated value is a long.
    359      */
    360     public static final String KEY_DURATION = "durationUs";
    361 
    362     /**
    363      * A key mapping to a value of 1 if the content is AAC audio and
    364      * audio frames are prefixed with an ADTS header.
    365      * The associated value is an integer (0 or 1).
    366      * This key is only supported when <em>decoding</em> content, it cannot
    367      * be used to configure an encoder to emit ADTS output.
    368      */
    369     public static final String KEY_IS_ADTS = "is-adts";
    370 
    371     /**
    372      * A key describing the channel composition of audio content. This mask
    373      * is composed of bits drawn from channel mask definitions in {@link android.media.AudioFormat}.
    374      * The associated value is an integer.
    375      */
    376     public static final String KEY_CHANNEL_MASK = "channel-mask";
    377 
    378     /**
    379      * A key describing the AAC profile to be used (AAC audio formats only).
    380      * Constants are declared in {@link android.media.MediaCodecInfo.CodecProfileLevel}.
    381      */
    382     public static final String KEY_AAC_PROFILE = "aac-profile";
    383 
    384     /**
    385      * A key describing the AAC SBR mode to be used (AAC audio formats only).
    386      * The associated value is an integer and can be set to following values:
    387      * <ul>
    388      * <li>0 - no SBR should be applied</li>
    389      * <li>1 - single rate SBR</li>
    390      * <li>2 - double rate SBR</li>
    391      * </ul>
    392      * Note: If this key is not defined the default SBR mode for the desired AAC profile will
    393      * be used.
    394      * <p>This key is only used during encoding.
    395      */
    396     public static final String KEY_AAC_SBR_MODE = "aac-sbr-mode";
    397 
    398     /**
    399      * A key describing the maximum number of channels that can be output by the AAC decoder.
    400      * By default, the decoder will output the same number of channels as present in the encoded
    401      * stream, if supported. Set this value to limit the number of output channels, and use
    402      * the downmix information in the stream, if available.
    403      * <p>Values larger than the number of channels in the content to decode are ignored.
    404      * <p>This key is only used during decoding.
    405      */
    406     public static final String KEY_AAC_MAX_OUTPUT_CHANNEL_COUNT = "aac-max-output-channel_count";
    407 
    408     /**
    409      * A key describing a gain to be applied so that the output loudness matches the
    410      * Target Reference Level. This is typically used to normalize loudness across program items.
    411      * The gain is derived as the difference between the Target Reference Level and the
    412      * Program Reference Level. The latter can be given in the bitstream and indicates the actual
    413      * loudness value of the program item.
    414      * <p>The value is given as an integer value between
    415      * 0 and 127, and is calculated as -0.25 * Target Reference Level in dBFS.
    416      * Therefore, it represents the range of Full Scale (0 dBFS) to -31.75 dBFS.
    417      * <p>This key is only used during decoding.
    418      */
    419     public static final String KEY_AAC_DRC_TARGET_REFERENCE_LEVEL = "aac-target-ref-level";
    420 
    421     /**
    422      * A key describing the target reference level that was assumed at the encoder for
    423      * calculation of attenuation gains for clipping prevention. This information can be provided
    424      * if it is known, otherwise a worst-case assumption is used.
    425      * <p>The value is given as an integer value between
    426      * 0 and 127, and is calculated as -0.25 * Target Reference Level in dBFS.
    427      * Therefore, it represents the range of Full Scale (0 dBFS) to -31.75 dBFS.
    428      * The default value is the worst-case assumption of 127.
    429      * <p>The value is ignored when heavy compression is used (see
    430      * {@link #KEY_AAC_DRC_HEAVY_COMPRESSION}).
    431      * <p>This key is only used during decoding.
    432      */
    433     public static final String KEY_AAC_ENCODED_TARGET_LEVEL = "aac-encoded-target-level";
    434 
    435     /**
    436      * A key describing the boost factor allowing to adapt the dynamics of the output to the
    437      * actual listening requirements. This relies on DRC gain sequences that can be transmitted in
    438      * the encoded bitstream to be able to reduce the dynamics of the output signal upon request.
    439      * This factor enables the user to select how much of the gains are applied.
    440      * <p>Positive gains (boost) and negative gains (attenuation, see
    441      * {@link #KEY_AAC_DRC_ATTENUATION_FACTOR}) can be controlled separately for a better match
    442      * to different use-cases.
    443      * <p>Typically, attenuation gains are sent for loud signal segments, and boost gains are sent
    444      * for soft signal segments. If the output is listened to in a noisy environment, for example,
    445      * the boost factor is used to enable the positive gains, i.e. to amplify soft signal segments
    446      * beyond the noise floor. But for listening late at night, the attenuation
    447      * factor is used to enable the negative gains, to prevent loud signal from surprising
    448      * the listener. In applications which generally need a low dynamic range, both the boost factor
    449      * and the attenuation factor are used in order to enable all DRC gains.
    450      * <p>In order to prevent clipping, it is also recommended to apply the attenuation factors
    451      * in case of a downmix and/or loudness normalization to high target reference levels.
    452      * <p>Both the boost and the attenuation factor parameters are given as integer values
    453      * between 0 and 127, representing the range of the factor of 0 (i.e. don't apply)
    454      * to 1 (i.e. fully apply boost/attenuation factors respectively).
    455      * <p>This key is only used during decoding.
    456      */
    457     public static final String KEY_AAC_DRC_BOOST_FACTOR = "aac-drc-boost-level";
    458 
    459     /**
    460      * A key describing the attenuation factor allowing to adapt the dynamics of the output to the
    461      * actual listening requirements.
    462      * See {@link #KEY_AAC_DRC_BOOST_FACTOR} for a description of the role of this attenuation
    463      * factor and the value range.
    464      * <p>This key is only used during decoding.
    465      */
    466     public static final String KEY_AAC_DRC_ATTENUATION_FACTOR = "aac-drc-cut-level";
    467 
    468     /**
    469      * A key describing the selection of the heavy compression profile for DRC.
    470      * Two separate DRC gain sequences can be transmitted in one bitstream: MPEG-4 DRC light
    471      * compression, and DVB-specific heavy compression. When selecting the application of the heavy
    472      * compression, one of the sequences is selected:
    473      * <ul>
    474      * <li>0 enables light compression,</li>
    475      * <li>1 enables heavy compression instead.</li>
    476      * </ul>
    477      * Note that only light compression offers the features of scaling of DRC gains
    478      * (see {@link #KEY_AAC_DRC_BOOST_FACTOR} and {@link #KEY_AAC_DRC_ATTENUATION_FACTOR} for the
    479      * boost and attenuation factors), and frequency-selective (multiband) DRC.
    480      * Light compression usually contains clipping prevention for stereo downmixing while heavy
    481      * compression, if additionally provided in the bitstream, is usually stronger, and contains
    482      * clipping prevention for stereo and mono downmixing.
    483      * <p>The default is light compression.
    484      * <p>This key is only used during decoding.
    485      */
    486     public static final String KEY_AAC_DRC_HEAVY_COMPRESSION = "aac-drc-heavy-compression";
    487 
    488     /**
    489      * A key describing the FLAC compression level to be used (FLAC audio format only).
    490      * The associated value is an integer ranging from 0 (fastest, least compression)
    491      * to 8 (slowest, most compression).
    492      */
    493     public static final String KEY_FLAC_COMPRESSION_LEVEL = "flac-compression-level";
    494 
    495     /**
    496      * A key describing the encoding complexity.
    497      * The associated value is an integer.  These values are device and codec specific,
    498      * but lower values generally result in faster and/or less power-hungry encoding.
    499      *
    500      * @see MediaCodecInfo.EncoderCapabilities#getComplexityRange()
    501      */
    502     public static final String KEY_COMPLEXITY = "complexity";
    503 
    504     /**
    505      * A key describing the desired encoding quality.
    506      * The associated value is an integer.  This key is only supported for encoders
    507      * that are configured in constant-quality mode.  These values are device and
    508      * codec specific, but lower values generally result in more efficient
    509      * (smaller-sized) encoding.
    510      *
    511      * @hide
    512      *
    513      * @see MediaCodecInfo.EncoderCapabilities#getQualityRange()
    514      */
    515     public static final String KEY_QUALITY = "quality";
    516 
    517     /**
    518      * A key describing the desired codec priority.
    519      * <p>
    520      * The associated value is an integer. Higher value means lower priority.
    521      * <p>
    522      * Currently, only two levels are supported:<br>
    523      * 0: realtime priority - meaning that the codec shall support the given
    524      *    performance configuration (e.g. framerate) at realtime. This should
    525      *    only be used by media playback, capture, and possibly by realtime
    526      *    communication scenarios if best effort performance is not suitable.<br>
    527      * 1: non-realtime priority (best effort).
    528      * <p>
    529      * This is a hint used at codec configuration and resource planning - to understand
    530      * the realtime requirements of the application; however, due to the nature of
    531      * media components, performance is not guaranteed.
    532      *
    533      */
    534     public static final String KEY_PRIORITY = "priority";
    535 
    536     /**
    537      * A key describing the desired operating frame rate for video or sample rate for audio
    538      * that the codec will need to operate at.
    539      * <p>
    540      * The associated value is an integer or a float representing frames-per-second or
    541      * samples-per-second.
    542      * <p>
    543      * This is used for cases like high-speed/slow-motion video capture, where the video encoder
    544      * format contains the target playback rate (e.g. 30fps), but the component must be able to
    545      * handle the high operating capture rate (e.g. 240fps).
    546      * <p>
    547      * This rate will be used by codec for resource planning and setting the operating points.
    548      *
    549      */
    550     public static final String KEY_OPERATING_RATE = "operating-rate";
    551 
    552     /**
    553      * A key describing the desired profile to be used by an encoder.
    554      * The associated value is an integer.
    555      * Constants are declared in {@link MediaCodecInfo.CodecProfileLevel}.
    556      * This key is used as a hint, and is only supported for codecs
    557      * that specify a profile. Note: Codecs are free to use all the available
    558      * coding tools at the specified profile.
    559      *
    560      * @see MediaCodecInfo.CodecCapabilities#profileLevels
    561      */
    562     public static final String KEY_PROFILE = "profile";
    563 
    564     /**
    565      * A key describing the desired level to be used by an encoder.
    566      * The associated value is an integer.
    567      * Constants are declared in {@link MediaCodecInfo.CodecProfileLevel}.
    568      * This key is used as a further hint when specifying a desired profile,
    569      * and is only supported for codecs that specify a level.
    570      * <p>
    571      * This key is ignored if the {@link #KEY_PROFILE profile} is not specified.
    572      *
    573      * @see MediaCodecInfo.CodecCapabilities#profileLevels
    574      */
    575     public static final String KEY_LEVEL = "level";
    576 
    577     /**
    578      * A key describing the desired clockwise rotation on an output surface.
    579      * This key is only used when the codec is configured using an output surface.
    580      * The associated value is an integer, representing degrees. Supported values
    581      * are 0, 90, 180 or 270. This is an optional field; if not specified, rotation
    582      * defaults to 0.
    583      *
    584      * @see MediaCodecInfo.CodecCapabilities#profileLevels
    585      */
    586     public static final String KEY_ROTATION = "rotation-degrees";
    587 
    588     /**
    589      * A key describing the desired bitrate mode to be used by an encoder.
    590      * Constants are declared in {@link MediaCodecInfo.EncoderCapabilities}.
    591      *
    592      * @see MediaCodecInfo.EncoderCapabilities#isBitrateModeSupported(int)
    593      */
    594     public static final String KEY_BITRATE_MODE = "bitrate-mode";
    595 
    596     /**
    597      * A key describing the audio session ID of the AudioTrack associated
    598      * to a tunneled video codec.
    599      * The associated value is an integer.
    600      *
    601      * @see MediaCodecInfo.CodecCapabilities#FEATURE_TunneledPlayback
    602      */
    603     public static final String KEY_AUDIO_SESSION_ID = "audio-session-id";
    604 
    605     /**
    606      * A key for boolean AUTOSELECT behavior for the track. Tracks with AUTOSELECT=true
    607      * are considered when automatically selecting a track without specific user
    608      * choice, based on the current locale.
    609      * This is currently only used for subtitle tracks, when the user selected
    610      * 'Default' for the captioning locale.
    611      * The associated value is an integer, where non-0 means TRUE.  This is an optional
    612      * field; if not specified, AUTOSELECT defaults to TRUE.
    613      */
    614     public static final String KEY_IS_AUTOSELECT = "is-autoselect";
    615 
    616     /**
    617      * A key for boolean DEFAULT behavior for the track. The track with DEFAULT=true is
    618      * selected in the absence of a specific user choice.
    619      * This is currently only used for subtitle tracks, when the user selected
    620      * 'Default' for the captioning locale.
    621      * The associated value is an integer, where non-0 means TRUE.  This is an optional
    622      * field; if not specified, DEFAULT is considered to be FALSE.
    623      */
    624     public static final String KEY_IS_DEFAULT = "is-default";
    625 
    626 
    627     /**
    628      * A key for the FORCED field for subtitle tracks. True if it is a
    629      * forced subtitle track.  Forced subtitle tracks are essential for the
    630      * content and are shown even when the user turns off Captions.  They
    631      * are used for example to translate foreign/alien dialogs or signs.
    632      * The associated value is an integer, where non-0 means TRUE.  This is an
    633      * optional field; if not specified, FORCED defaults to FALSE.
    634      */
    635     public static final String KEY_IS_FORCED_SUBTITLE = "is-forced-subtitle";
    636 
    637     /** @hide */
    638     public static final String KEY_IS_TIMED_TEXT = "is-timed-text";
    639 
    640     // The following color aspect values must be in sync with the ones in HardwareAPI.h.
    641     /**
    642      * An optional key describing the color primaries, white point and
    643      * luminance factors for video content.
    644      *
    645      * The associated value is an integer: 0 if unspecified, or one of the
    646      * COLOR_STANDARD_ values.
    647      */
    648     public static final String KEY_COLOR_STANDARD = "color-standard";
    649 
    650     /** BT.709 color chromaticity coordinates with KR = 0.2126, KB = 0.0722. */
    651     public static final int COLOR_STANDARD_BT709 = 1;
    652 
    653     /** BT.601 625 color chromaticity coordinates with KR = 0.299, KB = 0.114. */
    654     public static final int COLOR_STANDARD_BT601_PAL = 2;
    655 
    656     /** BT.601 525 color chromaticity coordinates with KR = 0.299, KB = 0.114. */
    657     public static final int COLOR_STANDARD_BT601_NTSC = 4;
    658 
    659     /** BT.2020 color chromaticity coordinates with KR = 0.2627, KB = 0.0593. */
    660     public static final int COLOR_STANDARD_BT2020 = 6;
    661 
    662     /** @hide */
    663     @IntDef({
    664         COLOR_STANDARD_BT709,
    665         COLOR_STANDARD_BT601_PAL,
    666         COLOR_STANDARD_BT601_NTSC,
    667         COLOR_STANDARD_BT2020,
    668     })
    669     @Retention(RetentionPolicy.SOURCE)
    670     public @interface ColorStandard {}
    671 
    672     /**
    673      * An optional key describing the opto-electronic transfer function used
    674      * for the video content.
    675      *
    676      * The associated value is an integer: 0 if unspecified, or one of the
    677      * COLOR_TRANSFER_ values.
    678      */
    679     public static final String KEY_COLOR_TRANSFER = "color-transfer";
    680 
    681     /** Linear transfer characteristic curve. */
    682     public static final int COLOR_TRANSFER_LINEAR = 1;
    683 
    684     /** SMPTE 170M transfer characteristic curve used by BT.601/BT.709/BT.2020. This is the curve
    685      *  used by most non-HDR video content. */
    686     public static final int COLOR_TRANSFER_SDR_VIDEO = 3;
    687 
    688     /** SMPTE ST 2084 transfer function. This is used by some HDR video content. */
    689     public static final int COLOR_TRANSFER_ST2084 = 6;
    690 
    691     /** ARIB STD-B67 hybrid-log-gamma transfer function. This is used by some HDR video content. */
    692     public static final int COLOR_TRANSFER_HLG = 7;
    693 
    694     /** @hide */
    695     @IntDef({
    696         COLOR_TRANSFER_LINEAR,
    697         COLOR_TRANSFER_SDR_VIDEO,
    698         COLOR_TRANSFER_ST2084,
    699         COLOR_TRANSFER_HLG,
    700     })
    701     @Retention(RetentionPolicy.SOURCE)
    702     public @interface ColorTransfer {}
    703 
    704     /**
    705      * An optional key describing the range of the component values of the video content.
    706      *
    707      * The associated value is an integer: 0 if unspecified, or one of the
    708      * COLOR_RANGE_ values.
    709      */
    710     public static final String KEY_COLOR_RANGE = "color-range";
    711 
    712     /** Limited range. Y component values range from 16 to 235 for 8-bit content.
    713      *  Cb, Cr values range from 16 to 240 for 8-bit content.
    714      *  This is the default for video content. */
    715     public static final int COLOR_RANGE_LIMITED = 2;
    716 
    717     /** Full range. Y, Cr and Cb component values range from 0 to 255 for 8-bit content. */
    718     public static final int COLOR_RANGE_FULL = 1;
    719 
    720     /** @hide */
    721     @IntDef({
    722         COLOR_RANGE_LIMITED,
    723         COLOR_RANGE_FULL,
    724     })
    725     @Retention(RetentionPolicy.SOURCE)
    726     public @interface ColorRange {}
    727 
    728     /**
    729      * An optional key describing the static metadata of HDR (high-dynamic-range) video content.
    730      *
    731      * The associated value is a ByteBuffer. This buffer contains the raw contents of the
    732      * Static Metadata Descriptor (including the descriptor ID) of an HDMI Dynamic Range and
    733      * Mastering InfoFrame as defined by CTA-861.3. This key must be provided to video decoders
    734      * for HDR video content unless this information is contained in the bitstream and the video
    735      * decoder supports an HDR-capable profile. This key must be provided to video encoders for
    736      * HDR video content.
    737      */
    738     public static final String KEY_HDR_STATIC_INFO = "hdr-static-info";
    739 
    740     /**
    741      * A key describing a unique ID for the content of a media track.
    742      *
    743      * <p>This key is used by {@link MediaExtractor}. Some extractors provide multiple encodings
    744      * of the same track (e.g. float audio tracks for FLAC and WAV may be expressed as two
    745      * tracks via MediaExtractor: a normal PCM track for backward compatibility, and a float PCM
    746      * track for added fidelity. Similarly, Dolby Vision extractor may provide a baseline SDR
    747      * version of a DV track.) This key can be used to identify which MediaExtractor tracks refer
    748      * to the same underlying content.
    749      * </p>
    750      *
    751      * The associated value is an integer.
    752      */
    753     public static final String KEY_TRACK_ID = "track-id";
    754 
    /**
     * Wraps an existing key/value map as a MediaFormat. The map is stored by
     * reference; no copy is made.
     */
    /* package private */ MediaFormat(Map<String, Object> map) {
        this.mMap = map;
    }
    758 
    /**
     * Creates an empty MediaFormat backed by a fresh, empty map.
     */
    public MediaFormat() {
        // Explicit type arguments instead of a raw HashMap: avoids the unchecked
        // assignment without depending on diamond-operator support.
        mMap = new HashMap<String, Object>();
    }
    765 
    766     /* package private */ Map<String, Object> getMap() {
    767         return mMap;
    768     }
    769 
    770     /**
    771      * Returns true iff a key of the given name exists in the format.
    772      */
    773     public final boolean containsKey(String name) {
    774         return mMap.containsKey(name);
    775     }
    776 
    777     /**
    778      * A key prefix used together with a {@link MediaCodecInfo.CodecCapabilities}
    779      * feature name describing a required or optional feature for a codec capabilities
    780      * query.
    781      * The associated value is an integer, where non-0 value means the feature is
    782      * requested to be present, while 0 value means the feature is requested to be not
    783      * present.
    784      * @see MediaCodecList#findDecoderForFormat
    785      * @see MediaCodecList#findEncoderForFormat
    786      * @see MediaCodecInfo.CodecCapabilities#isFormatSupported
    787      *
    788      * @hide
    789      */
    790     public static final String KEY_FEATURE_ = "feature-";
    791 
    792     /**
    793      * Returns the value of an integer key.
    794      */
    795     public final int getInteger(String name) {
    796         return ((Integer)mMap.get(name)).intValue();
    797     }
    798 
    799     /**
    800      * Returns the value of an integer key, or the default value if the
    801      * key is missing or is for another type value.
    802      * @hide
    803      */
    804     public final int getInteger(String name, int defaultValue) {
    805         try {
    806             return getInteger(name);
    807         }
    808         catch (NullPointerException  e) { /* no such field */ }
    809         catch (ClassCastException e) { /* field of different type */ }
    810         return defaultValue;
    811     }
    812 
    813     /**
    814      * Returns the value of a long key.
    815      */
    816     public final long getLong(String name) {
    817         return ((Long)mMap.get(name)).longValue();
    818     }
    819 
    820     /**
    821      * Returns the value of a float key.
    822      */
    823     public final float getFloat(String name) {
    824         return ((Float)mMap.get(name)).floatValue();
    825     }
    826 
    827     /**
    828      * Returns the value of a string key.
    829      */
    830     public final String getString(String name) {
    831         return (String)mMap.get(name);
    832     }
    833 
    834     /**
    835      * Returns the value of a ByteBuffer key.
    836      */
    837     public final ByteBuffer getByteBuffer(String name) {
    838         return (ByteBuffer)mMap.get(name);
    839     }
    840 
    841     /**
    842      * Returns whether a feature is to be enabled ({@code true}) or disabled
    843      * ({@code false}).
    844      *
    845      * @param feature the name of a {@link MediaCodecInfo.CodecCapabilities} feature.
    846      *
    847      * @throws IllegalArgumentException if the feature was neither set to be enabled
    848      *        nor to be disabled.
    849      */
    850     public boolean getFeatureEnabled(String feature) {
    851         Integer enabled = (Integer)mMap.get(KEY_FEATURE_ + feature);
    852         if (enabled == null) {
    853             throw new IllegalArgumentException("feature is not specified");
    854         }
    855         return enabled != 0;
    856     }
    857 
    858     /**
    859      * Sets the value of an integer key.
    860      */
    861     public final void setInteger(String name, int value) {
    862         mMap.put(name, Integer.valueOf(value));
    863     }
    864 
    865     /**
    866      * Sets the value of a long key.
    867      */
    868     public final void setLong(String name, long value) {
    869         mMap.put(name, Long.valueOf(value));
    870     }
    871 
    872     /**
    873      * Sets the value of a float key.
    874      */
    875     public final void setFloat(String name, float value) {
    876         mMap.put(name, new Float(value));
    877     }
    878 
    879     /**
    880      * Sets the value of a string key.
    881      */
    882     public final void setString(String name, String value) {
    883         mMap.put(name, value);
    884     }
    885 
    886     /**
    887      * Sets the value of a ByteBuffer key.
    888      */
    889     public final void setByteBuffer(String name, ByteBuffer bytes) {
    890         mMap.put(name, bytes);
    891     }
    892 
    893     /**
    894      * Sets whether a feature is to be enabled ({@code true}) or disabled
    895      * ({@code false}).
    896      *
    897      * If {@code enabled} is {@code true}, the feature is requested to be present.
    898      * Otherwise, the feature is requested to be not present.
    899      *
    900      * @param feature the name of a {@link MediaCodecInfo.CodecCapabilities} feature.
    901      *
    902      * @see MediaCodecList#findDecoderForFormat
    903      * @see MediaCodecList#findEncoderForFormat
    904      * @see MediaCodecInfo.CodecCapabilities#isFormatSupported
    905      */
    906     public void setFeatureEnabled(String feature, boolean enabled) {
    907         setInteger(KEY_FEATURE_ + feature, enabled ? 1 : 0);
    908     }
    909 
    910     /**
    911      * Creates a minimal audio format.
    912      * @param mime The mime type of the content.
    913      * @param sampleRate The sampling rate of the content.
    914      * @param channelCount The number of audio channels in the content.
    915      */
    916     public static final MediaFormat createAudioFormat(
    917             String mime,
    918             int sampleRate,
    919             int channelCount) {
    920         MediaFormat format = new MediaFormat();
    921         format.setString(KEY_MIME, mime);
    922         format.setInteger(KEY_SAMPLE_RATE, sampleRate);
    923         format.setInteger(KEY_CHANNEL_COUNT, channelCount);
    924 
    925         return format;
    926     }
    927 
    928     /**
    929      * Creates a minimal subtitle format.
    930      * @param mime The mime type of the content.
    931      * @param language The language of the content, using either ISO 639-1 or 639-2/T
    932      *        codes.  Specify null or "und" if language information is only included
    933      *        in the content.  (This will also work if there are multiple language
    934      *        tracks in the content.)
    935      */
    936     public static final MediaFormat createSubtitleFormat(
    937             String mime,
    938             String language) {
    939         MediaFormat format = new MediaFormat();
    940         format.setString(KEY_MIME, mime);
    941         format.setString(KEY_LANGUAGE, language);
    942 
    943         return format;
    944     }
    945 
    946     /**
    947      * Creates a minimal video format.
    948      * @param mime The mime type of the content.
    949      * @param width The width of the content (in pixels)
    950      * @param height The height of the content (in pixels)
    951      */
    952     public static final MediaFormat createVideoFormat(
    953             String mime,
    954             int width,
    955             int height) {
    956         MediaFormat format = new MediaFormat();
    957         format.setString(KEY_MIME, mime);
    958         format.setInteger(KEY_WIDTH, width);
    959         format.setInteger(KEY_HEIGHT, height);
    960 
    961         return format;
    962     }
    963 
    964     @Override
    965     public String toString() {
    966         return mMap.toString();
    967     }
    968 }
    969