blob: 951695b5b58c629bb9c92c8942dc1794360dc510 [file] [log] [blame]
David Conradb061d892007-06-04 22:10:541/*
Aurelien Jacobsff33c5c2008-08-05 00:42:432 * Matroska file demuxer
Diego Biurrun5968d2d2008-08-05 08:28:573 * Copyright (c) 2003-2008 The FFmpeg Project
David Conradb061d892007-06-04 22:10:544 *
5 * This file is part of FFmpeg.
6 *
7 * FFmpeg is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU Lesser General Public
9 * License as published by the Free Software Foundation; either
10 * version 2.1 of the License, or (at your option) any later version.
11 *
12 * FFmpeg is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * Lesser General Public License for more details.
16 *
17 * You should have received a copy of the GNU Lesser General Public
18 * License along with FFmpeg; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20 */
21
22/**
Diego Biurrunba87f082010-04-20 14:45:3423 * @file
David Conradb061d892007-06-04 22:10:5424 * Matroska file demuxer
Diego Biurrune873c032011-10-30 18:10:5025 * @author Ronald Bultje <[email protected]>
26 * @author with a little help from Moritz Bunkus <[email protected]>
27 * @author totally reworked by Aurelien Jacobs <[email protected]>
28 * @see specs available on the Matroska project page: http://www.matroska.org/
David Conradb061d892007-06-04 22:10:5429 */
30
Keiji Costantini84cfce92014-03-01 16:28:1531#include "config.h"
32
Diego Biurrund92024f2014-03-10 14:35:5933#include <inttypes.h>
Aurelien Jacobs3eb9bfb2008-09-04 23:26:1234#include <stdio.h>
Keiji Costantini84cfce92014-03-01 16:28:1535
36#include "libavutil/avstring.h"
Michael Niedermayerb3d9ab12014-03-07 22:46:3737#include "libavutil/base64.h"
Keiji Costantini84cfce92014-03-01 16:28:1538#include "libavutil/dict.h"
39#include "libavutil/intfloat.h"
40#include "libavutil/intreadwrite.h"
41#include "libavutil/lzo.h"
Neil Birkbeckbbda13a2016-03-01 00:41:0442#include "libavutil/mastering_display_metadata.h"
Anton Khirnoveb3b5502014-04-29 10:03:1343#include "libavutil/mathematics.h"
Vignesh Venkatasubramanian2171b7c2015-03-31 23:51:5744#include "libavutil/opt.h"
Michael Niedermayera52cb422014-11-02 18:19:0745#include "libavutil/time_internal.h"
James Almer445204c2016-12-06 17:48:4546#include "libavutil/spherical.h"
Keiji Costantini84cfce92014-03-01 16:28:1547
48#include "libavcodec/bytestream.h"
Anton Khirnov4efdadc2014-05-25 12:05:5149#include "libavcodec/flac.h"
Keiji Costantini84cfce92014-03-01 16:28:1550#include "libavcodec/mpeg4audio.h"
51
52#include "avformat.h"
53#include "avio_internal.h"
54#include "internal.h"
55#include "isom.h"
56#include "matroska.h"
Anton Khirnov23f741f2014-05-26 10:48:5657#include "oggdec.h"
Keiji Costantini84cfce92014-03-01 16:28:1558/* For ff_codec_get_id(). */
59#include "riff.h"
60#include "rmsipr.h"
David Conradb061d892007-06-04 22:10:5461
Matthew Oliver0167fa02014-11-27 08:00:3662#if CONFIG_BZLIB
63#include <bzlib.h>
64#endif
65#if CONFIG_ZLIB
66#include <zlib.h>
67#endif
68
Mats Peterson79736032015-12-27 20:28:0969#include "qtpalette.h"
70
/*
 * Parser-wide constants.
 *
 * The two byte-count macros are wrapped in parentheses so that they expand
 * to a single operand: without them, an expression such as
 * "x / SKIP_THRESHOLD" would be parsed as "(x / 1024) * 1024".
 */
#define EBML_UNKNOWN_LENGTH  UINT64_MAX /* EBML unknown length, in uint64_t */
#define NEEDS_CHECKING                2 /* Indicates that some error checks
                                         * still need to be performed */
#define LEVEL_ENDED                   3 /* return value of ebml_parse when the
                                         * syntax level used for parsing ended. */
#define SKIP_THRESHOLD  (1024 * 1024)   /* In non-seekable mode, if more than SKIP_THRESHOLD
                                         * of unknown, potentially damaged data is encountered,
                                         * it is considered an error. */
#define UNKNOWN_EQUIV     (50 * 1024)   /* An unknown element is considered equivalent
                                         * to this many bytes of unknown data for the
                                         * SKIP_THRESHOLD check. */
Steve Lhommea2c77022019-02-23 10:14:3382
/**
 * Payload kinds an EbmlSyntax row can declare for an element.
 */
typedef enum {
    EBML_NONE,       /* rows of this type carry only an ID, no target field */
    EBML_UINT,       /* stored into uint64_t fields by the syntax tables */
    EBML_SINT,       /* signed integer */
    EBML_FLOAT,      /* stored into double fields by the syntax tables */
    EBML_STR,        /* stored into char * fields by the syntax tables */
    EBML_UTF8,       /* stored into char * fields by the syntax tables */
    EBML_BIN,        /* stored into EbmlBin fields by the syntax tables */
    EBML_NEST,       /* master element; the row's def.n names the child table */
    EBML_LEVEL1,     /* NOTE(review): presumably a top-level segment child --
                      * confirm against the matroska_segment table */
    EBML_STOP,       /* used for MATROSKA_ID_SEGMENT in the ebml_syntax table */
    EBML_TYPE_COUNT  /* number of types above; keep last */
} EbmlType;
96
97typedef const struct EbmlSyntax {
98 uint32_t id;
99 EbmlType type;
James Almerf34aabf2019-09-03 21:52:51100 size_t list_elem_size;
101 size_t data_offset;
Aurelien Jacobs789ed102008-08-05 00:40:00102 union {
Chris Cunninghamac258402017-02-03 22:42:44103 int64_t i;
Aurelien Jacobs789ed102008-08-05 00:40:00104 uint64_t u;
105 double f;
106 const char *s;
107 const struct EbmlSyntax *n;
108 } def;
109} EbmlSyntax;
110
/**
 * Untyped array of parsed elements; the element type is implied by the
 * syntax row that targets the list (see EbmlSyntax.list_elem_size).
 */
typedef struct EbmlList {
    int          nb_elem;          /* number of elements stored in elem */
    unsigned int alloc_elem_size;  /* NOTE(review): presumably the allocated
                                    * size of elem -- confirm at the
                                    * allocation site */
    void        *elem;             /* element storage */
} EbmlList;
116
Diego Biurrundaf8cf32014-09-22 07:19:33117typedef struct EbmlBin {
Aurelien Jacobs789ed102008-08-05 00:40:00118 int size;
James Almera6188662018-04-04 17:12:54119 AVBufferRef *buf;
Aurelien Jacobs789ed102008-08-05 00:40:00120 uint8_t *data;
121 int64_t pos;
122} EbmlBin;
123
/**
 * Values of the EBML header, filled in through the ebml_header table.
 */
typedef struct Ebml {
    uint64_t version;          /* EBML_ID_EBMLREADVERSION */
    uint64_t max_size;         /* EBML_ID_EBMLMAXSIZELENGTH */
    uint64_t id_length;        /* EBML_ID_EBMLMAXIDLENGTH */
    char    *doctype;          /* EBML_ID_DOCTYPE */
    uint64_t doctype_version;  /* EBML_ID_DOCTYPEREADVERSION */
} Ebml;
131
Diego Biurrundaf8cf32014-09-22 07:19:33132typedef struct MatroskaTrackCompression {
Aurelien Jacobs2cbc8812008-08-05 00:40:31133 uint64_t algo;
134 EbmlBin settings;
135} MatroskaTrackCompression;
David Conradb061d892007-06-04 22:10:54136
Michael Niedermayera0fe1a22015-02-14 20:07:40137typedef struct MatroskaTrackEncryption {
Frank Galliganb8531032013-03-07 16:11:38138 uint64_t algo;
139 EbmlBin key_id;
140} MatroskaTrackEncryption;
141
Diego Biurrundaf8cf32014-09-22 07:19:33142typedef struct MatroskaTrackEncoding {
Aurelien Jacobs2cbc8812008-08-05 00:40:31143 uint64_t scope;
144 uint64_t type;
145 MatroskaTrackCompression compression;
Frank Galliganb8531032013-03-07 16:11:38146 MatroskaTrackEncryption encryption;
Aurelien Jacobs2cbc8812008-08-05 00:40:31147} MatroskaTrackEncoding;
David Conradb061d892007-06-04 22:10:54148
/**
 * Mastering metadata of a video colour description
 * (filled via matroska_mastering_meta, where every field defaults to -1).
 */
typedef struct MatroskaMasteringMeta {
    /* chromaticity coordinates of the three primaries */
    double r_x, r_y;
    double g_x, g_y;
    double b_x, b_y;
    /* chromaticity coordinates of the white point */
    double white_x, white_y;
    /* luminance bounds; note that max precedes min in the layout */
    double max_luminance;
    double min_luminance;
} MatroskaMasteringMeta;
161
162typedef struct MatroskaTrackVideoColor {
163 uint64_t matrix_coefficients;
164 uint64_t bits_per_channel;
165 uint64_t chroma_sub_horz;
166 uint64_t chroma_sub_vert;
167 uint64_t cb_sub_horz;
168 uint64_t cb_sub_vert;
169 uint64_t chroma_siting_horz;
170 uint64_t chroma_siting_vert;
171 uint64_t range;
172 uint64_t transfer_characteristics;
173 uint64_t primaries;
174 uint64_t max_cll;
175 uint64_t max_fall;
176 MatroskaMasteringMeta mastering_meta;
177} MatroskaTrackVideoColor;
178
James Almer445204c2016-12-06 17:48:45179typedef struct MatroskaTrackVideoProjection {
180 uint64_t type;
181 EbmlBin private;
182 double yaw;
183 double pitch;
184 double roll;
185} MatroskaTrackVideoProjection;
186
Diego Biurrundaf8cf32014-09-22 07:19:33187typedef struct MatroskaTrackVideo {
Aurelien Jacobs2cbc8812008-08-05 00:40:31188 double frame_rate;
189 uint64_t display_width;
190 uint64_t display_height;
191 uint64_t pixel_width;
192 uint64_t pixel_height;
Andreas Rheinhardt60f75c92019-05-16 22:30:13193 EbmlBin color_space;
James Almerbad8bbc2016-10-15 21:01:50194 uint64_t display_unit;
Luca Barbato5f022662016-03-28 18:29:54195 uint64_t interlaced;
196 uint64_t field_order;
Aurelien Jacobs4c509fe2011-05-23 23:09:24197 uint64_t stereo_mode;
Vignesh Venkatasubramaniance6a8e52013-02-04 23:17:52198 uint64_t alpha_mode;
James Almer4e759072016-12-05 02:22:39199 EbmlList color;
James Almer445204c2016-12-06 17:48:45200 MatroskaTrackVideoProjection projection;
Aurelien Jacobs2cbc8812008-08-05 00:40:31201} MatroskaTrackVideo;
David Conradb061d892007-06-04 22:10:54202
/**
 * Audio-specific settings of a track (the first four fields are filled
 * via matroska_track_audio).
 */
typedef struct MatroskaTrackAudio {
    double   samplerate;      /* table default 8000.0 */
    double   out_samplerate;
    uint64_t bitdepth;
    uint64_t channels;        /* table default 1 */

    /* real audio header (extracted from extradata) */
    int      coded_framesize;
    int      sub_packet_h;
    int      frame_size;
    int      sub_packet_size;
    int      sub_packet_cnt;
    int      pkt_cnt;
    uint64_t buf_timecode;
    uint8_t *buf;
} MatroskaTrackAudio;
David Conradb061d892007-06-04 22:10:54219
/**
 * One plane of a combined track (filled via matroska_track_plane).
 */
typedef struct MatroskaTrackPlane {
    uint64_t uid;   /* MATROSKA_ID_TRACKPLANEUID */
    uint64_t type;  /* MATROSKA_ID_TRACKPLANETYPE */
} MatroskaTrackPlane;
224
Michael Niedermayera0fe1a22015-02-14 20:07:40225typedef struct MatroskaTrackOperation {
Kirill Gavrilove6ec9212011-05-21 15:14:14226 EbmlList combine_planes;
Kirill Gavrilove6ec9212011-05-21 15:14:14227} MatroskaTrackOperation;
228
Diego Biurrundaf8cf32014-09-22 07:19:33229typedef struct MatroskaTrack {
Aurelien Jacobs2cbc8812008-08-05 00:40:31230 uint64_t num;
Aurelien Jacobs325ace32009-02-15 15:34:22231 uint64_t uid;
Aurelien Jacobs2cbc8812008-08-05 00:40:31232 uint64_t type;
Aurelien Jacobs38766e02009-02-15 15:29:09233 char *name;
Aurelien Jacobs2cbc8812008-08-05 00:40:31234 char *codec_id;
235 EbmlBin codec_priv;
236 char *language;
Anton Khirnov7ff97082008-06-01 13:54:11237 double time_scale;
David Conradb061d892007-06-04 22:10:54238 uint64_t default_duration;
Aurelien Jacobs4eff9742008-08-05 00:39:53239 uint64_t flag_default;
Aurelien Jacobs7a617a82010-07-02 16:38:44240 uint64_t flag_forced;
Vignesh Venkatasubramaniand6f86d72013-10-14 17:42:08241 uint64_t seek_preroll;
Aurelien Jacobs2cbc8812008-08-05 00:40:31242 MatroskaTrackVideo video;
243 MatroskaTrackAudio audio;
Kirill Gavrilove6ec9212011-05-21 15:14:14244 MatroskaTrackOperation operation;
Aurelien Jacobs2cbc8812008-08-05 00:40:31245 EbmlList encodings;
Anton Khirnoveb3b5502014-04-29 10:03:13246 uint64_t codec_delay;
Michael Niedermayerb5bc4362016-06-06 02:23:16247 uint64_t codec_delay_in_track_tb;
Aurelien Jacobsfc4d3352008-08-05 00:40:06248
249 AVStream *stream;
Aurelien Jacobs82360e62008-09-09 12:07:10250 int64_t end_timecode;
Joakim Plate3e93c8e2010-03-03 21:46:43251 int ms_compat;
Vignesh Venkatasubramanian30c5c452013-02-13 21:51:48252 uint64_t max_block_additional_id;
Mats Peterson6aac43f2016-02-24 17:14:05253
254 uint32_t palette[AVPALETTE_COUNT];
255 int has_palette;
David Conradb061d892007-06-04 22:10:54256} MatroskaTrack;
257
Diego Biurrundaf8cf32014-09-22 07:19:33258typedef struct MatroskaAttachment {
Aurelien Jacobs325ace32009-02-15 15:34:22259 uint64_t uid;
Aurelien Jacobsb414cb82008-08-05 00:40:24260 char *filename;
261 char *mime;
262 EbmlBin bin;
Aurelien Jacobs929e9de2009-02-15 15:53:55263
264 AVStream *stream;
Diego Biurrunf69befe2014-03-07 12:54:18265} MatroskaAttachment;
Aurelien Jacobsb414cb82008-08-05 00:40:24266
Diego Biurrundaf8cf32014-09-22 07:19:33267typedef struct MatroskaChapter {
Aurelien Jacobs6bbd7c72008-08-05 00:40:21268 uint64_t start;
269 uint64_t end;
270 uint64_t uid;
271 char *title;
Aurelien Jacobs6cb6e152009-02-15 15:25:14272
273 AVChapter *chapter;
Aurelien Jacobs6bbd7c72008-08-05 00:40:21274} MatroskaChapter;
275
/**
 * A (track, position) pair; MatroskaIndex holds a list of these.
 */
typedef struct MatroskaIndexPos {
    uint64_t track;
    uint64_t pos;
} MatroskaIndexPos;
280
Diego Biurrundaf8cf32014-09-22 07:19:33281typedef struct MatroskaIndex {
Aurelien Jacobse5929fd2008-08-05 00:40:15282 uint64_t time;
283 EbmlList pos;
284} MatroskaIndex;
285
Diego Biurrundaf8cf32014-09-22 07:19:33286typedef struct MatroskaTag {
Aurelien Jacobs44015c52008-08-08 23:50:38287 char *name;
288 char *string;
Aurelien Jacobsf702df32009-02-15 16:05:37289 char *lang;
290 uint64_t def;
Aurelien Jacobs44015c52008-08-08 23:50:38291 EbmlList sub;
292} MatroskaTag;
293
/**
 * Target description of a tag group.
 */
typedef struct MatroskaTagTarget {
    char    *type;
    uint64_t typevalue;
    uint64_t trackuid;
    uint64_t chapteruid;
    uint64_t attachuid;
} MatroskaTagTarget;
301
Diego Biurrundaf8cf32014-09-22 07:19:33302typedef struct MatroskaTags {
Aurelien Jacobs929e9de2009-02-15 15:53:55303 MatroskaTagTarget target;
304 EbmlList tag;
305} MatroskaTags;
306
/**
 * One seek-head entry: an ID and a position.
 */
typedef struct MatroskaSeekhead {
    uint64_t id;
    uint64_t pos;
} MatroskaSeekhead;
311
/**
 * Extent of one open nesting level; MatroskaDemuxContext keeps an array
 * of these in levels[].
 */
typedef struct MatroskaLevel {
    uint64_t start;
    uint64_t length;
} MatroskaLevel;
316
Andreas Rheinhardtffa64a42019-05-16 22:29:59317typedef struct MatroskaBlock {
318 uint64_t duration;
319 int64_t reference;
320 uint64_t non_simple;
321 EbmlBin bin;
322 uint64_t additional_id;
323 EbmlBin additional;
Andreas Rheinhardt60f75c92019-05-16 22:30:13324 int64_t discard_padding;
Andreas Rheinhardtffa64a42019-05-16 22:29:59325} MatroskaBlock;
326
Diego Biurrundaf8cf32014-09-22 07:19:33327typedef struct MatroskaCluster {
Andreas Rheinhardtffa64a42019-05-16 22:29:59328 MatroskaBlock block;
Dale Curtis8336eb62012-04-19 18:12:24329 uint64_t timecode;
Andreas Rheinhardtffa64a42019-05-16 22:29:59330 int64_t pos;
Dale Curtis8336eb62012-04-19 18:12:24331} MatroskaCluster;
332
/**
 * Bookkeeping entry for a level-1 element; see
 * MatroskaDemuxContext.level1_elems.
 */
typedef struct MatroskaLevel1Element {
    int64_t  pos;
    uint32_t id;
    int      parsed;  /* whether the element was read yet */
} MatroskaLevel1Element;
338
Diego Biurrundaf8cf32014-09-22 07:19:33339typedef struct MatroskaDemuxContext {
Vignesh Venkatasubramanian2171b7c2015-03-31 23:51:57340 const AVClass *class;
David Conradb061d892007-06-04 22:10:54341 AVFormatContext *ctx;
342
Diego Biurrun5968d2d2008-08-05 08:28:57343 /* EBML stuff */
David Conradb061d892007-06-04 22:10:54344 MatroskaLevel levels[EBML_MAX_DEPTH];
Andreas Rheinhardt60f75c92019-05-16 22:30:13345 int num_levels;
Aurelien Jacobsc3ade622010-06-11 16:34:01346 uint32_t current_id;
Andreas Rheinhardta3db9f62019-05-16 22:30:05347 int64_t resync_pos;
Andreas Rheinhardt51203052019-05-16 22:30:14348 int unknown_count;
David Conradb061d892007-06-04 22:10:54349
Aurelien Jacobs29708582008-08-05 00:40:27350 uint64_t time_scale;
351 double duration;
352 char *title;
James Almer2c759d72013-11-24 08:31:48353 char *muxingapp;
Andreas Rheinhardt60f75c92019-05-16 22:30:13354 EbmlBin date_utc;
Aurelien Jacobs2cbc8812008-08-05 00:40:31355 EbmlList tracks;
Aurelien Jacobsb414cb82008-08-05 00:40:24356 EbmlList attachments;
Aurelien Jacobs6bbd7c72008-08-05 00:40:21357 EbmlList chapters;
Aurelien Jacobse5929fd2008-08-05 00:40:15358 EbmlList index;
Aurelien Jacobs44015c52008-08-08 23:50:38359 EbmlList tags;
Aurelien Jacobs13b350a2008-08-05 00:40:36360 EbmlList seekhead;
David Conradb061d892007-06-04 22:10:54361
David Conradb061d892007-06-04 22:10:54362 /* byte position of the segment inside the stream */
Diego Biurrunbc5c9182008-10-03 10:16:29363 int64_t segment_start;
David Conradb061d892007-06-04 22:10:54364
Diego Biurrun5968d2d2008-08-05 08:28:57365 /* the packet queue */
James Almer78b96be2018-03-26 18:02:37366 AVPacketList *queue;
367 AVPacketList *queue_end;
David Conradb061d892007-06-04 22:10:54368
Aurelien Jacobs8d75b5a2007-06-04 22:35:16369 int done;
David Conradb061d892007-06-04 22:10:54370
David Conradb061d892007-06-04 22:10:54371 /* What to skip before effectively reading a packet. */
372 int skip_to_keyframe;
Aurelien Jacobs20f74662008-09-09 12:01:51373 uint64_t skip_to_timecode;
Aaron Colwell31ad14c2011-07-09 05:48:43374
375 /* File has a CUES element, but we defer parsing until it is needed. */
376 int cues_parsing_deferred;
Dale Curtis8336eb62012-04-19 18:12:24377
wm4cac22952015-02-09 19:39:00378 /* Level1 elements and whether they were read yet */
379 MatroskaLevel1Element level1_elems[64];
380 int num_level1_elems;
381
Dale Curtis8336eb62012-04-19 18:12:24382 MatroskaCluster current_cluster;
383
James Zern20aeee42017-04-17 17:59:31384 /* WebM DASH Manifest live flag */
Vignesh Venkatasubramanian2171b7c2015-03-31 23:51:57385 int is_live;
Vignesh Venkatasubramanian62c27fd2017-04-12 04:33:28386
387 /* Bandwidth value for WebM DASH Manifest */
388 int bandwidth;
David Conradb061d892007-06-04 22:10:54389} MatroskaDemuxContext;
390
/* Terminating row of a syntax table: every field is zero except def.n,
 * which links to the table of the parent element. */
#define CHILD_OF(parent) \
    { .def = { .n = (parent) } }
392
Andreas Rheinhardtab4795a2019-07-17 03:29:40393// The following forward declarations need their size because
394// a tentative definition with internal linkage must not be an
395// incomplete type (6.7.2 in C90, 6.9.2 in C99).
396// Removing the sizes breaks MSVC.
Andreas Rheinhardt9869e212019-07-18 19:07:20397static EbmlSyntax ebml_syntax[3], matroska_segment[9], matroska_track_video_color[15], matroska_track_video[19],
398 matroska_track[27], matroska_track_encoding[6], matroska_track_encodings[2],
399 matroska_track_combine_planes[2], matroska_track_operation[2], matroska_tracks[2],
400 matroska_attachments[2], matroska_chapter_entry[9], matroska_chapter[6], matroska_chapters[2],
401 matroska_index_entry[3], matroska_index[2], matroska_tag[3], matroska_tags[2], matroska_seekhead[2],
402 matroska_blockadditions[2], matroska_blockgroup[8], matroska_cluster_parsing[8];
Andreas Rheinhardtc1abd952019-05-16 22:30:06403
Andreas Rheinhardt9869e212019-07-18 19:07:20404static EbmlSyntax ebml_header[] = {
Keiji Costantini84cfce92014-03-01 16:28:15405 { EBML_ID_EBMLREADVERSION, EBML_UINT, 0, offsetof(Ebml, version), { .u = EBML_VERSION } },
406 { EBML_ID_EBMLMAXSIZELENGTH, EBML_UINT, 0, offsetof(Ebml, max_size), { .u = 8 } },
407 { EBML_ID_EBMLMAXIDLENGTH, EBML_UINT, 0, offsetof(Ebml, id_length), { .u = 4 } },
408 { EBML_ID_DOCTYPE, EBML_STR, 0, offsetof(Ebml, doctype), { .s = "(none)" } },
409 { EBML_ID_DOCTYPEREADVERSION, EBML_UINT, 0, offsetof(Ebml, doctype_version), { .u = 1 } },
410 { EBML_ID_EBMLVERSION, EBML_NONE },
411 { EBML_ID_DOCTYPEVERSION, EBML_NONE },
Andreas Rheinhardtc1abd952019-05-16 22:30:06412 CHILD_OF(ebml_syntax)
Aurelien Jacobs63511322008-08-05 00:40:02413};
414
Andreas Rheinhardt9869e212019-07-18 19:07:20415static EbmlSyntax ebml_syntax[] = {
Andreas Rheinhardtc1abd952019-05-16 22:30:06416 { EBML_ID_HEADER, EBML_NEST, 0, 0, { .n = ebml_header } },
417 { MATROSKA_ID_SEGMENT, EBML_STOP },
Aurelien Jacobs63511322008-08-05 00:40:02418 { 0 }
419};
420
Andreas Rheinhardt9869e212019-07-18 19:07:20421static EbmlSyntax matroska_info[] = {
Keiji Costantini84cfce92014-03-01 16:28:15422 { MATROSKA_ID_TIMECODESCALE, EBML_UINT, 0, offsetof(MatroskaDemuxContext, time_scale), { .u = 1000000 } },
423 { MATROSKA_ID_DURATION, EBML_FLOAT, 0, offsetof(MatroskaDemuxContext, duration) },
424 { MATROSKA_ID_TITLE, EBML_UTF8, 0, offsetof(MatroskaDemuxContext, title) },
425 { MATROSKA_ID_WRITINGAPP, EBML_NONE },
Michael Niedermayerb3d9ab12014-03-07 22:46:37426 { MATROSKA_ID_MUXINGAPP, EBML_UTF8, 0, offsetof(MatroskaDemuxContext, muxingapp) },
427 { MATROSKA_ID_DATEUTC, EBML_BIN, 0, offsetof(MatroskaDemuxContext, date_utc) },
Keiji Costantini84cfce92014-03-01 16:28:15428 { MATROSKA_ID_SEGMENTUID, EBML_NONE },
Andreas Rheinhardtc1abd952019-05-16 22:30:06429 CHILD_OF(matroska_segment)
Aurelien Jacobs29708582008-08-05 00:40:27430};
431
Andreas Rheinhardt9869e212019-07-18 19:07:20432static EbmlSyntax matroska_mastering_meta[] = {
Neil Birkbeckbbda13a2016-03-01 00:41:04433 { MATROSKA_ID_VIDEOCOLOR_RX, EBML_FLOAT, 0, offsetof(MatroskaMasteringMeta, r_x), { .f=-1 } },
434 { MATROSKA_ID_VIDEOCOLOR_RY, EBML_FLOAT, 0, offsetof(MatroskaMasteringMeta, r_y), { .f=-1 } },
435 { MATROSKA_ID_VIDEOCOLOR_GX, EBML_FLOAT, 0, offsetof(MatroskaMasteringMeta, g_x), { .f=-1 } },
436 { MATROSKA_ID_VIDEOCOLOR_GY, EBML_FLOAT, 0, offsetof(MatroskaMasteringMeta, g_y), { .f=-1 } },
437 { MATROSKA_ID_VIDEOCOLOR_BX, EBML_FLOAT, 0, offsetof(MatroskaMasteringMeta, b_x), { .f=-1 } },
438 { MATROSKA_ID_VIDEOCOLOR_BY, EBML_FLOAT, 0, offsetof(MatroskaMasteringMeta, b_y), { .f=-1 } },
439 { MATROSKA_ID_VIDEOCOLOR_WHITEX, EBML_FLOAT, 0, offsetof(MatroskaMasteringMeta, white_x), { .f=-1 } },
440 { MATROSKA_ID_VIDEOCOLOR_WHITEY, EBML_FLOAT, 0, offsetof(MatroskaMasteringMeta, white_y), { .f=-1 } },
441 { MATROSKA_ID_VIDEOCOLOR_LUMINANCEMIN, EBML_FLOAT, 0, offsetof(MatroskaMasteringMeta, min_luminance), { .f=-1 } },
442 { MATROSKA_ID_VIDEOCOLOR_LUMINANCEMAX, EBML_FLOAT, 0, offsetof(MatroskaMasteringMeta, max_luminance), { .f=-1 } },
Andreas Rheinhardtc1abd952019-05-16 22:30:06443 CHILD_OF(matroska_track_video_color)
Neil Birkbeckbbda13a2016-03-01 00:41:04444};
445
Andreas Rheinhardt9869e212019-07-18 19:07:20446static EbmlSyntax matroska_track_video_color[] = {
James Almerf5cfc0c2016-10-19 02:40:09447 { MATROSKA_ID_VIDEOCOLORMATRIXCOEFF, EBML_UINT, 0, offsetof(MatroskaTrackVideoColor, matrix_coefficients), { .u = AVCOL_SPC_UNSPECIFIED } },
James Almer0ad71ed2016-10-19 02:55:32448 { MATROSKA_ID_VIDEOCOLORBITSPERCHANNEL, EBML_UINT, 0, offsetof(MatroskaTrackVideoColor, bits_per_channel), { .u=0 } },
Neil Birkbeckbbda13a2016-03-01 00:41:04449 { MATROSKA_ID_VIDEOCOLORCHROMASUBHORZ, EBML_UINT, 0, offsetof(MatroskaTrackVideoColor, chroma_sub_horz), { .u=0 } },
450 { MATROSKA_ID_VIDEOCOLORCHROMASUBVERT, EBML_UINT, 0, offsetof(MatroskaTrackVideoColor, chroma_sub_vert), { .u=0 } },
451 { MATROSKA_ID_VIDEOCOLORCBSUBHORZ, EBML_UINT, 0, offsetof(MatroskaTrackVideoColor, cb_sub_horz), { .u=0 } },
452 { MATROSKA_ID_VIDEOCOLORCBSUBVERT, EBML_UINT, 0, offsetof(MatroskaTrackVideoColor, cb_sub_vert), { .u=0 } },
James Almerf5cfc0c2016-10-19 02:40:09453 { MATROSKA_ID_VIDEOCOLORCHROMASITINGHORZ, EBML_UINT, 0, offsetof(MatroskaTrackVideoColor, chroma_siting_horz), { .u = MATROSKA_COLOUR_CHROMASITINGHORZ_UNDETERMINED } },
454 { MATROSKA_ID_VIDEOCOLORCHROMASITINGVERT, EBML_UINT, 0, offsetof(MatroskaTrackVideoColor, chroma_siting_vert), { .u = MATROSKA_COLOUR_CHROMASITINGVERT_UNDETERMINED } },
455 { MATROSKA_ID_VIDEOCOLORRANGE, EBML_UINT, 0, offsetof(MatroskaTrackVideoColor, range), { .u = AVCOL_RANGE_UNSPECIFIED } },
456 { MATROSKA_ID_VIDEOCOLORTRANSFERCHARACTERISTICS, EBML_UINT, 0, offsetof(MatroskaTrackVideoColor, transfer_characteristics), { .u = AVCOL_TRC_UNSPECIFIED } },
457 { MATROSKA_ID_VIDEOCOLORPRIMARIES, EBML_UINT, 0, offsetof(MatroskaTrackVideoColor, primaries), { .u = AVCOL_PRI_UNSPECIFIED } },
Neil Birkbeckbbda13a2016-03-01 00:41:04458 { MATROSKA_ID_VIDEOCOLORMAXCLL, EBML_UINT, 0, offsetof(MatroskaTrackVideoColor, max_cll), { .u=0 } },
459 { MATROSKA_ID_VIDEOCOLORMAXFALL, EBML_UINT, 0, offsetof(MatroskaTrackVideoColor, max_fall), { .u=0 } },
460 { MATROSKA_ID_VIDEOCOLORMASTERINGMETA, EBML_NEST, 0, offsetof(MatroskaTrackVideoColor, mastering_meta), { .n = matroska_mastering_meta } },
Andreas Rheinhardtc1abd952019-05-16 22:30:06461 CHILD_OF(matroska_track_video)
Neil Birkbeckbbda13a2016-03-01 00:41:04462};
463
Andreas Rheinhardt9869e212019-07-18 19:07:20464static EbmlSyntax matroska_track_video_projection[] = {
James Almer445204c2016-12-06 17:48:45465 { MATROSKA_ID_VIDEOPROJECTIONTYPE, EBML_UINT, 0, offsetof(MatroskaTrackVideoProjection, type), { .u = MATROSKA_VIDEO_PROJECTION_TYPE_RECTANGULAR } },
466 { MATROSKA_ID_VIDEOPROJECTIONPRIVATE, EBML_BIN, 0, offsetof(MatroskaTrackVideoProjection, private) },
467 { MATROSKA_ID_VIDEOPROJECTIONPOSEYAW, EBML_FLOAT, 0, offsetof(MatroskaTrackVideoProjection, yaw), { .f=0.0 } },
468 { MATROSKA_ID_VIDEOPROJECTIONPOSEPITCH, EBML_FLOAT, 0, offsetof(MatroskaTrackVideoProjection, pitch), { .f=0.0 } },
469 { MATROSKA_ID_VIDEOPROJECTIONPOSEROLL, EBML_FLOAT, 0, offsetof(MatroskaTrackVideoProjection, roll), { .f=0.0 } },
Andreas Rheinhardtc1abd952019-05-16 22:30:06470 CHILD_OF(matroska_track_video)
James Almer445204c2016-12-06 17:48:45471};
472
Andreas Rheinhardt9869e212019-07-18 19:07:20473static EbmlSyntax matroska_track_video[] = {
Keiji Costantini84cfce92014-03-01 16:28:15474 { MATROSKA_ID_VIDEOFRAMERATE, EBML_FLOAT, 0, offsetof(MatroskaTrackVideo, frame_rate) },
Michael Niedermayerb3d9ab12014-03-07 22:46:37475 { MATROSKA_ID_VIDEODISPLAYWIDTH, EBML_UINT, 0, offsetof(MatroskaTrackVideo, display_width), { .u=-1 } },
476 { MATROSKA_ID_VIDEODISPLAYHEIGHT, EBML_UINT, 0, offsetof(MatroskaTrackVideo, display_height), { .u=-1 } },
Keiji Costantini84cfce92014-03-01 16:28:15477 { MATROSKA_ID_VIDEOPIXELWIDTH, EBML_UINT, 0, offsetof(MatroskaTrackVideo, pixel_width) },
478 { MATROSKA_ID_VIDEOPIXELHEIGHT, EBML_UINT, 0, offsetof(MatroskaTrackVideo, pixel_height) },
Michael Niedermayerb3d9ab12014-03-07 22:46:37479 { MATROSKA_ID_VIDEOCOLORSPACE, EBML_BIN, 0, offsetof(MatroskaTrackVideo, color_space) },
Michael Niedermayerb3d9ab12014-03-07 22:46:37480 { MATROSKA_ID_VIDEOALPHAMODE, EBML_UINT, 0, offsetof(MatroskaTrackVideo, alpha_mode) },
James Almer4e759072016-12-05 02:22:39481 { MATROSKA_ID_VIDEOCOLOR, EBML_NEST, sizeof(MatroskaTrackVideoColor), offsetof(MatroskaTrackVideo, color), { .n = matroska_track_video_color } },
James Almer445204c2016-12-06 17:48:45482 { MATROSKA_ID_VIDEOPROJECTION, EBML_NEST, 0, offsetof(MatroskaTrackVideo, projection), { .n = matroska_track_video_projection } },
Keiji Costantini84cfce92014-03-01 16:28:15483 { MATROSKA_ID_VIDEOPIXELCROPB, EBML_NONE },
484 { MATROSKA_ID_VIDEOPIXELCROPT, EBML_NONE },
485 { MATROSKA_ID_VIDEOPIXELCROPL, EBML_NONE },
486 { MATROSKA_ID_VIDEOPIXELCROPR, EBML_NONE },
James Almerbad8bbc2016-10-15 21:01:50487 { MATROSKA_ID_VIDEODISPLAYUNIT, EBML_UINT, 0, offsetof(MatroskaTrackVideo, display_unit), { .u= MATROSKA_VIDEO_DISPLAYUNIT_PIXELS } },
Luca Barbato5f022662016-03-28 18:29:54488 { MATROSKA_ID_VIDEOFLAGINTERLACED, EBML_UINT, 0, offsetof(MatroskaTrackVideo, interlaced), { .u = MATROSKA_VIDEO_INTERLACE_FLAG_UNDETERMINED } },
489 { MATROSKA_ID_VIDEOFIELDORDER, EBML_UINT, 0, offsetof(MatroskaTrackVideo, field_order), { .u = MATROSKA_VIDEO_FIELDORDER_UNDETERMINED } },
Vittorio Giovarad4ae8ac2014-08-12 21:28:49490 { MATROSKA_ID_VIDEOSTEREOMODE, EBML_UINT, 0, offsetof(MatroskaTrackVideo, stereo_mode), { .u = MATROSKA_VIDEO_STEREOMODE_TYPE_NB } },
Keiji Costantini84cfce92014-03-01 16:28:15491 { MATROSKA_ID_VIDEOASPECTRATIO, EBML_NONE },
Andreas Rheinhardtc1abd952019-05-16 22:30:06492 CHILD_OF(matroska_track)
Aurelien Jacobs2cbc8812008-08-05 00:40:31493};
494
Andreas Rheinhardt9869e212019-07-18 19:07:20495static EbmlSyntax matroska_track_audio[] = {
Keiji Costantini84cfce92014-03-01 16:28:15496 { MATROSKA_ID_AUDIOSAMPLINGFREQ, EBML_FLOAT, 0, offsetof(MatroskaTrackAudio, samplerate), { .f = 8000.0 } },
497 { MATROSKA_ID_AUDIOOUTSAMPLINGFREQ, EBML_FLOAT, 0, offsetof(MatroskaTrackAudio, out_samplerate) },
498 { MATROSKA_ID_AUDIOBITDEPTH, EBML_UINT, 0, offsetof(MatroskaTrackAudio, bitdepth) },
499 { MATROSKA_ID_AUDIOCHANNELS, EBML_UINT, 0, offsetof(MatroskaTrackAudio, channels), { .u = 1 } },
Andreas Rheinhardtc1abd952019-05-16 22:30:06500 CHILD_OF(matroska_track)
Aurelien Jacobs2cbc8812008-08-05 00:40:31501};
502
Andreas Rheinhardt9869e212019-07-18 19:07:20503static EbmlSyntax matroska_track_encoding_compression[] = {
Keiji Costantini84cfce92014-03-01 16:28:15504 { MATROSKA_ID_ENCODINGCOMPALGO, EBML_UINT, 0, offsetof(MatroskaTrackCompression, algo), { .u = 0 } },
505 { MATROSKA_ID_ENCODINGCOMPSETTINGS, EBML_BIN, 0, offsetof(MatroskaTrackCompression, settings) },
Andreas Rheinhardtc1abd952019-05-16 22:30:06506 CHILD_OF(matroska_track_encoding)
Aurelien Jacobs2cbc8812008-08-05 00:40:31507};
508
Andreas Rheinhardt9869e212019-07-18 19:07:20509static EbmlSyntax matroska_track_encoding_encryption[] = {
Michael Niedermayerb3d9ab12014-03-07 22:46:37510 { MATROSKA_ID_ENCODINGENCALGO, EBML_UINT, 0, offsetof(MatroskaTrackEncryption,algo), {.u = 0} },
Frank Galliganb8531032013-03-07 16:11:38511 { MATROSKA_ID_ENCODINGENCKEYID, EBML_BIN, 0, offsetof(MatroskaTrackEncryption,key_id) },
512 { MATROSKA_ID_ENCODINGENCAESSETTINGS, EBML_NONE },
513 { MATROSKA_ID_ENCODINGSIGALGO, EBML_NONE },
514 { MATROSKA_ID_ENCODINGSIGHASHALGO, EBML_NONE },
515 { MATROSKA_ID_ENCODINGSIGKEYID, EBML_NONE },
516 { MATROSKA_ID_ENCODINGSIGNATURE, EBML_NONE },
Andreas Rheinhardtc1abd952019-05-16 22:30:06517 CHILD_OF(matroska_track_encoding)
Frank Galliganb8531032013-03-07 16:11:38518};
Andreas Rheinhardt9869e212019-07-18 19:07:20519static EbmlSyntax matroska_track_encoding[] = {
Keiji Costantini84cfce92014-03-01 16:28:15520 { MATROSKA_ID_ENCODINGSCOPE, EBML_UINT, 0, offsetof(MatroskaTrackEncoding, scope), { .u = 1 } },
521 { MATROSKA_ID_ENCODINGTYPE, EBML_UINT, 0, offsetof(MatroskaTrackEncoding, type), { .u = 0 } },
522 { MATROSKA_ID_ENCODINGCOMPRESSION, EBML_NEST, 0, offsetof(MatroskaTrackEncoding, compression), { .n = matroska_track_encoding_compression } },
Michael Niedermayerb3d9ab12014-03-07 22:46:37523 { MATROSKA_ID_ENCODINGENCRYPTION, EBML_NEST, 0, offsetof(MatroskaTrackEncoding, encryption), { .n = matroska_track_encoding_encryption } },
Keiji Costantini84cfce92014-03-01 16:28:15524 { MATROSKA_ID_ENCODINGORDER, EBML_NONE },
Andreas Rheinhardtc1abd952019-05-16 22:30:06525 CHILD_OF(matroska_track_encodings)
Aurelien Jacobs2cbc8812008-08-05 00:40:31526};
527
Andreas Rheinhardt9869e212019-07-18 19:07:20528static EbmlSyntax matroska_track_encodings[] = {
Keiji Costantini84cfce92014-03-01 16:28:15529 { MATROSKA_ID_TRACKCONTENTENCODING, EBML_NEST, sizeof(MatroskaTrackEncoding), offsetof(MatroskaTrack, encodings), { .n = matroska_track_encoding } },
Andreas Rheinhardtc1abd952019-05-16 22:30:06530 CHILD_OF(matroska_track)
Aurelien Jacobs2cbc8812008-08-05 00:40:31531};
532
Andreas Rheinhardt9869e212019-07-18 19:07:20533static EbmlSyntax matroska_track_plane[] = {
Kirill Gavrilove6ec9212011-05-21 15:14:14534 { MATROSKA_ID_TRACKPLANEUID, EBML_UINT, 0, offsetof(MatroskaTrackPlane,uid) },
535 { MATROSKA_ID_TRACKPLANETYPE, EBML_UINT, 0, offsetof(MatroskaTrackPlane,type) },
Andreas Rheinhardtc1abd952019-05-16 22:30:06536 CHILD_OF(matroska_track_combine_planes)
Kirill Gavrilove6ec9212011-05-21 15:14:14537};
538
Andreas Rheinhardt9869e212019-07-18 19:07:20539static EbmlSyntax matroska_track_combine_planes[] = {
Michael Niedermayerb3d9ab12014-03-07 22:46:37540 { MATROSKA_ID_TRACKPLANE, EBML_NEST, sizeof(MatroskaTrackPlane), offsetof(MatroskaTrackOperation,combine_planes), {.n = matroska_track_plane} },
Andreas Rheinhardtc1abd952019-05-16 22:30:06541 CHILD_OF(matroska_track_operation)
Kirill Gavrilove6ec9212011-05-21 15:14:14542};
543
Andreas Rheinhardt9869e212019-07-18 19:07:20544static EbmlSyntax matroska_track_operation[] = {
Michael Niedermayerb3d9ab12014-03-07 22:46:37545 { MATROSKA_ID_TRACKCOMBINEPLANES, EBML_NEST, 0, 0, {.n = matroska_track_combine_planes} },
Andreas Rheinhardtc1abd952019-05-16 22:30:06546 CHILD_OF(matroska_track)
Kirill Gavrilove6ec9212011-05-21 15:14:14547};
548
Andreas Rheinhardt9869e212019-07-18 19:07:20549static EbmlSyntax matroska_track[] = {
Keiji Costantini84cfce92014-03-01 16:28:15550 { MATROSKA_ID_TRACKNUMBER, EBML_UINT, 0, offsetof(MatroskaTrack, num) },
551 { MATROSKA_ID_TRACKNAME, EBML_UTF8, 0, offsetof(MatroskaTrack, name) },
552 { MATROSKA_ID_TRACKUID, EBML_UINT, 0, offsetof(MatroskaTrack, uid) },
553 { MATROSKA_ID_TRACKTYPE, EBML_UINT, 0, offsetof(MatroskaTrack, type) },
554 { MATROSKA_ID_CODECID, EBML_STR, 0, offsetof(MatroskaTrack, codec_id) },
555 { MATROSKA_ID_CODECPRIVATE, EBML_BIN, 0, offsetof(MatroskaTrack, codec_priv) },
Anton Khirnoveb3b5502014-04-29 10:03:13556 { MATROSKA_ID_CODECDELAY, EBML_UINT, 0, offsetof(MatroskaTrack, codec_delay) },
Steve Lhommeb5dd9642020-03-22 08:59:26557 { MATROSKA_ID_TRACKLANGUAGE, EBML_STR, 0, offsetof(MatroskaTrack, language), { .s = "eng" } },
Keiji Costantini84cfce92014-03-01 16:28:15558 { MATROSKA_ID_TRACKDEFAULTDURATION, EBML_UINT, 0, offsetof(MatroskaTrack, default_duration) },
Michael Niedermayerb3d9ab12014-03-07 22:46:37559 { MATROSKA_ID_TRACKTIMECODESCALE, EBML_FLOAT, 0, offsetof(MatroskaTrack, time_scale), { .f = 1.0 } },
560 { MATROSKA_ID_TRACKFLAGDEFAULT, EBML_UINT, 0, offsetof(MatroskaTrack, flag_default), { .u = 1 } },
561 { MATROSKA_ID_TRACKFLAGFORCED, EBML_UINT, 0, offsetof(MatroskaTrack, flag_forced), { .u = 0 } },
Keiji Costantini84cfce92014-03-01 16:28:15562 { MATROSKA_ID_TRACKVIDEO, EBML_NEST, 0, offsetof(MatroskaTrack, video), { .n = matroska_track_video } },
563 { MATROSKA_ID_TRACKAUDIO, EBML_NEST, 0, offsetof(MatroskaTrack, audio), { .n = matroska_track_audio } },
Michael Niedermayerb3d9ab12014-03-07 22:46:37564 { MATROSKA_ID_TRACKOPERATION, EBML_NEST, 0, offsetof(MatroskaTrack, operation), { .n = matroska_track_operation } },
Keiji Costantini84cfce92014-03-01 16:28:15565 { MATROSKA_ID_TRACKCONTENTENCODINGS, EBML_NEST, 0, 0, { .n = matroska_track_encodings } },
Michael Niedermayerb3d9ab12014-03-07 22:46:37566 { MATROSKA_ID_TRACKMAXBLKADDID, EBML_UINT, 0, offsetof(MatroskaTrack, max_block_additional_id) },
Michael Niedermayerb3d9ab12014-03-07 22:46:37567 { MATROSKA_ID_SEEKPREROLL, EBML_UINT, 0, offsetof(MatroskaTrack, seek_preroll) },
Keiji Costantini84cfce92014-03-01 16:28:15568 { MATROSKA_ID_TRACKFLAGENABLED, EBML_NONE },
569 { MATROSKA_ID_TRACKFLAGLACING, EBML_NONE },
570 { MATROSKA_ID_CODECNAME, EBML_NONE },
571 { MATROSKA_ID_CODECDECODEALL, EBML_NONE },
572 { MATROSKA_ID_CODECINFOURL, EBML_NONE },
573 { MATROSKA_ID_CODECDOWNLOADURL, EBML_NONE },
574 { MATROSKA_ID_TRACKMINCACHE, EBML_NONE },
575 { MATROSKA_ID_TRACKMAXCACHE, EBML_NONE },
Andreas Rheinhardtc1abd952019-05-16 22:30:06576 CHILD_OF(matroska_tracks)
Aurelien Jacobs2cbc8812008-08-05 00:40:31577};
578
Andreas Rheinhardt9869e212019-07-18 19:07:20579static EbmlSyntax matroska_tracks[] = {
Keiji Costantini84cfce92014-03-01 16:28:15580 { MATROSKA_ID_TRACKENTRY, EBML_NEST, sizeof(MatroskaTrack), offsetof(MatroskaDemuxContext, tracks), { .n = matroska_track } },
Andreas Rheinhardtc1abd952019-05-16 22:30:06581 CHILD_OF(matroska_segment)
Aurelien Jacobs2cbc8812008-08-05 00:40:31582};
583
Andreas Rheinhardt9869e212019-07-18 19:07:20584static EbmlSyntax matroska_attachment[] = {
Diego Biurrunf69befe2014-03-07 12:54:18585 { MATROSKA_ID_FILEUID, EBML_UINT, 0, offsetof(MatroskaAttachment, uid) },
586 { MATROSKA_ID_FILENAME, EBML_UTF8, 0, offsetof(MatroskaAttachment, filename) },
587 { MATROSKA_ID_FILEMIMETYPE, EBML_STR, 0, offsetof(MatroskaAttachment, mime) },
588 { MATROSKA_ID_FILEDATA, EBML_BIN, 0, offsetof(MatroskaAttachment, bin) },
Keiji Costantini84cfce92014-03-01 16:28:15589 { MATROSKA_ID_FILEDESC, EBML_NONE },
Andreas Rheinhardtc1abd952019-05-16 22:30:06590 CHILD_OF(matroska_attachments)
Aurelien Jacobsb414cb82008-08-05 00:40:24591};
592
Andreas Rheinhardt9869e212019-07-18 19:07:20593static EbmlSyntax matroska_attachments[] = {
Diego Biurrunf69befe2014-03-07 12:54:18594 { MATROSKA_ID_ATTACHEDFILE, EBML_NEST, sizeof(MatroskaAttachment), offsetof(MatroskaDemuxContext, attachments), { .n = matroska_attachment } },
Andreas Rheinhardtc1abd952019-05-16 22:30:06595 CHILD_OF(matroska_segment)
Aurelien Jacobsb414cb82008-08-05 00:40:24596};
597
Andreas Rheinhardt9869e212019-07-18 19:07:20598static EbmlSyntax matroska_chapter_display[] = {
Rodger Combscf2719a2015-09-20 14:34:05599 { MATROSKA_ID_CHAPSTRING, EBML_UTF8, 0, offsetof(MatroskaChapter, title) },
600 { MATROSKA_ID_CHAPLANG, EBML_NONE },
601 { MATROSKA_ID_CHAPCOUNTRY, EBML_NONE },
Andreas Rheinhardtc1abd952019-05-16 22:30:06602 CHILD_OF(matroska_chapter_entry)
Aurelien Jacobs6bbd7c72008-08-05 00:40:21603};
604
Andreas Rheinhardt9869e212019-07-18 19:07:20605static EbmlSyntax matroska_chapter_entry[] = {
Keiji Costantini84cfce92014-03-01 16:28:15606 { MATROSKA_ID_CHAPTERTIMESTART, EBML_UINT, 0, offsetof(MatroskaChapter, start), { .u = AV_NOPTS_VALUE } },
607 { MATROSKA_ID_CHAPTERTIMEEND, EBML_UINT, 0, offsetof(MatroskaChapter, end), { .u = AV_NOPTS_VALUE } },
608 { MATROSKA_ID_CHAPTERUID, EBML_UINT, 0, offsetof(MatroskaChapter, uid) },
609 { MATROSKA_ID_CHAPTERDISPLAY, EBML_NEST, 0, 0, { .n = matroska_chapter_display } },
Aurelien Jacobs6bbd7c72008-08-05 00:40:21610 { MATROSKA_ID_CHAPTERFLAGHIDDEN, EBML_NONE },
Aurelien Jacobs5df3cc62008-08-13 21:15:15611 { MATROSKA_ID_CHAPTERFLAGENABLED, EBML_NONE },
612 { MATROSKA_ID_CHAPTERPHYSEQUIV, EBML_NONE },
613 { MATROSKA_ID_CHAPTERATOM, EBML_NONE },
Andreas Rheinhardtc1abd952019-05-16 22:30:06614 CHILD_OF(matroska_chapter)
Aurelien Jacobs6bbd7c72008-08-05 00:40:21615};
616
Andreas Rheinhardt9869e212019-07-18 19:07:20617static EbmlSyntax matroska_chapter[] = {
Keiji Costantini84cfce92014-03-01 16:28:15618 { MATROSKA_ID_CHAPTERATOM, EBML_NEST, sizeof(MatroskaChapter), offsetof(MatroskaDemuxContext, chapters), { .n = matroska_chapter_entry } },
Aurelien Jacobs6bbd7c72008-08-05 00:40:21619 { MATROSKA_ID_EDITIONUID, EBML_NONE },
620 { MATROSKA_ID_EDITIONFLAGHIDDEN, EBML_NONE },
621 { MATROSKA_ID_EDITIONFLAGDEFAULT, EBML_NONE },
Aurelien Jacobs5df3cc62008-08-13 21:15:15622 { MATROSKA_ID_EDITIONFLAGORDERED, EBML_NONE },
Andreas Rheinhardtc1abd952019-05-16 22:30:06623 CHILD_OF(matroska_chapters)
Aurelien Jacobs6bbd7c72008-08-05 00:40:21624};
625
Andreas Rheinhardt9869e212019-07-18 19:07:20626static EbmlSyntax matroska_chapters[] = {
Keiji Costantini84cfce92014-03-01 16:28:15627 { MATROSKA_ID_EDITIONENTRY, EBML_NEST, 0, 0, { .n = matroska_chapter } },
Andreas Rheinhardtc1abd952019-05-16 22:30:06628 CHILD_OF(matroska_segment)
Aurelien Jacobs6bbd7c72008-08-05 00:40:21629};
630
Andreas Rheinhardt9869e212019-07-18 19:07:20631static EbmlSyntax matroska_index_pos[] = {
Keiji Costantini84cfce92014-03-01 16:28:15632 { MATROSKA_ID_CUETRACK, EBML_UINT, 0, offsetof(MatroskaIndexPos, track) },
633 { MATROSKA_ID_CUECLUSTERPOSITION, EBML_UINT, 0, offsetof(MatroskaIndexPos, pos) },
James Almer5ab7b3b2013-09-15 09:32:36634 { MATROSKA_ID_CUERELATIVEPOSITION,EBML_NONE },
James Almer56f17402013-09-21 01:15:49635 { MATROSKA_ID_CUEDURATION, EBML_NONE },
Aurelien Jacobs5df3cc62008-08-13 21:15:15636 { MATROSKA_ID_CUEBLOCKNUMBER, EBML_NONE },
Andreas Rheinhardtc1abd952019-05-16 22:30:06637 CHILD_OF(matroska_index_entry)
Aurelien Jacobse5929fd2008-08-05 00:40:15638};
639
Andreas Rheinhardt9869e212019-07-18 19:07:20640static EbmlSyntax matroska_index_entry[] = {
Keiji Costantini84cfce92014-03-01 16:28:15641 { MATROSKA_ID_CUETIME, EBML_UINT, 0, offsetof(MatroskaIndex, time) },
642 { MATROSKA_ID_CUETRACKPOSITION, EBML_NEST, sizeof(MatroskaIndexPos), offsetof(MatroskaIndex, pos), { .n = matroska_index_pos } },
Andreas Rheinhardtc1abd952019-05-16 22:30:06643 CHILD_OF(matroska_index)
Aurelien Jacobse5929fd2008-08-05 00:40:15644};
645
Andreas Rheinhardt9869e212019-07-18 19:07:20646static EbmlSyntax matroska_index[] = {
Keiji Costantini84cfce92014-03-01 16:28:15647 { MATROSKA_ID_POINTENTRY, EBML_NEST, sizeof(MatroskaIndex), offsetof(MatroskaDemuxContext, index), { .n = matroska_index_entry } },
Andreas Rheinhardtc1abd952019-05-16 22:30:06648 CHILD_OF(matroska_segment)
Aurelien Jacobse5929fd2008-08-05 00:40:15649};
650
Andreas Rheinhardt9869e212019-07-18 19:07:20651static EbmlSyntax matroska_simpletag[] = {
Keiji Costantini84cfce92014-03-01 16:28:15652 { MATROSKA_ID_TAGNAME, EBML_UTF8, 0, offsetof(MatroskaTag, name) },
653 { MATROSKA_ID_TAGSTRING, EBML_UTF8, 0, offsetof(MatroskaTag, string) },
654 { MATROSKA_ID_TAGLANG, EBML_STR, 0, offsetof(MatroskaTag, lang), { .s = "und" } },
655 { MATROSKA_ID_TAGDEFAULT, EBML_UINT, 0, offsetof(MatroskaTag, def) },
656 { MATROSKA_ID_TAGDEFAULT_BUG, EBML_UINT, 0, offsetof(MatroskaTag, def) },
657 { MATROSKA_ID_SIMPLETAG, EBML_NEST, sizeof(MatroskaTag), offsetof(MatroskaTag, sub), { .n = matroska_simpletag } },
Andreas Rheinhardtc1abd952019-05-16 22:30:06658 CHILD_OF(matroska_tag)
Aurelien Jacobs44015c52008-08-08 23:50:38659};
660
Andreas Rheinhardt9869e212019-07-18 19:07:20661static EbmlSyntax matroska_tagtargets[] = {
Keiji Costantini84cfce92014-03-01 16:28:15662 { MATROSKA_ID_TAGTARGETS_TYPE, EBML_STR, 0, offsetof(MatroskaTagTarget, type) },
663 { MATROSKA_ID_TAGTARGETS_TYPEVALUE, EBML_UINT, 0, offsetof(MatroskaTagTarget, typevalue), { .u = 50 } },
664 { MATROSKA_ID_TAGTARGETS_TRACKUID, EBML_UINT, 0, offsetof(MatroskaTagTarget, trackuid) },
665 { MATROSKA_ID_TAGTARGETS_CHAPTERUID, EBML_UINT, 0, offsetof(MatroskaTagTarget, chapteruid) },
666 { MATROSKA_ID_TAGTARGETS_ATTACHUID, EBML_UINT, 0, offsetof(MatroskaTagTarget, attachuid) },
Andreas Rheinhardtc1abd952019-05-16 22:30:06667 CHILD_OF(matroska_tag)
Aurelien Jacobs929e9de2009-02-15 15:53:55668};
669
Andreas Rheinhardt9869e212019-07-18 19:07:20670static EbmlSyntax matroska_tag[] = {
Keiji Costantini84cfce92014-03-01 16:28:15671 { MATROSKA_ID_SIMPLETAG, EBML_NEST, sizeof(MatroskaTag), offsetof(MatroskaTags, tag), { .n = matroska_simpletag } },
672 { MATROSKA_ID_TAGTARGETS, EBML_NEST, 0, offsetof(MatroskaTags, target), { .n = matroska_tagtargets } },
Andreas Rheinhardtc1abd952019-05-16 22:30:06673 CHILD_OF(matroska_tags)
Aurelien Jacobs44015c52008-08-08 23:50:38674};
675
Andreas Rheinhardt9869e212019-07-18 19:07:20676static EbmlSyntax matroska_tags[] = {
Keiji Costantini84cfce92014-03-01 16:28:15677 { MATROSKA_ID_TAG, EBML_NEST, sizeof(MatroskaTags), offsetof(MatroskaDemuxContext, tags), { .n = matroska_tag } },
Andreas Rheinhardtc1abd952019-05-16 22:30:06678 CHILD_OF(matroska_segment)
Aurelien Jacobs434d4962008-08-05 00:40:18679};
680
Andreas Rheinhardt9869e212019-07-18 19:07:20681static EbmlSyntax matroska_seekhead_entry[] = {
Keiji Costantini84cfce92014-03-01 16:28:15682 { MATROSKA_ID_SEEKID, EBML_UINT, 0, offsetof(MatroskaSeekhead, id) },
683 { MATROSKA_ID_SEEKPOSITION, EBML_UINT, 0, offsetof(MatroskaSeekhead, pos), { .u = -1 } },
Andreas Rheinhardtc1abd952019-05-16 22:30:06684 CHILD_OF(matroska_seekhead)
Aurelien Jacobs13b350a2008-08-05 00:40:36685};
686
Andreas Rheinhardt9869e212019-07-18 19:07:20687static EbmlSyntax matroska_seekhead[] = {
Keiji Costantini84cfce92014-03-01 16:28:15688 { MATROSKA_ID_SEEKENTRY, EBML_NEST, sizeof(MatroskaSeekhead), offsetof(MatroskaDemuxContext, seekhead), { .n = matroska_seekhead_entry } },
Andreas Rheinhardtc1abd952019-05-16 22:30:06689 CHILD_OF(matroska_segment)
Aurelien Jacobs13b350a2008-08-05 00:40:36690};
691
Andreas Rheinhardt9869e212019-07-18 19:07:20692static EbmlSyntax matroska_segment[] = {
Andreas Rheinhardt71c90882019-05-16 22:30:18693 { MATROSKA_ID_CLUSTER, EBML_STOP },
wm4cac22952015-02-09 19:39:00694 { MATROSKA_ID_INFO, EBML_LEVEL1, 0, 0, { .n = matroska_info } },
695 { MATROSKA_ID_TRACKS, EBML_LEVEL1, 0, 0, { .n = matroska_tracks } },
696 { MATROSKA_ID_ATTACHMENTS, EBML_LEVEL1, 0, 0, { .n = matroska_attachments } },
697 { MATROSKA_ID_CHAPTERS, EBML_LEVEL1, 0, 0, { .n = matroska_chapters } },
698 { MATROSKA_ID_CUES, EBML_LEVEL1, 0, 0, { .n = matroska_index } },
699 { MATROSKA_ID_TAGS, EBML_LEVEL1, 0, 0, { .n = matroska_tags } },
700 { MATROSKA_ID_SEEKHEAD, EBML_LEVEL1, 0, 0, { .n = matroska_seekhead } },
Andreas Rheinhardtc1abd952019-05-16 22:30:06701 { 0 } /* We don't want to go back to level 0, so don't add the parent. */
Aurelien Jacobsce6f28b2008-08-05 00:40:58702};
703
Andreas Rheinhardt9869e212019-07-18 19:07:20704static EbmlSyntax matroska_segments[] = {
Keiji Costantini84cfce92014-03-01 16:28:15705 { MATROSKA_ID_SEGMENT, EBML_NEST, 0, 0, { .n = matroska_segment } },
Aurelien Jacobsce6f28b2008-08-05 00:40:58706 { 0 }
707};
708
Andreas Rheinhardt9869e212019-07-18 19:07:20709static EbmlSyntax matroska_blockmore[] = {
Andreas Rheinhardtdbc50f82019-11-20 12:26:59710 { MATROSKA_ID_BLOCKADDID, EBML_UINT, 0, offsetof(MatroskaBlock,additional_id), { .u = 1 } },
Vignesh Venkatasubramanian30c5c452013-02-13 21:51:48711 { MATROSKA_ID_BLOCKADDITIONAL, EBML_BIN, 0, offsetof(MatroskaBlock,additional) },
Andreas Rheinhardtc1abd952019-05-16 22:30:06712 CHILD_OF(matroska_blockadditions)
Vignesh Venkatasubramanian30c5c452013-02-13 21:51:48713};
714
Andreas Rheinhardt9869e212019-07-18 19:07:20715static EbmlSyntax matroska_blockadditions[] = {
Michael Niedermayerb3d9ab12014-03-07 22:46:37716 { MATROSKA_ID_BLOCKMORE, EBML_NEST, 0, 0, {.n = matroska_blockmore} },
Andreas Rheinhardtc1abd952019-05-16 22:30:06717 CHILD_OF(matroska_blockgroup)
Vignesh Venkatasubramanian30c5c452013-02-13 21:51:48718};
719
Andreas Rheinhardt9869e212019-07-18 19:07:20720static EbmlSyntax matroska_blockgroup[] = {
Keiji Costantini84cfce92014-03-01 16:28:15721 { MATROSKA_ID_BLOCK, EBML_BIN, 0, offsetof(MatroskaBlock, bin) },
Michael Niedermayerb3d9ab12014-03-07 22:46:37722 { MATROSKA_ID_BLOCKADDITIONS, EBML_NEST, 0, 0, { .n = matroska_blockadditions} },
Michael Niedermayerb3d9ab12014-03-07 22:46:37723 { MATROSKA_ID_BLOCKDURATION, EBML_UINT, 0, offsetof(MatroskaBlock, duration) },
724 { MATROSKA_ID_DISCARDPADDING, EBML_SINT, 0, offsetof(MatroskaBlock, discard_padding) },
Chris Cunninghamac258402017-02-03 22:42:44725 { MATROSKA_ID_BLOCKREFERENCE, EBML_SINT, 0, offsetof(MatroskaBlock, reference), { .i = INT64_MIN } },
Anton Khirnov564b7e02013-05-15 13:48:15726 { MATROSKA_ID_CODECSTATE, EBML_NONE },
Keiji Costantini84cfce92014-03-01 16:28:15727 { 1, EBML_UINT, 0, offsetof(MatroskaBlock, non_simple), { .u = 1 } },
Andreas Rheinhardtc1abd952019-05-16 22:30:06728 CHILD_OF(matroska_cluster_parsing)
Aurelien Jacobs209472b2008-08-05 00:41:05729};
730
Andreas Rheinhardt38255cd2019-05-16 22:30:10731// The following array contains SimpleBlock and BlockGroup twice
732// in order to reuse the other values for matroska_cluster_enter.
Andreas Rheinhardt9869e212019-07-18 19:07:20733static EbmlSyntax matroska_cluster_parsing[] = {
Andreas Rheinhardtbc3306f2019-05-16 22:30:00734 { MATROSKA_ID_SIMPLEBLOCK, EBML_BIN, 0, offsetof(MatroskaBlock, bin) },
Andreas Rheinhardt38255cd2019-05-16 22:30:10735 { MATROSKA_ID_BLOCKGROUP, EBML_NEST, 0, 0, { .n = matroska_blockgroup } },
Keiji Costantini84cfce92014-03-01 16:28:15736 { MATROSKA_ID_CLUSTERTIMECODE, EBML_UINT, 0, offsetof(MatroskaCluster, timecode) },
Keiji Costantini84cfce92014-03-01 16:28:15737 { MATROSKA_ID_SIMPLEBLOCK, EBML_STOP },
Andreas Rheinhardt38255cd2019-05-16 22:30:10738 { MATROSKA_ID_BLOCKGROUP, EBML_STOP },
Keiji Costantini84cfce92014-03-01 16:28:15739 { MATROSKA_ID_CLUSTERPOSITION, EBML_NONE },
740 { MATROSKA_ID_CLUSTERPREVSIZE, EBML_NONE },
Andreas Rheinhardtc1abd952019-05-16 22:30:06741 CHILD_OF(matroska_segment)
Dale Curtis8336eb62012-04-19 18:12:24742};
743
Andreas Rheinhardt9869e212019-07-18 19:07:20744static EbmlSyntax matroska_cluster_enter[] = {
Andreas Rheinhardt38255cd2019-05-16 22:30:10745 { MATROSKA_ID_CLUSTER, EBML_NEST, 0, 0, { .n = &matroska_cluster_parsing[2] } },
Andreas Rheinhardt865c5372019-05-16 22:30:08746 { 0 }
747};
Andreas Rheinhardtc1abd952019-05-16 22:30:06748#undef CHILD_OF
Dale Curtis8336eb62012-04-19 18:12:24749
Andreas Rheinhardt67e957b2020-04-16 01:39:05750static const CodecMime mkv_image_mime_tags[] = {
751 {"image/gif" , AV_CODEC_ID_GIF},
752 {"image/jpeg" , AV_CODEC_ID_MJPEG},
753 {"image/png" , AV_CODEC_ID_PNG},
754 {"image/tiff" , AV_CODEC_ID_TIFF},
755
756 {"" , AV_CODEC_ID_NONE}
757};
758
759static const CodecMime mkv_mime_tags[] = {
760 {"text/plain" , AV_CODEC_ID_TEXT},
761 {"application/x-truetype-font", AV_CODEC_ID_TTF},
762 {"application/x-font" , AV_CODEC_ID_TTF},
763 {"application/vnd.ms-opentype", AV_CODEC_ID_OTF},
764 {"binary" , AV_CODEC_ID_BIN_DATA},
765
766 {"" , AV_CODEC_ID_NONE}
767};
768
Alex Converseb0f29db2012-02-20 08:42:33769static const char *const matroska_doctypes[] = { "matroska", "webm" };
James Zern470491f2010-05-22 01:41:32770
Michael Niedermayerf573acc2016-06-24 16:26:46771static int matroska_read_close(AVFormatContext *s);
772
Andreas Rheinhardt310f3262019-05-16 22:30:02773/*
774 * This function prepares the status for parsing of level 1 elements.
775 */
776static int matroska_reset_status(MatroskaDemuxContext *matroska,
777 uint32_t id, int64_t position)
778{
779 if (position >= 0) {
Andreas Rheinhardtc294f382019-08-17 00:27:51780 int64_t err = avio_seek(matroska->ctx->pb, position, SEEK_SET);
Andreas Rheinhardt310f3262019-05-16 22:30:02781 if (err < 0)
782 return err;
783 }
784
Andreas Rheinhardt51203052019-05-16 22:30:14785 matroska->current_id = id;
786 matroska->num_levels = 1;
787 matroska->unknown_count = 0;
Andreas Rheinhardta3db9f62019-05-16 22:30:05788 matroska->resync_pos = avio_tell(matroska->ctx->pb);
789 if (id)
790 matroska->resync_pos -= (av_log2(id) + 7) / 8;
Andreas Rheinhardt310f3262019-05-16 22:30:02791
792 return 0;
793}
794
Reimar Döffingerd4931702012-02-13 22:06:19795static int matroska_resync(MatroskaDemuxContext *matroska, int64_t last_pos)
796{
797 AVIOContext *pb = matroska->ctx->pb;
798 uint32_t id;
Reimar Döffingerd4931702012-02-13 22:06:19799
Andreas Rheinhardt27f40b12019-05-16 22:30:01800 /* Try to seek to the last position to resync from. If this doesn't work,
801 * we resync from the earliest position available: The start of the buffer. */
802 if (last_pos < avio_tell(pb) && avio_seek(pb, last_pos + 1, SEEK_SET) < 0) {
803 av_log(matroska->ctx, AV_LOG_WARNING,
804 "Seek to desired resync point failed. Seeking to "
805 "earliest point available instead.\n");
806 avio_seek(pb, FFMAX(avio_tell(pb) + (pb->buffer - pb->buf_ptr),
807 last_pos + 1), SEEK_SET);
Sophia Wang8c830622016-09-27 19:00:29808 }
Reimar Döffingerd4931702012-02-13 22:06:19809
810 id = avio_rb32(pb);
811
812 // try to find a toplevel element
James Almerd34ec642014-08-07 20:12:41813 while (!avio_feof(pb)) {
Sean McGovern8835c552013-05-27 22:11:50814 if (id == MATROSKA_ID_INFO || id == MATROSKA_ID_TRACKS ||
815 id == MATROSKA_ID_CUES || id == MATROSKA_ID_TAGS ||
Reimar Döffingerd4931702012-02-13 22:06:19816 id == MATROSKA_ID_SEEKHEAD || id == MATROSKA_ID_ATTACHMENTS ||
Sean McGovern8835c552013-05-27 22:11:50817 id == MATROSKA_ID_CLUSTER || id == MATROSKA_ID_CHAPTERS) {
Andreas Rheinhardt8a286e72019-05-16 22:30:03818 /* Prepare the context for parsing of a level 1 element. */
819 matroska_reset_status(matroska, id, -1);
Michael Niedermayerfccc37c2019-08-28 17:04:42820 /* Given that we are here means that an error has occurred,
Andreas Rheinhardt8a286e72019-05-16 22:30:03821 * so treat the segment as unknown length in order not to
822 * discard valid data that happens to be beyond the designated
823 * end of the segment. */
824 matroska->levels[0].length = EBML_UNKNOWN_LENGTH;
Keiji Costantini84cfce92014-03-01 16:28:15825 return 0;
Reimar Döffingerd4931702012-02-13 22:06:19826 }
827 id = (id << 8) | avio_r8(pb);
828 }
Keiji Costantini84cfce92014-03-01 16:28:15829
Reimar Döffingerd4931702012-02-13 22:06:19830 matroska->done = 1;
Andreas Rheinhardt27f40b12019-05-16 22:30:01831 return pb->error ? pb->error : AVERROR_EOF;
Reimar Döffingerd4931702012-02-13 22:06:19832}
833
David Conradb061d892007-06-04 22:10:54834/*
David Conradb061d892007-06-04 22:10:54835 * Read: an "EBML number", which is defined as a variable-length
836 * array of bytes. The first byte indicates the length by giving a
837 * number of 0-bits followed by a one. The position of the first
838 * "one" bit inside the first byte indicates the length of this
839 * number.
Diego Biurrun5968d2d2008-08-05 08:28:57840 * Returns: number of bytes read, < 0 on error
David Conradb061d892007-06-04 22:10:54841 */
Anton Khirnov471fe572011-02-20 10:04:12842static int ebml_read_num(MatroskaDemuxContext *matroska, AVIOContext *pb,
Andreas Rheinhardt239c7362019-06-25 01:08:56843 int max_size, uint64_t *number, int eof_forbidden)
David Conradb061d892007-06-04 22:10:54844{
Andreas Rheinhardt239c7362019-06-25 01:08:56845 int read, n = 1;
846 uint64_t total;
847 int64_t pos;
David Conradb061d892007-06-04 22:10:54848
Andreas Rheinhardt239c7362019-06-25 01:08:56849 /* The first byte tells us the length in bytes - except when it is zero. */
850 total = avio_r8(pb);
851 if (pb->eof_reached)
852 goto err;
David Conradb061d892007-06-04 22:10:54853
854 /* get the length of the EBML number */
Reimar Döffingerff6a5fc2010-09-02 19:17:46855 read = 8 - ff_log2_tab[total];
Andreas Rheinhardt239c7362019-06-25 01:08:56856
857 if (!total || read > max_size) {
858 pos = avio_tell(pb) - 1;
859 if (!total) {
860 av_log(matroska->ctx, AV_LOG_ERROR,
861 "0x00 at pos %"PRId64" (0x%"PRIx64") invalid as first byte "
862 "of an EBML number\n", pos, pos);
863 } else {
864 av_log(matroska->ctx, AV_LOG_ERROR,
865 "Length %d indicated by an EBML number's first byte 0x%02x "
866 "at pos %"PRId64" (0x%"PRIx64") exceeds max length %d.\n",
867 read, (uint8_t) total, pos, pos, max_size);
868 }
David Conradb061d892007-06-04 22:10:54869 return AVERROR_INVALIDDATA;
870 }
871
872 /* read out length */
Reimar Döffingerff6a5fc2010-09-02 19:17:46873 total ^= 1 << ff_log2_tab[total];
David Conradb061d892007-06-04 22:10:54874 while (n++ < read)
Anton Khirnove63a3622011-02-21 15:43:01875 total = (total << 8) | avio_r8(pb);
David Conradb061d892007-06-04 22:10:54876
Andreas Rheinhardt239c7362019-06-25 01:08:56877 if (pb->eof_reached) {
878 eof_forbidden = 1;
879 goto err;
880 }
881
David Conradb061d892007-06-04 22:10:54882 *number = total;
883
884 return read;
Andreas Rheinhardt239c7362019-06-25 01:08:56885
886err:
887 pos = avio_tell(pb);
888 if (pb->error) {
889 av_log(matroska->ctx, AV_LOG_ERROR,
890 "Read error at pos. %"PRIu64" (0x%"PRIx64")\n",
891 pos, pos);
892 return pb->error;
893 }
894 if (eof_forbidden) {
895 av_log(matroska->ctx, AV_LOG_ERROR, "File ended prematurely "
896 "at pos. %"PRIu64" (0x%"PRIx64")\n", pos, pos);
897 return AVERROR(EIO);
898 }
899 return AVERROR_EOF;
David Conradb061d892007-06-04 22:10:54900}
901
Reimar Döffinger1b4d3272010-09-06 17:51:44902/**
903 * Read a EBML length value.
904 * This needs special handling for the "unknown length" case which has multiple
905 * encodings.
906 */
Anton Khirnov471fe572011-02-20 10:04:12907static int ebml_read_length(MatroskaDemuxContext *matroska, AVIOContext *pb,
Reimar Döffinger1b4d3272010-09-06 17:51:44908 uint64_t *number)
909{
Andreas Rheinhardt239c7362019-06-25 01:08:56910 int res = ebml_read_num(matroska, pb, 8, number, 1);
Reimar Döffinger1b4d3272010-09-06 17:51:44911 if (res > 0 && *number + 1 == 1ULL << (7 * res))
Steve Lhommea2c77022019-02-23 10:14:33912 *number = EBML_UNKNOWN_LENGTH;
Reimar Döffinger1b4d3272010-09-06 17:51:44913 return res;
914}
915
David Conradb061d892007-06-04 22:10:54916/*
David Conradb061d892007-06-04 22:10:54917 * Read the next element as an unsigned int.
Andreas Rheinhardta569a7b2019-06-23 23:42:30918 * Returns NEEDS_CHECKING.
David Conradb061d892007-06-04 22:10:54919 */
Anton Khirnov471fe572011-02-20 10:04:12920static int ebml_read_uint(AVIOContext *pb, int size, uint64_t *num)
David Conradb061d892007-06-04 22:10:54921{
Aurelien Jacobsc6cd2b32008-08-05 00:41:55922 int n = 0;
David Conradb061d892007-06-04 22:10:54923
Diego Biurrun5968d2d2008-08-05 08:28:57924 /* big-endian ordering; build up number */
David Conradb061d892007-06-04 22:10:54925 *num = 0;
926 while (n++ < size)
Anton Khirnove63a3622011-02-21 15:43:01927 *num = (*num << 8) | avio_r8(pb);
David Conradb061d892007-06-04 22:10:54928
Andreas Rheinhardta569a7b2019-06-23 23:42:30929 return NEEDS_CHECKING;
David Conradb061d892007-06-04 22:10:54930}
931
932/*
Jan Gerberd03eea32013-11-15 18:00:37933 * Read the next element as a signed int.
Andreas Rheinhardta569a7b2019-06-23 23:42:30934 * Returns NEEDS_CHECKING.
Jan Gerberd03eea32013-11-15 18:00:37935 */
936static int ebml_read_sint(AVIOContext *pb, int size, int64_t *num)
937{
938 int n = 1;
939
Jan Gerberd03eea32013-11-15 18:00:37940 if (size == 0) {
941 *num = 0;
942 } else {
Michael Niedermayercddd15b2013-11-15 20:30:30943 *num = sign_extend(avio_r8(pb), 8);
Jan Gerberd03eea32013-11-15 18:00:37944
945 /* big-endian ordering; build up number */
946 while (n++ < size)
Michael Niedermayer2f8c8162015-07-01 09:59:57947 *num = ((uint64_t)*num << 8) | avio_r8(pb);
Jan Gerberd03eea32013-11-15 18:00:37948 }
949
Andreas Rheinhardta569a7b2019-06-23 23:42:30950 return NEEDS_CHECKING;
Jan Gerberd03eea32013-11-15 18:00:37951}
952
953/*
David Conradb061d892007-06-04 22:10:54954 * Read the next element as a float.
Andreas Rheinhardta569a7b2019-06-23 23:42:30955 * Returns NEEDS_CHECKING or < 0 on obvious failure.
David Conradb061d892007-06-04 22:10:54956 */
Anton Khirnov471fe572011-02-20 10:04:12957static int ebml_read_float(AVIOContext *pb, int size, double *num)
David Conradb061d892007-06-04 22:10:54958{
Keiji Costantini84cfce92014-03-01 16:28:15959 if (size == 0)
Aurelien Jacobs4a194c82010-09-05 21:37:40960 *num = 0;
Keiji Costantini84cfce92014-03-01 16:28:15961 else if (size == 4)
Mans Rullgard3383a532011-11-27 14:04:16962 *num = av_int2float(avio_rb32(pb));
Keiji Costantini84cfce92014-03-01 16:28:15963 else if (size == 8)
Mans Rullgard3383a532011-11-27 14:04:16964 *num = av_int2double(avio_rb64(pb));
Keiji Costantini84cfce92014-03-01 16:28:15965 else
David Conradb061d892007-06-04 22:10:54966 return AVERROR_INVALIDDATA;
David Conradb061d892007-06-04 22:10:54967
Andreas Rheinhardta569a7b2019-06-23 23:42:30968 return NEEDS_CHECKING;
David Conradb061d892007-06-04 22:10:54969}
970
971/*
972 * Read the next element as an ASCII string.
Andreas Rheinhardta569a7b2019-06-23 23:42:30973 * 0 is success, < 0 or NEEDS_CHECKING is failure.
David Conradb061d892007-06-04 22:10:54974 */
Anton Khirnov471fe572011-02-20 10:04:12975static int ebml_read_ascii(AVIOContext *pb, int size, char **str)
David Conradb061d892007-06-04 22:10:54976{
Ronald S. Bultjecd40c312012-02-25 00:12:18977 char *res;
Andreas Rheinhardta569a7b2019-06-23 23:42:30978 int ret;
Ronald S. Bultjecd40c312012-02-25 00:12:18979
Diego Biurrun5968d2d2008-08-05 08:28:57980 /* EBML strings are usually not 0-terminated, so we allocate one
David Conradb061d892007-06-04 22:10:54981 * byte more, read the string and NULL-terminate it ourselves. */
Ronald S. Bultjecd40c312012-02-25 00:12:18982 if (!(res = av_malloc(size + 1)))
Panagiotis Issaris769e10f2007-07-19 15:21:30983 return AVERROR(ENOMEM);
Andreas Rheinhardta569a7b2019-06-23 23:42:30984 if ((ret = avio_read(pb, (uint8_t *) res, size)) != size) {
Ronald S. Bultjecd40c312012-02-25 00:12:18985 av_free(res);
Andreas Rheinhardta569a7b2019-06-23 23:42:30986 return ret < 0 ? ret : NEEDS_CHECKING;
David Conradb061d892007-06-04 22:10:54987 }
Ronald S. Bultjecd40c312012-02-25 00:12:18988 (res)[size] = '\0';
989 av_free(*str);
990 *str = res;
David Conradb061d892007-06-04 22:10:54991
992 return 0;
993}
994
995/*
Aurelien Jacobs737c40d2008-08-05 00:42:39996 * Read the next element as binary data.
Andreas Rheinhardta569a7b2019-06-23 23:42:30997 * 0 is success, < 0 or NEEDS_CHECKING is failure.
Aurelien Jacobs737c40d2008-08-05 00:42:39998 */
Andreas Rheinhardt7087fc92019-05-16 22:30:12999static int ebml_read_binary(AVIOContext *pb, int length,
1000 int64_t pos, EbmlBin *bin)
Aurelien Jacobs737c40d2008-08-05 00:42:391001{
James Almera6188662018-04-04 17:12:541002 int ret;
Aurelien Jacobs737c40d2008-08-05 00:42:391003
James Almera6188662018-04-04 17:12:541004 ret = av_buffer_realloc(&bin->buf, length + AV_INPUT_BUFFER_PADDING_SIZE);
1005 if (ret < 0)
1006 return ret;
1007 memset(bin->buf->data + length, 0, AV_INPUT_BUFFER_PADDING_SIZE);
1008
1009 bin->data = bin->buf->data;
Aurelien Jacobs737c40d2008-08-05 00:42:391010 bin->size = length;
Andreas Rheinhardt7087fc92019-05-16 22:30:121011 bin->pos = pos;
Andreas Rheinhardta569a7b2019-06-23 23:42:301012 if ((ret = avio_read(pb, bin->data, length)) != length) {
James Almera6188662018-04-04 17:12:541013 av_buffer_unref(&bin->buf);
1014 bin->data = NULL;
Michael Niedermayer5e1bacf2012-12-04 02:30:401015 bin->size = 0;
Andreas Rheinhardta569a7b2019-06-23 23:42:301016 return ret < 0 ? ret : NEEDS_CHECKING;
David Conrad5549aa62010-05-18 21:21:371017 }
Aurelien Jacobs737c40d2008-08-05 00:42:391018
1019 return 0;
1020}
1021
1022/*
David Conradb061d892007-06-04 22:10:541023 * Read the next element, but only the header. The contents
1024 * are supposed to be sub-elements which can be read separately.
1025 * 0 is success, < 0 is failure.
1026 */
Andreas Rheinhardt7087fc92019-05-16 22:30:121027static int ebml_read_master(MatroskaDemuxContext *matroska,
1028 uint64_t length, int64_t pos)
David Conradb061d892007-06-04 22:10:541029{
David Conradb061d892007-06-04 22:10:541030 MatroskaLevel *level;
David Conradb061d892007-06-04 22:10:541031
David Conradb061d892007-06-04 22:10:541032 if (matroska->num_levels >= EBML_MAX_DEPTH) {
1033 av_log(matroska->ctx, AV_LOG_ERROR,
1034 "File moves beyond max. allowed depth (%d)\n", EBML_MAX_DEPTH);
Panagiotis Issaris85565db2007-07-19 15:38:331035 return AVERROR(ENOSYS);
David Conradb061d892007-06-04 22:10:541036 }
1037
Keiji Costantini84cfce92014-03-01 16:28:151038 level = &matroska->levels[matroska->num_levels++];
Andreas Rheinhardt7087fc92019-05-16 22:30:121039 level->start = pos;
David Conradb061d892007-06-04 22:10:541040 level->length = length;
1041
1042 return 0;
1043}
1044
1045/*
Andreas Rheinhardtd5274f82019-12-03 17:09:101046 * Read a signed "EBML number"
Diego Biurrun5968d2d2008-08-05 08:28:571047 * Return: number of bytes processed, < 0 on error
David Conradb061d892007-06-04 22:10:541048 */
Aurelien Jacobsc1e01132008-08-05 00:42:521049static int matroska_ebmlnum_sint(MatroskaDemuxContext *matroska,
Andreas Rheinhardtd5274f82019-12-03 17:09:101050 AVIOContext *pb, int64_t *num)
David Conradb061d892007-06-04 22:10:541051{
1052 uint64_t unum;
1053 int res;
1054
1055 /* read as unsigned number first */
Andreas Rheinhardtd5274f82019-12-03 17:09:101056 if ((res = ebml_read_num(matroska, pb, 8, &unum, 1)) < 0)
David Conradb061d892007-06-04 22:10:541057 return res;
1058
1059 /* make signed (weird way) */
Keiji Costantini84cfce92014-03-01 16:28:151060 *num = unum - ((1LL << (7 * res - 1)) - 1);
David Conradb061d892007-06-04 22:10:541061
1062 return res;
1063}
1064
Andreas Rheinhardt559e3422019-05-16 22:30:041065static int ebml_parse(MatroskaDemuxContext *matroska,
1066 EbmlSyntax *syntax, void *data);
Aurelien Jacobs789ed102008-08-05 00:40:001067
Andreas Rheinhardt559e3422019-05-16 22:30:041068static EbmlSyntax *ebml_parse_id(EbmlSyntax *syntax, uint32_t id)
Aurelien Jacobs789ed102008-08-05 00:40:001069{
1070 int i;
Andreas Rheinhardt38255cd2019-05-16 22:30:101071
1072 // Whoever touches this should be aware of the duplication
1073 // existing in matroska_cluster_parsing.
Keiji Costantini84cfce92014-03-01 16:28:151074 for (i = 0; syntax[i].id; i++)
Aurelien Jacobs789ed102008-08-05 00:40:001075 if (id == syntax[i].id)
1076 break;
Aurelien Jacobs789ed102008-08-05 00:40:001077
Andreas Rheinhardt559e3422019-05-16 22:30:041078 return &syntax[i];
Aurelien Jacobs66a37e02008-08-05 00:42:171079}
1080
Aurelien Jacobs9bcb92c2008-08-05 00:42:131081static int ebml_parse_nest(MatroskaDemuxContext *matroska, EbmlSyntax *syntax,
Aurelien Jacobs6314cca2008-08-05 00:42:231082 void *data)
Aurelien Jacobs789ed102008-08-05 00:40:001083{
Andreas Rheinhardt68541272019-05-16 22:30:191084 int res;
Aurelien Jacobs789ed102008-08-05 00:40:001085
Andreas Rheinhardt71c90882019-05-16 22:30:181086 if (data) {
Andreas Rheinhardt68541272019-05-16 22:30:191087 for (int i = 0; syntax[i].id; i++)
1088 switch (syntax[i].type) {
1089 case EBML_UINT:
1090 *(uint64_t *) ((char *) data + syntax[i].data_offset) = syntax[i].def.u;
1091 break;
1092 case EBML_SINT:
1093 *(int64_t *) ((char *) data + syntax[i].data_offset) = syntax[i].def.i;
1094 break;
1095 case EBML_FLOAT:
1096 *(double *) ((char *) data + syntax[i].data_offset) = syntax[i].def.f;
1097 break;
1098 case EBML_STR:
1099 case EBML_UTF8:
1100 // the default may be NULL
1101 if (syntax[i].def.s) {
1102 uint8_t **dst = (uint8_t **) ((uint8_t *) data + syntax[i].data_offset);
1103 *dst = av_strdup(syntax[i].def.s);
1104 if (!*dst)
1105 return AVERROR(ENOMEM);
1106 }
1107 break;
Anton Khirnov668643b2013-09-04 06:55:171108 }
Aurelien Jacobs789ed102008-08-05 00:40:001109
Andreas Rheinhardt68541272019-05-16 22:30:191110 if (!matroska->levels[matroska->num_levels - 1].length) {
1111 matroska->num_levels--;
1112 return 0;
1113 }
Andreas Rheinhardt71c90882019-05-16 22:30:181114 }
Aurelien Jacobs789ed102008-08-05 00:40:001115
Andreas Rheinhardtb31c9b72019-06-23 23:46:541116 do {
1117 res = ebml_parse(matroska, syntax, data);
1118 } while (!res);
1119
1120 return res == LEVEL_ENDED ? 0 : res;
Aurelien Jacobs789ed102008-08-05 00:40:001121}
1122
/**
 * Check whether id has the shape of an EBML element ID.
 *
 * Due to endian nonsense in Matroska, the highest byte with any bits set
 * will contain the leading length bit. This bit in turn identifies the
 * total byte length of the element by its position within the byte.
 * The ID is accepted when that length agrees with the position of the
 * highest set bit.
 *
 * @return nonzero if id is nonzero and consistent, 0 otherwise
 */
static int is_ebml_id_valid(uint32_t id)
{
    unsigned int msb, len_from_msb, len_from_marker;

    if (!id)
        return 0;

    msb             = av_log2(id);
    len_from_msb    = (msb + 7) / 8;
    len_from_marker = 8 - msb % 8;

    return len_from_msb == len_from_marker;
}
1131
wm4cac22952015-02-09 19:39:001132/*
1133 * Allocate and return the entry for the level1 element with the given ID. If
1134 * an entry already exists, return the existing entry.
1135 */
1136static MatroskaLevel1Element *matroska_find_level1_elem(MatroskaDemuxContext *matroska,
1137 uint32_t id)
1138{
1139 int i;
1140 MatroskaLevel1Element *elem;
1141
wm47e240f92015-06-12 11:11:411142 if (!is_ebml_id_valid(id))
1143 return NULL;
1144
wm4cac22952015-02-09 19:39:001145 // Some files link to all clusters; useless.
1146 if (id == MATROSKA_ID_CLUSTER)
1147 return NULL;
1148
1149 // There can be multiple seekheads.
1150 if (id != MATROSKA_ID_SEEKHEAD) {
1151 for (i = 0; i < matroska->num_level1_elems; i++) {
1152 if (matroska->level1_elems[i].id == id)
1153 return &matroska->level1_elems[i];
1154 }
1155 }
1156
1157 // Only a completely broken file would have more elements.
1158 // It also provides a low-effort way to escape from circular seekheads
1159 // (every iteration will add a level1 entry).
1160 if (matroska->num_level1_elems >= FF_ARRAY_ELEMS(matroska->level1_elems)) {
1161 av_log(matroska->ctx, AV_LOG_ERROR, "Too many level1 elements or circular seekheads.\n");
1162 return NULL;
1163 }
1164
1165 elem = &matroska->level1_elems[matroska->num_level1_elems++];
1166 *elem = (MatroskaLevel1Element){.id = id};
1167
1168 return elem;
1169}
1170
/*
 * Parse a single EBML element according to the given syntax table.
 *
 * Unless an ID is still pending in matroska->current_id, the element ID is
 * read first. The ID is looked up in syntax, the element length is read and
 * checked against the containing level and against the per-type maximum,
 * and the payload is then read into data (at the offset given by the syntax
 * entry) or skipped.
 *
 * If data is NULL and the length is known, the payload is skipped.
 *
 * Returns 0 if the element was handled and the current level continues,
 * LEVEL_ENDED if the current level has ended, 1 if an EBML_STOP entry was
 * hit or EOF was reached in live mode, and a negative error code otherwise.
 */
Andreas Rheinhardt559e3422019-05-16 22:30:041171static int ebml_parse(MatroskaDemuxContext *matroska,
1172 EbmlSyntax *syntax, void *data)
Aurelien Jacobs737c40d2008-08-05 00:42:391173{
Reimar Döffinger14d735b2011-02-06 10:32:031174 static const uint64_t max_lengths[EBML_TYPE_COUNT] = {
Andreas Rheinhardt04b62bd2019-05-16 22:30:151175 // Forbid unknown-length EBML_NONE elements.
1176 [EBML_NONE] = EBML_UNKNOWN_LENGTH - 1,
Reimar Döffinger14d735b2011-02-06 10:32:031177 [EBML_UINT] = 8,
Andreas Rheinhardte5ec1312019-05-16 22:29:501178 [EBML_SINT] = 8,
Reimar Döffinger14d735b2011-02-06 10:32:031179 [EBML_FLOAT] = 8,
1180 // max. 16 MB for strings
1181 [EBML_STR] = 0x1000000,
1182 [EBML_UTF8] = 0x1000000,
1183 // max. 256 MB for binary data
1184 [EBML_BIN] = 0x10000000,
1185 // no limits for anything else
1186 };
Anton Khirnov471fe572011-02-20 10:04:121187 AVIOContext *pb = matroska->ctx->pb;
Andreas Rheinhardt559e3422019-05-16 22:30:041188 uint32_t id;
Aurelien Jacobs737c40d2008-08-05 00:42:391189 uint64_t length;
Andreas Rheinhardt7087fc92019-05-16 22:30:121190 int64_t pos = avio_tell(pb), pos_alt;
Andreas Rheinhardtb31c9b72019-06-23 23:46:541191 int res, update_pos = 1, level_check;
wm4cac22952015-02-09 19:39:001192 MatroskaLevel1Element *level1_elem;
Andreas Rheinhardtb31c9b72019-06-23 23:46:541193 MatroskaLevel *level = matroska->num_levels ? &matroska->levels[matroska->num_levels - 1] : NULL;
Aurelien Jacobs737c40d2008-08-05 00:42:391194
    // No ID is pending from an earlier call: read the next element ID.
Andreas Rheinhardt559e3422019-05-16 22:30:041195 if (!matroska->current_id) {
1196 uint64_t id;
1197 res = ebml_read_num(matroska, pb, 4, &id, 0);
1198 if (res < 0) {
Andreas Rheinhardtb31c9b72019-06-23 23:46:541199 if (pb->eof_reached && res == AVERROR_EOF) {
1200 if (matroska->is_live)
1201 // in live mode, finish parsing if EOF is reached.
1202 return 1;
Andreas Rheinhardt3ed27552019-05-16 22:30:111203 if (level && pos == avio_tell(pb)) {
1204 if (level->length == EBML_UNKNOWN_LENGTH) {
1205 // Unknown-length levels automatically end at EOF.
1206 matroska->num_levels--;
1207 return LEVEL_ENDED;
1208 } else {
1209 av_log(matroska->ctx, AV_LOG_ERROR, "File ended prematurely "
1210 "at pos. %"PRIu64" (0x%"PRIx64")\n", pos, pos);
1211 }
Andreas Rheinhardtb31c9b72019-06-23 23:46:541212 }
1213 }
1214 return res;
Andreas Rheinhardt559e3422019-05-16 22:30:041215 }
1216 matroska->current_id = id | 1 << 7 * res;
Andreas Rheinhardt7087fc92019-05-16 22:30:121217 pos_alt = pos + res;
1218 } else {
    // The pending ID has already been consumed from the stream: pos_alt is
    // the current position and pos is moved back to where the ID started.
1219 pos_alt = pos;
1220 pos -= (av_log2(matroska->current_id) + 7) / 8;
1221 }
Andreas Rheinhardt559e3422019-05-16 22:30:041222
1223 id = matroska->current_id;
1224
1225 syntax = ebml_parse_id(syntax, id);
Andreas Rheinhardt559e3422019-05-16 22:30:041226 if (!syntax->id && id != EBML_ID_VOID && id != EBML_ID_CRC32) {
Andreas Rheinhardtb31c9b72019-06-23 23:46:541227 if (level && level->length == EBML_UNKNOWN_LENGTH) {
1228 // Unknown-length levels end when an element from an upper level
1229 // in the hierarchy is encountered.
1230 while (syntax->def.n) {
1231 syntax = ebml_parse_id(syntax->def.n, id);
1232 if (syntax->id) {
1233 matroska->num_levels--;
1234 return LEVEL_ENDED;
1235 }
1236 };
1237 }
1238
1239 av_log(matroska->ctx, AV_LOG_DEBUG, "Unknown entry 0x%"PRIX32" at pos. "
1240 "%"PRId64"\n", id, pos);
1241 update_pos = 0; /* Don't update resync_pos as an error might have happened. */
Andreas Rheinhardt559e3422019-05-16 22:30:041242 }
1243
    // Locate the destination field; for list-valued entries, append a new
    // zeroed list element and use that as the destination instead.
Andreas Rheinhardt71c90882019-05-16 22:30:181244 if (data) {
Andreas Rheinhardt68541272019-05-16 22:30:191245 data = (char *) data + syntax->data_offset;
1246 if (syntax->list_elem_size) {
1247 EbmlList *list = data;
James Almer3b3150c2019-09-03 21:45:041248 void *newelem;
1249
1250 if ((unsigned)list->nb_elem + 1 >= UINT_MAX / syntax->list_elem_size)
1251 return AVERROR(ENOMEM);
1252 newelem = av_fast_realloc(list->elem,
1253 &list->alloc_elem_size,
1254 (list->nb_elem + 1) * syntax->list_elem_size);
Andreas Rheinhardt68541272019-05-16 22:30:191255 if (!newelem)
1256 return AVERROR(ENOMEM);
1257 list->elem = newelem;
1258 data = (char *) list->elem + list->nb_elem * syntax->list_elem_size;
1259 memset(data, 0, syntax->list_elem_size);
1260 list->nb_elem++;
1261 }
Andreas Rheinhardt71c90882019-05-16 22:30:181262 }
Aurelien Jacobs737c40d2008-08-05 00:42:391263
    // For EBML_STOP entries nothing more is read and current_id stays set,
    // so the pending ID is picked up again by the next call.
Andreas Rheinhardtbc3306f2019-05-16 22:30:001264 if (syntax->type != EBML_STOP) {
Aurelien Jacobsc3ade622010-06-11 16:34:011265 matroska->current_id = 0;
Reimar Döffinger1b4d3272010-09-06 17:51:441266 if ((res = ebml_read_length(matroska, pb, &length)) < 0)
Aurelien Jacobs737c40d2008-08-05 00:42:391267 return res;
Andreas Rheinhardt7087fc92019-05-16 22:30:121268
1269 pos_alt += res;
1270
    // Check the element against the level containing it and determine
    // whether that level ends together with this element.
Steve Lhomme93261172019-02-13 12:20:451271 if (matroska->num_levels > 0) {
Andreas Rheinhardt via ffmpeg-devel18a851a2019-03-27 11:18:441272 if (length != EBML_UNKNOWN_LENGTH &&
1273 level->length != EBML_UNKNOWN_LENGTH) {
Andreas Rheinhardt7087fc92019-05-16 22:30:121274 uint64_t elem_end = pos_alt + length,
Andreas Rheinhardt via ffmpeg-devel18a851a2019-03-27 11:18:441275 level_end = level->start + level->length;
1276
Andreas Rheinhardtb31c9b72019-06-23 23:46:541277 if (elem_end < level_end) {
1278 level_check = 0;
1279 } else if (elem_end == level_end) {
1280 level_check = LEVEL_ENDED;
1281 } else {
Andreas Rheinhardt via ffmpeg-devel18a851a2019-03-27 11:18:441282 av_log(matroska->ctx, AV_LOG_ERROR,
1283 "Element at 0x%"PRIx64" ending at 0x%"PRIx64" exceeds "
1284 "containing master element ending at 0x%"PRIx64"\n",
1285 pos, elem_end, level_end);
1286 return AVERROR_INVALIDDATA;
1287 }
Andreas Rheinhardtb31c9b72019-06-23 23:46:541288 } else if (length != EBML_UNKNOWN_LENGTH) {
1289 level_check = 0;
Andreas Rheinhardt via ffmpeg-devel18a851a2019-03-27 11:18:441290 } else if (level->length != EBML_UNKNOWN_LENGTH) {
1291 av_log(matroska->ctx, AV_LOG_ERROR, "Unknown-sized element "
1292 "at 0x%"PRIx64" inside parent with finite size\n", pos);
1293 return AVERROR_INVALIDDATA;
Andreas Rheinhardt3c70b942019-05-16 22:30:161294 } else {
Andreas Rheinhardtb31c9b72019-06-23 23:46:541295 level_check = 0;
Andreas Rheinhardt3c70b942019-05-16 22:30:161296 if (id != MATROSKA_ID_CLUSTER && (syntax->type == EBML_LEVEL1
1297 || syntax->type == EBML_NEST)) {
1298 // According to the current specifications only clusters and
1299 // segments are allowed to be unknown-length. We also accept
1300 // other unknown-length master elements.
1301 av_log(matroska->ctx, AV_LOG_WARNING,
1302 "Found unknown-length element 0x%"PRIX32" other than "
1303 "a cluster at 0x%"PRIx64". Spec-incompliant, but "
1304 "parsing will nevertheless be attempted.\n", id, pos);
1305 update_pos = -1;
1306 }
1307 }
Andreas Rheinhardtb31c9b72019-06-23 23:46:541308 } else
1309 level_check = 0;
Andreas Rheinhardta3db9f62019-05-16 22:30:051310
Andreas Rheinhardt04b62bd2019-05-16 22:30:151311 if (max_lengths[syntax->type] && length > max_lengths[syntax->type]) {
1312 if (length != EBML_UNKNOWN_LENGTH) {
1313 av_log(matroska->ctx, AV_LOG_ERROR,
1314 "Invalid length 0x%"PRIx64" > 0x%"PRIx64" for element "
1315 "with ID 0x%"PRIX32" at 0x%"PRIx64"\n",
1316 length, max_lengths[syntax->type], id, pos);
1317 } else if (syntax->type != EBML_NONE) {
1318 av_log(matroska->ctx, AV_LOG_ERROR,
1319 "Element with ID 0x%"PRIX32" at pos. 0x%"PRIx64" has "
1320 "unknown length, yet the length of an element of its "
1321 "type must be known.\n", id, pos);
1322 } else {
1323 av_log(matroska->ctx, AV_LOG_ERROR,
1324 "Found unknown-length element with ID 0x%"PRIX32" at "
1325 "pos. 0x%"PRIx64" for which no syntax for parsing is "
1326 "available.\n", id, pos);
1327 }
1328 return AVERROR_INVALIDDATA;
1329 }
1330
Andreas Rheinhardt51203052019-05-16 22:30:141331 if (!(pb->seekable & AVIO_SEEKABLE_NORMAL)) {
1332 // Losing sync will likely manifest itself as encountering unknown
1333 // elements which are not reliably distinguishable from elements
1334 // belonging to future extensions of the format.
1335 // We use a heuristic to detect such situations: If the current
1336 // element is not expected at the current syntax level and there
1337 // were only a few unknown elements in a row, then the element is
1338 // skipped or considered defective based upon the length of the
1339 // current element (i.e. how much would be skipped); if there were
1340 // more than a few skipped elements in a row and skipping the current
1341 // element would lead us more than SKIP_THRESHOLD away from the last
Michael Niedermayerfccc37c2019-08-28 17:04:421342 // known good position, then it is inferred that an error occurred.
Andreas Rheinhardt51203052019-05-16 22:30:141343 // The dependency on the number of unknown elements in a row exists
1344 // because the distance to the last known good position is
1345 // automatically big if the last parsed element was big.
1346 // In both cases, each unknown element is considered equivalent to
1347 // UNKNOWN_EQUIV of skipped bytes for the check.
1348 // The whole check is only done for non-seekable input, because
1349 // in this situation skipped data can't simply be rechecked later.
1350 // This is especially important when using unknown length elements
1351 // as the check for whether a child exceeds its containing master
1352 // element is not effective in this situation.
1353 if (update_pos) {
1354 matroska->unknown_count = 0;
1355 } else {
1356 int64_t dist = length + UNKNOWN_EQUIV * matroska->unknown_count++;
1357
1358 if (matroska->unknown_count > 3)
1359 dist += pos_alt - matroska->resync_pos;
1360
1361 if (dist > SKIP_THRESHOLD) {
1362 av_log(matroska->ctx, AV_LOG_ERROR,
1363 "Unknown element %"PRIX32" at pos. 0x%"PRIx64" with "
1364 "length 0x%"PRIx64" considered as invalid data. Last "
1365 "known good position 0x%"PRIx64", %d unknown elements"
1366 " in a row\n", id, pos, length, matroska->resync_pos,
1367 matroska->unknown_count);
1368 return AVERROR_INVALIDDATA;
1369 }
1370 }
1371 }
1372
Andreas Rheinhardt3c70b942019-05-16 22:30:161373 if (update_pos > 0) {
Andreas Rheinhardta3db9f62019-05-16 22:30:051374 // We have found an element that is allowed at this place
1375 // in the hierarchy and it passed all checks, so treat the beginning
1376 // of the element as the "last known good" position.
1377 matroska->resync_pos = pos;
1378 }
Andreas Rheinhardt71c90882019-05-16 22:30:181379
    // Without a destination the payload is skipped, unless its length is
    // unknown, in which case the element is handled by the switch below.
1380 if (!data && length != EBML_UNKNOWN_LENGTH)
1381 goto skip;
Aurelien Jacobsc3ade622010-06-11 16:34:011382 }
Aurelien Jacobs737c40d2008-08-05 00:42:391383
1384 switch (syntax->type) {
Keiji Costantini84cfce92014-03-01 16:28:151385 case EBML_UINT:
1386 res = ebml_read_uint(pb, length, data);
1387 break;
Michael Niedermayerb3d9ab12014-03-07 22:46:371388 case EBML_SINT:
1389 res = ebml_read_sint(pb, length, data);
1390 break;
Keiji Costantini84cfce92014-03-01 16:28:151391 case EBML_FLOAT:
1392 res = ebml_read_float(pb, length, data);
1393 break;
Aurelien Jacobs737c40d2008-08-05 00:42:391394 case EBML_STR:
Keiji Costantini84cfce92014-03-01 16:28:151395 case EBML_UTF8:
1396 res = ebml_read_ascii(pb, length, data);
1397 break;
1398 case EBML_BIN:
Andreas Rheinhardt7087fc92019-05-16 22:30:121399 res = ebml_read_binary(pb, length, pos_alt, data);
Keiji Costantini84cfce92014-03-01 16:28:151400 break;
wm4cac22952015-02-09 19:39:001401 case EBML_LEVEL1:
Keiji Costantini84cfce92014-03-01 16:28:151402 case EBML_NEST:
Andreas Rheinhardt7087fc92019-05-16 22:30:121403 if ((res = ebml_read_master(matroska, length, pos_alt)) < 0)
Keiji Costantini84cfce92014-03-01 16:28:151404 return res;
1405 if (id == MATROSKA_ID_SEGMENT)
Andreas Rheinhardt7087fc92019-05-16 22:30:121406 matroska->segment_start = pos_alt;
wm4cac22952015-02-09 19:39:001407 if (id == MATROSKA_ID_CUES)
1408 matroska->cues_parsing_deferred = 0;
1409 if (syntax->type == EBML_LEVEL1 &&
1410 (level1_elem = matroska_find_level1_elem(matroska, syntax->id))) {
Andreas Rheinhardt806ac7d2019-05-16 22:30:211411 if (!level1_elem->pos) {
1412 // Zero is not a valid position for a level 1 element.
1413 level1_elem->pos = pos;
1414 } else if (level1_elem->pos != pos)
wm4cac22952015-02-09 19:39:001415 av_log(matroska->ctx, AV_LOG_ERROR, "Duplicate element\n");
1416 level1_elem->parsed = 1;
1417 }
Andreas Rheinhardtb31c9b72019-06-23 23:46:541418 if (res = ebml_parse_nest(matroska, syntax->def.n, data))
1419 return res;
1420 break;
Keiji Costantini84cfce92014-03-01 16:28:151421 case EBML_STOP:
1422 return 1;
    // Reached through the goto above as well as for every type that has no
    // case of its own: the payload is skipped.
Andreas Rheinhardt71c90882019-05-16 22:30:181423 skip:
Michael Niedermayer668c8732012-08-04 00:27:511424 default:
Andreas Rheinhardtff5ea592019-06-23 23:42:311425 if (length) {
Andreas Rheinhardteb33be12019-07-06 16:59:221426 int64_t res2;
Andreas Rheinhardtff5ea592019-06-23 23:42:311427 if (ffio_limit(pb, length) != length) {
1428 // ffio_limit emits its own error message,
1429 // so we don't have to.
1430 return AVERROR(EIO);
1431 }
Andreas Rheinhardteb33be12019-07-06 16:59:221432 if ((res2 = avio_skip(pb, length - 1)) >= 0) {
Andreas Rheinhardtff5ea592019-06-23 23:42:311433 // avio_skip might take us past EOF. We check for this
1434 // by skipping only length - 1 bytes, reading a byte and
1435 // checking the error flags. This is done in order to check
1436 // that the element has been properly skipped even when
1437 // no filesize (that ffio_limit relies on) is available.
1438 avio_r8(pb);
1439 res = NEEDS_CHECKING;
Andreas Rheinhardteb33be12019-07-06 16:59:221440 } else
1441 res = res2;
Andreas Rheinhardtff5ea592019-06-23 23:42:311442 } else
1443 res = 0;
Aurelien Jacobs737c40d2008-08-05 00:42:391444 }
Andreas Rheinhardta569a7b2019-06-23 23:42:301445 if (res) {
1446 if (res == NEEDS_CHECKING) {
1447 if (pb->eof_reached) {
1448 if (pb->error)
1449 res = pb->error;
1450 else
1451 res = AVERROR_EOF;
1452 } else
Andreas Rheinhardtb31c9b72019-06-23 23:46:541453 goto level_check;
Andreas Rheinhardta569a7b2019-06-23 23:42:301454 }
1455
1456 if (res == AVERROR_INVALIDDATA)
1457 av_log(matroska->ctx, AV_LOG_ERROR, "Invalid element\n");
1458 else if (res == AVERROR(EIO))
1459 av_log(matroska->ctx, AV_LOG_ERROR, "Read error\n");
1460 else if (res == AVERROR_EOF) {
1461 av_log(matroska->ctx, AV_LOG_ERROR, "File ended prematurely\n");
1462 res = AVERROR(EIO);
1463 }
Andreas Rheinhardtb31c9b72019-06-23 23:46:541464
1465 return res;
Andreas Rheinhardta569a7b2019-06-23 23:42:301466 }
Andreas Rheinhardtb31c9b72019-06-23 23:46:541467
    // If this element closed its parent, also pop every enclosing level
    // that ends exactly at the current position.
1468level_check:
1469 if (level_check == LEVEL_ENDED && matroska->num_levels) {
1470 level = &matroska->levels[matroska->num_levels - 1];
1471 pos = avio_tell(pb);
1472
1473 // Given that pos >= level->start no check for
1474 // level->length != EBML_UNKNOWN_LENGTH is necessary.
1475 while (matroska->num_levels && pos == level->start + level->length) {
1476 matroska->num_levels--;
1477 level--;
1478 }
1479 }
1480
1481 return level_check;
Aurelien Jacobs737c40d2008-08-05 00:42:391482}
1483
Aurelien Jacobs789ed102008-08-05 00:40:001484static void ebml_free(EbmlSyntax *syntax, void *data)
1485{
1486 int i, j;
Keiji Costantini84cfce92014-03-01 16:28:151487 for (i = 0; syntax[i].id; i++) {
1488 void *data_off = (char *) data + syntax[i].data_offset;
Aurelien Jacobs789ed102008-08-05 00:40:001489 switch (syntax[i].type) {
1490 case EBML_STR:
Keiji Costantini84cfce92014-03-01 16:28:151491 case EBML_UTF8:
1492 av_freep(data_off);
1493 break;
1494 case EBML_BIN:
James Almera6188662018-04-04 17:12:541495 av_buffer_unref(&((EbmlBin *) data_off)->buf);
Keiji Costantini84cfce92014-03-01 16:28:151496 break;
wm4cac22952015-02-09 19:39:001497 case EBML_LEVEL1:
Aurelien Jacobs789ed102008-08-05 00:40:001498 case EBML_NEST:
1499 if (syntax[i].list_elem_size) {
1500 EbmlList *list = data_off;
1501 char *ptr = list->elem;
Keiji Costantini84cfce92014-03-01 16:28:151502 for (j = 0; j < list->nb_elem;
1503 j++, ptr += syntax[i].list_elem_size)
Aurelien Jacobs789ed102008-08-05 00:40:001504 ebml_free(syntax[i].def.n, ptr);
Michael Niedermayer6e70e4a2015-01-06 11:48:381505 av_freep(&list->elem);
Michael Schenk18b94662016-11-25 08:36:201506 list->nb_elem = 0;
James Almer3b3150c2019-09-03 21:45:041507 list->alloc_elem_size = 0;
Aurelien Jacobs789ed102008-08-05 00:40:001508 } else
1509 ebml_free(syntax[i].def.n, data_off);
Keiji Costantini84cfce92014-03-01 16:28:151510 default:
1511 break;
Aurelien Jacobs789ed102008-08-05 00:40:001512 }
1513 }
1514}
1515
Aurelien Jacobs737c40d2008-08-05 00:42:391516/*
1517 * Autodetecting...
1518 */
Carl Eugen Hoyos4d8875e2019-03-21 00:18:371519static int matroska_probe(const AVProbeData *p)
Aurelien Jacobs737c40d2008-08-05 00:42:391520{
1521 uint64_t total = 0;
James Zern470491f2010-05-22 01:41:321522 int len_mask = 0x80, size = 1, n = 1, i;
Aurelien Jacobs737c40d2008-08-05 00:42:391523
Diego Biurrun5968d2d2008-08-05 08:28:571524 /* EBML header? */
Aurelien Jacobs737c40d2008-08-05 00:42:391525 if (AV_RB32(p->buf) != EBML_ID_HEADER)
1526 return 0;
1527
1528 /* length of header */
1529 total = p->buf[4];
1530 while (size <= 8 && !(total & len_mask)) {
1531 size++;
1532 len_mask >>= 1;
1533 }
1534 if (size > 8)
Keiji Costantini84cfce92014-03-01 16:28:151535 return 0;
Aurelien Jacobs737c40d2008-08-05 00:42:391536 total &= (len_mask - 1);
1537 while (n < size)
1538 total = (total << 8) | p->buf[4 + n++];
1539
Andreas Rheinhardt9c6d14a2019-05-16 22:30:171540 if (total + 1 == 1ULL << (7 * size)){
1541 /* Unknown-length header - simply parse the whole buffer. */
1542 total = p->buf_size - 4 - size;
1543 } else {
1544 /* Does the probe data contain the whole header? */
1545 if (p->buf_size < 4 + size + total)
1546 return 0;
1547 }
Aurelien Jacobs737c40d2008-08-05 00:42:391548
James Zern470491f2010-05-22 01:41:321549 /* The header should contain a known document type. For now,
Aurelien Jacobs737c40d2008-08-05 00:42:391550 * we don't parse the whole header but simply check for the
1551 * availability of that array of characters inside the header.
1552 * Not fully fool-proof, but good enough. */
James Zern470491f2010-05-22 01:41:321553 for (i = 0; i < FF_ARRAY_ELEMS(matroska_doctypes); i++) {
Michael Niedermayer17b26302015-05-11 01:51:171554 size_t probelen = strlen(matroska_doctypes[i]);
Chris Evans69619a12011-07-20 00:51:481555 if (total < probelen)
1556 continue;
Keiji Costantini84cfce92014-03-01 16:28:151557 for (n = 4 + size; n <= 4 + size + total - probelen; n++)
1558 if (!memcmp(p->buf + n, matroska_doctypes[i], probelen))
James Zern470491f2010-05-22 01:41:321559 return AVPROBE_SCORE_MAX;
1560 }
Aurelien Jacobs737c40d2008-08-05 00:42:391561
David Conradc7b913c2010-05-22 01:41:351562 // probably valid EBML header but no recognized doctype
Diego Biurrune0f8be62013-03-25 15:12:511563 return AVPROBE_SCORE_EXTENSION;
Aurelien Jacobs737c40d2008-08-05 00:42:391564}
1565
1566static MatroskaTrack *matroska_find_track_by_num(MatroskaDemuxContext *matroska,
Andreas Rheinhardtba36a072019-12-26 03:17:241567 uint64_t num)
Aurelien Jacobs737c40d2008-08-05 00:42:391568{
1569 MatroskaTrack *tracks = matroska->tracks.elem;
1570 int i;
1571
Keiji Costantini84cfce92014-03-01 16:28:151572 for (i = 0; i < matroska->tracks.nb_elem; i++)
Aurelien Jacobs737c40d2008-08-05 00:42:391573 if (tracks[i].num == num)
1574 return &tracks[i];
1575
Andreas Rheinhardtba36a072019-12-26 03:17:241576 av_log(matroska->ctx, AV_LOG_ERROR, "Invalid track number %"PRIu64"\n", num);
Aurelien Jacobs737c40d2008-08-05 00:42:391577 return NULL;
1578}
1579
Keiji Costantini84cfce92014-03-01 16:28:151580static int matroska_decode_buffer(uint8_t **buf, int *buf_size,
Aurelien Jacobsf7b96872008-08-05 00:42:051581 MatroskaTrack *track)
Evgeniy Stepanov935ec5a2008-06-22 15:49:441582{
Aurelien Jacobs2cbc8812008-08-05 00:40:311583 MatroskaTrackEncoding *encodings = track->encodings.elem;
Keiji Costantini84cfce92014-03-01 16:28:151584 uint8_t *data = *buf;
Evgeniy Stepanov935ec5a2008-06-22 15:49:441585 int isize = *buf_size;
Keiji Costantini84cfce92014-03-01 16:28:151586 uint8_t *pkt_data = NULL;
Diego Biurrun529506b2012-02-12 09:58:461587 uint8_t av_unused *newpktdata;
Evgeniy Stepanov935ec5a2008-06-22 15:49:441588 int pkt_size = isize;
1589 int result = 0;
1590 int olen;
1591
Michael Niedermayer4b7c5232012-06-14 23:29:301592 if (pkt_size >= 10000000U)
Luca Barbatoc9a39ce2012-09-14 18:03:371593 return AVERROR_INVALIDDATA;
Aurelien Jacobs4f906882010-08-17 14:05:231594
Aurelien Jacobs2cbc8812008-08-05 00:40:311595 switch (encodings[0].compression.algo) {
Keiji Costantini84cfce92014-03-01 16:28:151596 case MATROSKA_TRACK_ENCODING_COMP_HEADERSTRIP:
1597 {
Luca Barbato8d4dd552012-09-14 16:51:491598 int header_size = encodings[0].compression.settings.size;
1599 uint8_t *header = encodings[0].compression.settings.data;
1600
Michael Niedermayer1df2e3c2012-09-20 11:30:441601 if (header_size && !header) {
Michael Niedermayer0efcf162012-11-23 17:10:021602 av_log(NULL, AV_LOG_ERROR, "Compression size but no data in headerstrip\n");
Michael Niedermayer26776972012-04-17 15:12:221603 return -1;
1604 }
Michael Niedermayer1df2e3c2012-09-20 11:30:441605
Luca Barbato8d4dd552012-09-14 16:51:491606 if (!header_size)
1607 return 0;
1608
1609 pkt_size = isize + header_size;
James Almer9703b7d2018-04-04 21:12:531610 pkt_data = av_malloc(pkt_size + AV_INPUT_BUFFER_PADDING_SIZE);
Luca Barbato8d4dd552012-09-14 16:51:491611 if (!pkt_data)
1612 return AVERROR(ENOMEM);
1613
1614 memcpy(pkt_data, header, header_size);
1615 memcpy(pkt_data + header_size, data, isize);
1616 break;
1617 }
Diego Biurrun2a91ada2012-10-18 17:48:271618#if CONFIG_LZO
Evgeniy Stepanov935ec5a2008-06-22 15:49:441619 case MATROSKA_TRACK_ENCODING_COMP_LZO:
1620 do {
Andreas Rheinhardt2ff687c2019-12-28 02:40:331621 int insize = isize;
Keiji Costantini84cfce92014-03-01 16:28:151622 olen = pkt_size *= 3;
James Almer9703b7d2018-04-04 21:12:531623 newpktdata = av_realloc(pkt_data, pkt_size + AV_LZO_OUTPUT_PADDING
1624 + AV_INPUT_BUFFER_PADDING_SIZE);
Luca Barbato581281e2012-09-14 16:39:581625 if (!newpktdata) {
Luca Barbatoc9a39ce2012-09-14 18:03:371626 result = AVERROR(ENOMEM);
Luca Barbato581281e2012-09-14 16:39:581627 goto failed;
1628 }
1629 pkt_data = newpktdata;
Andreas Rheinhardt2ff687c2019-12-28 02:40:331630 result = av_lzo1x_decode(pkt_data, &olen, data, &insize);
Keiji Costantini84cfce92014-03-01 16:28:151631 } while (result == AV_LZO_OUTPUT_FULL && pkt_size < 10000000);
Luca Barbatoc9a39ce2012-09-14 18:03:371632 if (result) {
1633 result = AVERROR_INVALIDDATA;
Evgeniy Stepanov935ec5a2008-06-22 15:49:441634 goto failed;
Luca Barbatoc9a39ce2012-09-14 18:03:371635 }
Evgeniy Stepanov935ec5a2008-06-22 15:49:441636 pkt_size -= olen;
1637 break;
Diego Biurrun2a91ada2012-10-18 17:48:271638#endif
Aurelien Jacobsb250f9c2009-01-13 23:44:161639#if CONFIG_ZLIB
Keiji Costantini84cfce92014-03-01 16:28:151640 case MATROSKA_TRACK_ENCODING_COMP_ZLIB:
1641 {
1642 z_stream zstream = { 0 };
Evgeniy Stepanov935ec5a2008-06-22 15:49:441643 if (inflateInit(&zstream) != Z_OK)
1644 return -1;
Keiji Costantini84cfce92014-03-01 16:28:151645 zstream.next_in = data;
Evgeniy Stepanov935ec5a2008-06-22 15:49:441646 zstream.avail_in = isize;
1647 do {
Keiji Costantini84cfce92014-03-01 16:28:151648 pkt_size *= 3;
James Almer9703b7d2018-04-04 21:12:531649 newpktdata = av_realloc(pkt_data, pkt_size + AV_INPUT_BUFFER_PADDING_SIZE);
Michael Niedermayer77d2ef12011-07-28 12:59:541650 if (!newpktdata) {
1651 inflateEnd(&zstream);
Michael Niedermayer171af592015-05-12 16:32:121652 result = AVERROR(ENOMEM);
Michael Niedermayer77d2ef12011-07-28 12:59:541653 goto failed;
1654 }
Keiji Costantini84cfce92014-03-01 16:28:151655 pkt_data = newpktdata;
Evgeniy Stepanov935ec5a2008-06-22 15:49:441656 zstream.avail_out = pkt_size - zstream.total_out;
Keiji Costantini84cfce92014-03-01 16:28:151657 zstream.next_out = pkt_data + zstream.total_out;
Michael Niedermayer171af592015-05-12 16:32:121658 result = inflate(&zstream, Z_NO_FLUSH);
Keiji Costantini84cfce92014-03-01 16:28:151659 } while (result == Z_OK && pkt_size < 10000000);
Evgeniy Stepanov935ec5a2008-06-22 15:49:441660 pkt_size = zstream.total_out;
1661 inflateEnd(&zstream);
Luca Barbatoc9a39ce2012-09-14 18:03:371662 if (result != Z_STREAM_END) {
1663 if (result == Z_MEM_ERROR)
1664 result = AVERROR(ENOMEM);
1665 else
1666 result = AVERROR_INVALIDDATA;
Evgeniy Stepanov935ec5a2008-06-22 15:49:441667 goto failed;
Luca Barbatoc9a39ce2012-09-14 18:03:371668 }
Evgeniy Stepanov935ec5a2008-06-22 15:49:441669 break;
1670 }
1671#endif
Aurelien Jacobsb250f9c2009-01-13 23:44:161672#if CONFIG_BZLIB
Keiji Costantini84cfce92014-03-01 16:28:151673 case MATROSKA_TRACK_ENCODING_COMP_BZLIB:
1674 {
1675 bz_stream bzstream = { 0 };
Evgeniy Stepanov935ec5a2008-06-22 15:49:441676 if (BZ2_bzDecompressInit(&bzstream, 0, 0) != BZ_OK)
1677 return -1;
Keiji Costantini84cfce92014-03-01 16:28:151678 bzstream.next_in = data;
Evgeniy Stepanov935ec5a2008-06-22 15:49:441679 bzstream.avail_in = isize;
1680 do {
Keiji Costantini84cfce92014-03-01 16:28:151681 pkt_size *= 3;
James Almer9703b7d2018-04-04 21:12:531682 newpktdata = av_realloc(pkt_data, pkt_size + AV_INPUT_BUFFER_PADDING_SIZE);
Michael Niedermayer77d2ef12011-07-28 12:59:541683 if (!newpktdata) {
1684 BZ2_bzDecompressEnd(&bzstream);
Michael Niedermayer171af592015-05-12 16:32:121685 result = AVERROR(ENOMEM);
Michael Niedermayer77d2ef12011-07-28 12:59:541686 goto failed;
1687 }
Keiji Costantini84cfce92014-03-01 16:28:151688 pkt_data = newpktdata;
Evgeniy Stepanov935ec5a2008-06-22 15:49:441689 bzstream.avail_out = pkt_size - bzstream.total_out_lo32;
Keiji Costantini84cfce92014-03-01 16:28:151690 bzstream.next_out = pkt_data + bzstream.total_out_lo32;
Michael Niedermayer171af592015-05-12 16:32:121691 result = BZ2_bzDecompress(&bzstream);
Keiji Costantini84cfce92014-03-01 16:28:151692 } while (result == BZ_OK && pkt_size < 10000000);
Evgeniy Stepanov935ec5a2008-06-22 15:49:441693 pkt_size = bzstream.total_out_lo32;
1694 BZ2_bzDecompressEnd(&bzstream);
Luca Barbatoc9a39ce2012-09-14 18:03:371695 if (result != BZ_STREAM_END) {
1696 if (result == BZ_MEM_ERROR)
1697 result = AVERROR(ENOMEM);
1698 else
1699 result = AVERROR_INVALIDDATA;
Evgeniy Stepanov935ec5a2008-06-22 15:49:441700 goto failed;
Luca Barbatoc9a39ce2012-09-14 18:03:371701 }
Evgeniy Stepanov935ec5a2008-06-22 15:49:441702 break;
1703 }
1704#endif
Aurelien Jacobs28f27e02008-08-20 23:08:071705 default:
Luca Barbatoc9a39ce2012-09-14 18:03:371706 return AVERROR_INVALIDDATA;
Evgeniy Stepanov935ec5a2008-06-22 15:49:441707 }
1708
James Almer9703b7d2018-04-04 21:12:531709 memset(pkt_data + pkt_size, 0, AV_INPUT_BUFFER_PADDING_SIZE);
1710
Keiji Costantini84cfce92014-03-01 16:28:151711 *buf = pkt_data;
Evgeniy Stepanov935ec5a2008-06-22 15:49:441712 *buf_size = pkt_size;
1713 return 0;
Keiji Costantini84cfce92014-03-01 16:28:151714
1715failed:
Evgeniy Stepanov935ec5a2008-06-22 15:49:441716 av_free(pkt_data);
Luca Barbatoc9a39ce2012-09-14 18:03:371717 return result;
Evgeniy Stepanov935ec5a2008-06-22 15:49:441718}
1719
Aurelien Jacobs929e9de2009-02-15 15:53:551720static void matroska_convert_tag(AVFormatContext *s, EbmlList *list,
Anton Khirnovd2d67e42011-05-22 10:46:291721 AVDictionary **metadata, char *prefix)
Aurelien Jacobs44015c52008-08-08 23:50:381722{
1723 MatroskaTag *tags = list->elem;
Aurelien Jacobs929e9de2009-02-15 15:53:551724 char key[1024];
1725 int i;
Aurelien Jacobs44015c52008-08-08 23:50:381726
Keiji Costantini84cfce92014-03-01 16:28:151727 for (i = 0; i < list->nb_elem; i++) {
1728 const char *lang = tags[i].lang &&
1729 strcmp(tags[i].lang, "und") ? tags[i].lang : NULL;
Anton Khirnovbf800c72010-11-03 06:29:041730
1731 if (!tags[i].name) {
1732 av_log(s, AV_LOG_WARNING, "Skipping invalid tag with no TagName.\n");
1733 continue;
1734 }
Keiji Costantini84cfce92014-03-01 16:28:151735 if (prefix)
1736 snprintf(key, sizeof(key), "%s/%s", prefix, tags[i].name);
1737 else
1738 av_strlcpy(key, tags[i].name, sizeof(key));
Aurelien Jacobsf702df32009-02-15 16:05:371739 if (tags[i].def || !lang) {
Keiji Costantini84cfce92014-03-01 16:28:151740 av_dict_set(metadata, key, tags[i].string, 0);
1741 if (tags[i].sub.nb_elem)
1742 matroska_convert_tag(s, &tags[i].sub, metadata, key);
Aurelien Jacobsf702df32009-02-15 16:05:371743 }
1744 if (lang) {
1745 av_strlcat(key, "-", sizeof(key));
1746 av_strlcat(key, lang, sizeof(key));
Anton Khirnovd2d67e42011-05-22 10:46:291747 av_dict_set(metadata, key, tags[i].string, 0);
Aurelien Jacobsf702df32009-02-15 16:05:371748 if (tags[i].sub.nb_elem)
1749 matroska_convert_tag(s, &tags[i].sub, metadata, key);
1750 }
Aurelien Jacobs929e9de2009-02-15 15:53:551751 }
Anton Khirnovad7768f2010-10-16 13:20:411752 ff_metadata_conv(metadata, NULL, ff_mkv_metadata_conv);
Aurelien Jacobs929e9de2009-02-15 15:53:551753}
1754
1755static void matroska_convert_tags(AVFormatContext *s)
1756{
1757 MatroskaDemuxContext *matroska = s->priv_data;
1758 MatroskaTags *tags = matroska->tags.elem;
1759 int i, j;
1760
Keiji Costantini84cfce92014-03-01 16:28:151761 for (i = 0; i < matroska->tags.nb_elem; i++) {
Aurelien Jacobs929e9de2009-02-15 15:53:551762 if (tags[i].target.attachuid) {
Diego Biurrunf69befe2014-03-07 12:54:181763 MatroskaAttachment *attachment = matroska->attachments.elem;
Luca Barbatoa0fa6d02015-10-31 18:45:271764 int found = 0;
1765 for (j = 0; j < matroska->attachments.nb_elem; j++) {
Keiji Costantini84cfce92014-03-01 16:28:151766 if (attachment[j].uid == tags[i].target.attachuid &&
Luca Barbatoa0fa6d02015-10-31 18:45:271767 attachment[j].stream) {
Aurelien Jacobs929e9de2009-02-15 15:53:551768 matroska_convert_tag(s, &tags[i].tag,
1769 &attachment[j].stream->metadata, NULL);
Luca Barbatoa0fa6d02015-10-31 18:45:271770 found = 1;
1771 }
1772 }
1773 if (!found) {
1774 av_log(NULL, AV_LOG_WARNING,
1775 "The tags at index %d refer to a "
1776 "non-existent attachment %"PRId64".\n",
1777 i, tags[i].target.attachuid);
1778 }
Aurelien Jacobs929e9de2009-02-15 15:53:551779 } else if (tags[i].target.chapteruid) {
1780 MatroskaChapter *chapter = matroska->chapters.elem;
Luca Barbatoa0fa6d02015-10-31 18:45:271781 int found = 0;
1782 for (j = 0; j < matroska->chapters.nb_elem; j++) {
Keiji Costantini84cfce92014-03-01 16:28:151783 if (chapter[j].uid == tags[i].target.chapteruid &&
Luca Barbatoa0fa6d02015-10-31 18:45:271784 chapter[j].chapter) {
Aurelien Jacobs929e9de2009-02-15 15:53:551785 matroska_convert_tag(s, &tags[i].tag,
1786 &chapter[j].chapter->metadata, NULL);
Luca Barbatoa0fa6d02015-10-31 18:45:271787 found = 1;
1788 }
1789 }
1790 if (!found) {
1791 av_log(NULL, AV_LOG_WARNING,
1792 "The tags at index %d refer to a non-existent chapter "
1793 "%"PRId64".\n",
1794 i, tags[i].target.chapteruid);
1795 }
Aurelien Jacobs929e9de2009-02-15 15:53:551796 } else if (tags[i].target.trackuid) {
1797 MatroskaTrack *track = matroska->tracks.elem;
Luca Barbatoa0fa6d02015-10-31 18:45:271798 int found = 0;
1799 for (j = 0; j < matroska->tracks.nb_elem; j++) {
1800 if (track[j].uid == tags[i].target.trackuid &&
1801 track[j].stream) {
Aurelien Jacobs929e9de2009-02-15 15:53:551802 matroska_convert_tag(s, &tags[i].tag,
1803 &track[j].stream->metadata, NULL);
Luca Barbatoa0fa6d02015-10-31 18:45:271804 found = 1;
1805 }
1806 }
1807 if (!found) {
1808 av_log(NULL, AV_LOG_WARNING,
1809 "The tags at index %d refer to a non-existent track "
1810 "%"PRId64".\n",
1811 i, tags[i].target.trackuid);
1812 }
Aurelien Jacobs929e9de2009-02-15 15:53:551813 } else {
Aurelien Jacobs4f909c72009-06-13 22:29:381814 matroska_convert_tag(s, &tags[i].tag, &s->metadata,
1815 tags[i].target.type);
Aurelien Jacobs929e9de2009-02-15 15:53:551816 }
Aurelien Jacobs44015c52008-08-08 23:50:381817 }
1818}
1819
Keiji Costantini84cfce92014-03-01 16:28:151820static int matroska_parse_seekhead_entry(MatroskaDemuxContext *matroska,
Andreas Rheinhardt730ac1a2019-05-16 22:30:201821 int64_t pos)
Aurelien Jacobs13b350a2008-08-05 00:40:361822{
Andreas Rheinhardt60f75c92019-05-16 22:30:131823 uint32_t saved_id = matroska->current_id;
Anton Khirnov384c9c22011-03-03 19:11:451824 int64_t before_pos = avio_tell(matroska->ctx->pb);
Aaron Colwell31ad14c2011-07-09 05:48:431825 int ret = 0;
David Conradb061d892007-06-04 22:10:541826
Anton Khirnovf47ac3c2011-07-09 06:11:301827 /* seek */
Andreas Rheinhardt730ac1a2019-05-16 22:30:201828 if (avio_seek(matroska->ctx->pb, pos, SEEK_SET) == pos) {
Diego Biurrun5968d2d2008-08-05 08:28:571829 /* We don't want to lose our seekhead level, so we add
Aurelien Jacobs43485712008-08-05 00:40:431830 * a dummy. This is a crude hack. */
1831 if (matroska->num_levels == EBML_MAX_DEPTH) {
1832 av_log(matroska->ctx, AV_LOG_INFO,
1833 "Max EBML element depth (%d) reached, "
1834 "cannot parse further.\n", EBML_MAX_DEPTH);
Aaron Colwell31ad14c2011-07-09 05:48:431835 ret = AVERROR_INVALIDDATA;
1836 } else {
Andreas Rheinhardt60f75c92019-05-16 22:30:131837 matroska->levels[matroska->num_levels] = (MatroskaLevel) { 0, EBML_UNKNOWN_LENGTH };
Anton Khirnovf47ac3c2011-07-09 06:11:301838 matroska->num_levels++;
Keiji Costantini84cfce92014-03-01 16:28:151839 matroska->current_id = 0;
David Conradb061d892007-06-04 22:10:541840
Dustin Brody4a9628f2011-09-08 22:43:321841 ret = ebml_parse(matroska, matroska_segment, matroska);
Andreas Rheinhardtb31c9b72019-06-23 23:46:541842 if (ret == LEVEL_ENDED) {
1843 /* This can only happen if the seek brought us beyond EOF. */
1844 ret = AVERROR_EOF;
1845 }
Aurelien Jacobs43485712008-08-05 00:40:431846 }
David Conradb061d892007-06-04 22:10:541847 }
Andreas Rheinhardta9f05152019-05-16 22:30:091848 /* Seek back - notice that in all instances where this is used
1849 * it is safe to set the level to 1. */
Andreas Rheinhardt8a286e72019-05-16 22:30:031850 matroska_reset_status(matroska, saved_id, before_pos);
Aaron Colwell31ad14c2011-07-09 05:48:431851
1852 return ret;
1853}
1854
1855static void matroska_execute_seekhead(MatroskaDemuxContext *matroska)
1856{
1857 EbmlList *seekhead_list = &matroska->seekhead;
David Conradb061d892007-06-04 22:10:541858 int i;
1859
1860 // we should not do any seeking in the streaming case
James Almer4de591e2017-03-21 20:02:301861 if (!(matroska->ctx->pb->seekable & AVIO_SEEKABLE_NORMAL))
David Conradb061d892007-06-04 22:10:541862 return;
1863
wm4cac22952015-02-09 19:39:001864 for (i = 0; i < seekhead_list->nb_elem; i++) {
1865 MatroskaSeekhead *seekheads = seekhead_list->elem;
Andreas Rheinhardt730ac1a2019-05-16 22:30:201866 uint32_t id = seekheads[i].id;
1867 int64_t pos = seekheads[i].pos + matroska->segment_start;
wm46551aca2014-12-06 15:53:301868
wm4cac22952015-02-09 19:39:001869 MatroskaLevel1Element *elem = matroska_find_level1_elem(matroska, id);
1870 if (!elem || elem->parsed)
David Conradb061d892007-06-04 22:10:541871 continue;
1872
wm4cac22952015-02-09 19:39:001873 elem->pos = pos;
1874
Aaron Colwell31ad14c2011-07-09 05:48:431875 // defer cues parsing until we actually need cue data.
wm4cac22952015-02-09 19:39:001876 if (id == MATROSKA_ID_CUES)
David Conradb061d892007-06-04 22:10:541877 continue;
David Conradb061d892007-06-04 22:10:541878
wm4cac22952015-02-09 19:39:001879 if (matroska_parse_seekhead_entry(matroska, pos) < 0) {
Reimar Döffinger47e015e2012-02-12 13:09:031880 // mark index as broken
1881 matroska->cues_parsing_deferred = -1;
Aaron Colwell31ad14c2011-07-09 05:48:431882 break;
Reimar Döffinger47e015e2012-02-12 13:09:031883 }
wm4cac22952015-02-09 19:39:001884
1885 elem->parsed = 1;
Michael Niedermayer72c98442014-12-07 21:45:341886 }
Aaron Colwell31ad14c2011-07-09 05:48:431887}
David Conradb061d892007-06-04 22:10:541888
Michael Niedermayerb3d9ab12014-03-07 22:46:371889static void matroska_add_index_entries(MatroskaDemuxContext *matroska)
Keiji Costantini84cfce92014-03-01 16:28:151890{
Aaron Colwell31ad14c2011-07-09 05:48:431891 EbmlList *index_list;
1892 MatroskaIndex *index;
Andreas Cadhalpuneb9fb502015-05-03 21:07:201893 uint64_t index_scale = 1;
Aaron Colwell31ad14c2011-07-09 05:48:431894 int i, j;
David Conradb061d892007-06-04 22:10:541895
wm478623252015-02-09 19:39:011896 if (matroska->ctx->flags & AVFMT_FLAG_IGNIDX)
1897 return;
1898
Aaron Colwell31ad14c2011-07-09 05:48:431899 index_list = &matroska->index;
Keiji Costantini84cfce92014-03-01 16:28:151900 index = index_list->elem;
Rodger Combs4f7d9b72015-10-08 20:34:591901 if (index_list->nb_elem < 2)
1902 return;
1903 if (index[1].time > 1E14 / matroska->time_scale) {
1904 av_log(matroska->ctx, AV_LOG_WARNING, "Dropping apparently-broken index.\n");
1905 return;
Aaron Colwell31ad14c2011-07-09 05:48:431906 }
1907 for (i = 0; i < index_list->nb_elem; i++) {
Keiji Costantini84cfce92014-03-01 16:28:151908 EbmlList *pos_list = &index[i].pos;
Aaron Colwell31ad14c2011-07-09 05:48:431909 MatroskaIndexPos *pos = pos_list->elem;
1910 for (j = 0; j < pos_list->nb_elem; j++) {
Keiji Costantini84cfce92014-03-01 16:28:151911 MatroskaTrack *track = matroska_find_track_by_num(matroska,
1912 pos[j].track);
Aaron Colwell31ad14c2011-07-09 05:48:431913 if (track && track->stream)
1914 av_add_index_entry(track->stream,
1915 pos[j].pos + matroska->segment_start,
Keiji Costantini84cfce92014-03-01 16:28:151916 index[i].time / index_scale, 0, 0,
Aaron Colwell31ad14c2011-07-09 05:48:431917 AVINDEX_KEYFRAME);
David Conradb061d892007-06-04 22:10:541918 }
1919 }
David Conradb061d892007-06-04 22:10:541920}
1921
Aaron Colwell6c4cc0f2011-09-22 14:51:001922static void matroska_parse_cues(MatroskaDemuxContext *matroska) {
Aaron Colwell6c4cc0f2011-09-22 14:51:001923 int i;
1924
wm478623252015-02-09 19:39:011925 if (matroska->ctx->flags & AVFMT_FLAG_IGNIDX)
1926 return;
1927
wm4cac22952015-02-09 19:39:001928 for (i = 0; i < matroska->num_level1_elems; i++) {
1929 MatroskaLevel1Element *elem = &matroska->level1_elems[i];
1930 if (elem->id == MATROSKA_ID_CUES && !elem->parsed) {
1931 if (matroska_parse_seekhead_entry(matroska, elem->pos) < 0)
1932 matroska->cues_parsing_deferred = -1;
1933 elem->parsed = 1;
Aaron Colwell6c4cc0f2011-09-22 14:51:001934 break;
wm4cac22952015-02-09 19:39:001935 }
1936 }
Aaron Colwell6c4cc0f2011-09-22 14:51:001937
Aaron Colwell6c4cc0f2011-09-22 14:51:001938 matroska_add_index_entries(matroska);
1939}
1940
/**
 * Map a codec ID string to an AAC profile number.
 *
 * The names "MAIN", "LC" and "SSR" are searched for, in that order, as
 * substrings of codec_id.
 *
 * @param codec_id NUL-terminated codec ID string (must not be NULL)
 * @return 1 for "MAIN", 2 for "LC", 3 for "SSR", 4 if none of them occurs
 */
static int matroska_aac_profile(char *codec_id)
{
    static const char *const known_profiles[] = { "MAIN", "LC", "SSR" };
    int idx = 0;

    while (idx < FF_ARRAY_ELEMS(known_profiles) &&
           !strstr(codec_id, known_profiles[idx]))
        idx++;

    /* The result is 1-based. */
    return idx + 1;
}
1951
Aurelien Jacobsf7b96872008-08-05 00:42:051952static int matroska_aac_sri(int samplerate)
David Conradb061d892007-06-04 22:10:541953{
David Conradb061d892007-06-04 22:10:541954 int sri;
1955
Keiji Costantini84cfce92014-03-01 16:28:151956 for (sri = 0; sri < FF_ARRAY_ELEMS(avpriv_mpeg4audio_sample_rates); sri++)
Anton Khirnov59a9a232011-10-17 07:28:531957 if (avpriv_mpeg4audio_sample_rates[sri] == samplerate)
David Conradb061d892007-06-04 22:10:541958 break;
1959 return sri;
1960}
1961
Aaron Colwell2e061132012-03-05 18:02:481962static void matroska_metadata_creation_time(AVDictionary **metadata, int64_t date_utc)
1963{
Aaron Colwell2e061132012-03-05 18:02:481964 /* Convert to seconds and adjust by number of seconds between 2001-01-01 and Epoch */
Marton Balint13b90ff2016-06-29 22:55:481965 avpriv_dict_set_timestamp(metadata, "creation_time", date_utc / 1000 + 978307200000000LL);
Aaron Colwell2e061132012-03-05 18:02:481966}
1967
Anton Khirnov4efdadc2014-05-25 12:05:511968static int matroska_parse_flac(AVFormatContext *s,
1969 MatroskaTrack *track,
1970 int *offset)
1971{
Anton Khirnov23f741f2014-05-26 10:48:561972 AVStream *st = track->stream;
Anton Khirnov4efdadc2014-05-25 12:05:511973 uint8_t *p = track->codec_priv.data;
1974 int size = track->codec_priv.size;
1975
1976 if (size < 8 + FLAC_STREAMINFO_SIZE || p[4] & 0x7f) {
1977 av_log(s, AV_LOG_WARNING, "Invalid FLAC private data\n");
1978 track->codec_priv.size = 0;
1979 return 0;
1980 }
1981 *offset = 8;
1982 track->codec_priv.size = 8 + FLAC_STREAMINFO_SIZE;
1983
Anton Khirnov23f741f2014-05-26 10:48:561984 p += track->codec_priv.size;
1985 size -= track->codec_priv.size;
1986
1987 /* parse the remaining metadata blocks if present */
1988 while (size >= 4) {
1989 int block_last, block_type, block_size;
1990
1991 flac_parse_block_header(p, &block_last, &block_type, &block_size);
1992
1993 p += 4;
1994 size -= 4;
1995 if (block_size > size)
1996 return 0;
1997
1998 /* check for the channel mask */
1999 if (block_type == FLAC_METADATA_TYPE_VORBIS_COMMENT) {
2000 AVDictionary *dict = NULL;
2001 AVDictionaryEntry *chmask;
2002
2003 ff_vorbis_comment(s, &dict, p, block_size, 0);
2004 chmask = av_dict_get(dict, "WAVEFORMATEXTENSIBLE_CHANNEL_MASK", NULL, 0);
2005 if (chmask) {
2006 uint64_t mask = strtol(chmask->value, NULL, 0);
2007 if (!mask || mask & ~0x3ffffULL) {
2008 av_log(s, AV_LOG_WARNING,
2009 "Invalid value of WAVEFORMATEXTENSIBLE_CHANNEL_MASK\n");
2010 } else
Anton Khirnov92005142014-06-18 18:42:522011 st->codecpar->channel_layout = mask;
Anton Khirnov23f741f2014-05-26 10:48:562012 }
2013 av_dict_free(&dict);
2014 }
2015
2016 p += block_size;
2017 size -= block_size;
2018 }
2019
Anton Khirnov4efdadc2014-05-25 12:05:512020 return 0;
2021}
2022
James Almer1273bc62016-10-13 17:22:072023static int mkv_field_order(MatroskaDemuxContext *matroska, int64_t field_order)
Luca Barbato5f022662016-03-28 18:29:542024{
James Almer1273bc62016-10-13 17:22:072025 int major, minor, micro, bttb = 0;
2026
2027 /* workaround a bug in our Matroska muxer, introduced in version 57.36 alongside
2028 * this function, and fixed in 57.52 */
Andreas Cadhalpuneb751f02016-10-16 19:47:002029 if (matroska->muxingapp && sscanf(matroska->muxingapp, "Lavf%d.%d.%d", &major, &minor, &micro) == 3)
James Almer1273bc62016-10-13 17:22:072030 bttb = (major == 57 && minor >= 36 && minor <= 51 && micro >= 100);
2031
Luca Barbato5f022662016-03-28 18:29:542032 switch (field_order) {
2033 case MATROSKA_VIDEO_FIELDORDER_PROGRESSIVE:
2034 return AV_FIELD_PROGRESSIVE;
2035 case MATROSKA_VIDEO_FIELDORDER_UNDETERMINED:
2036 return AV_FIELD_UNKNOWN;
2037 case MATROSKA_VIDEO_FIELDORDER_TT:
2038 return AV_FIELD_TT;
2039 case MATROSKA_VIDEO_FIELDORDER_BB:
2040 return AV_FIELD_BB;
2041 case MATROSKA_VIDEO_FIELDORDER_BT:
James Almer1273bc62016-10-13 17:22:072042 return bttb ? AV_FIELD_TB : AV_FIELD_BT;
Luca Barbato5f022662016-03-28 18:29:542043 case MATROSKA_VIDEO_FIELDORDER_TB:
James Almer1273bc62016-10-13 17:22:072044 return bttb ? AV_FIELD_BT : AV_FIELD_TB;
Luca Barbato5f022662016-03-28 18:29:542045 default:
2046 return AV_FIELD_UNKNOWN;
2047 }
2048}
2049
Aaron Colwellfebfb492015-12-02 23:13:182050static void mkv_stereo_mode_display_mul(int stereo_mode,
2051 int *h_width, int *h_height)
Aaron Colwellec83efd2015-11-23 20:06:142052{
2053 switch (stereo_mode) {
2054 case MATROSKA_VIDEO_STEREOMODE_TYPE_MONO:
2055 case MATROSKA_VIDEO_STEREOMODE_TYPE_CHECKERBOARD_RL:
2056 case MATROSKA_VIDEO_STEREOMODE_TYPE_CHECKERBOARD_LR:
2057 case MATROSKA_VIDEO_STEREOMODE_TYPE_BOTH_EYES_BLOCK_RL:
2058 case MATROSKA_VIDEO_STEREOMODE_TYPE_BOTH_EYES_BLOCK_LR:
2059 break;
2060 case MATROSKA_VIDEO_STEREOMODE_TYPE_RIGHT_LEFT:
2061 case MATROSKA_VIDEO_STEREOMODE_TYPE_LEFT_RIGHT:
2062 case MATROSKA_VIDEO_STEREOMODE_TYPE_COL_INTERLEAVED_RL:
2063 case MATROSKA_VIDEO_STEREOMODE_TYPE_COL_INTERLEAVED_LR:
2064 *h_width = 2;
2065 break;
2066 case MATROSKA_VIDEO_STEREOMODE_TYPE_BOTTOM_TOP:
2067 case MATROSKA_VIDEO_STEREOMODE_TYPE_TOP_BOTTOM:
2068 case MATROSKA_VIDEO_STEREOMODE_TYPE_ROW_INTERLEAVED_RL:
2069 case MATROSKA_VIDEO_STEREOMODE_TYPE_ROW_INTERLEAVED_LR:
2070 *h_height = 2;
2071 break;
2072 }
2073}
2074
Neil Birkbeckbbda13a2016-03-01 00:41:042075static int mkv_parse_video_color(AVStream *st, const MatroskaTrack *track) {
James Almer4e759072016-12-05 02:22:392076 const MatroskaTrackVideoColor *color = track->video.color.elem;
2077 const MatroskaMasteringMeta *mastering_meta;
2078 int has_mastering_primaries, has_mastering_luminance;
2079
2080 if (!track->video.color.nb_elem)
2081 return 0;
2082
2083 mastering_meta = &color->mastering_meta;
Neil Birkbeckbbda13a2016-03-01 00:41:042084 // Mastering primaries are CIE 1931 coords, and must be > 0.
James Almer4e759072016-12-05 02:22:392085 has_mastering_primaries =
Neil Birkbeckbbda13a2016-03-01 00:41:042086 mastering_meta->r_x > 0 && mastering_meta->r_y > 0 &&
2087 mastering_meta->g_x > 0 && mastering_meta->g_y > 0 &&
2088 mastering_meta->b_x > 0 && mastering_meta->b_y > 0 &&
2089 mastering_meta->white_x > 0 && mastering_meta->white_y > 0;
James Almer4e759072016-12-05 02:22:392090 has_mastering_luminance = mastering_meta->max_luminance > 0;
Neil Birkbeckbbda13a2016-03-01 00:41:042091
James Almer4e759072016-12-05 02:22:392092 if (color->matrix_coefficients != AVCOL_SPC_RESERVED)
2093 st->codecpar->color_space = color->matrix_coefficients;
2094 if (color->primaries != AVCOL_PRI_RESERVED &&
2095 color->primaries != AVCOL_PRI_RESERVED0)
2096 st->codecpar->color_primaries = color->primaries;
2097 if (color->transfer_characteristics != AVCOL_TRC_RESERVED &&
2098 color->transfer_characteristics != AVCOL_TRC_RESERVED0)
2099 st->codecpar->color_trc = color->transfer_characteristics;
2100 if (color->range != AVCOL_RANGE_UNSPECIFIED &&
2101 color->range <= AVCOL_RANGE_JPEG)
2102 st->codecpar->color_range = color->range;
2103 if (color->chroma_siting_horz != MATROSKA_COLOUR_CHROMASITINGHORZ_UNDETERMINED &&
2104 color->chroma_siting_vert != MATROSKA_COLOUR_CHROMASITINGVERT_UNDETERMINED &&
2105 color->chroma_siting_horz < MATROSKA_COLOUR_CHROMASITINGHORZ_NB &&
2106 color->chroma_siting_vert < MATROSKA_COLOUR_CHROMASITINGVERT_NB) {
James Almer47ee6f12016-10-18 02:50:142107 st->codecpar->chroma_location =
James Almer4e759072016-12-05 02:22:392108 avcodec_chroma_pos_to_enum((color->chroma_siting_horz - 1) << 7,
2109 (color->chroma_siting_vert - 1) << 7);
James Almer47ee6f12016-10-18 02:50:142110 }
James Almer095147a2017-04-25 18:04:002111 if (color->max_cll && color->max_fall) {
2112 size_t size = 0;
2113 int ret;
2114 AVContentLightMetadata *metadata = av_content_light_metadata_alloc(&size);
2115 if (!metadata)
2116 return AVERROR(ENOMEM);
2117 ret = av_stream_add_side_data(st, AV_PKT_DATA_CONTENT_LIGHT_LEVEL,
2118 (uint8_t *)metadata, size);
2119 if (ret < 0) {
2120 av_freep(&metadata);
2121 return ret;
2122 }
2123 metadata->MaxCLL = color->max_cll;
2124 metadata->MaxFALL = color->max_fall;
2125 }
Neil Birkbeckbbda13a2016-03-01 00:41:042126
2127 if (has_mastering_primaries || has_mastering_luminance) {
Neil Birkbeckbbda13a2016-03-01 00:41:042128 AVMasteringDisplayMetadata *metadata =
2129 (AVMasteringDisplayMetadata*) av_stream_new_side_data(
2130 st, AV_PKT_DATA_MASTERING_DISPLAY_METADATA,
2131 sizeof(AVMasteringDisplayMetadata));
2132 if (!metadata) {
2133 return AVERROR(ENOMEM);
2134 }
2135 memset(metadata, 0, sizeof(AVMasteringDisplayMetadata));
2136 if (has_mastering_primaries) {
James Almer3b4e9a32019-10-03 23:52:202137 metadata->display_primaries[0][0] = av_d2q(mastering_meta->r_x, INT_MAX);
2138 metadata->display_primaries[0][1] = av_d2q(mastering_meta->r_y, INT_MAX);
2139 metadata->display_primaries[1][0] = av_d2q(mastering_meta->g_x, INT_MAX);
2140 metadata->display_primaries[1][1] = av_d2q(mastering_meta->g_y, INT_MAX);
2141 metadata->display_primaries[2][0] = av_d2q(mastering_meta->b_x, INT_MAX);
2142 metadata->display_primaries[2][1] = av_d2q(mastering_meta->b_y, INT_MAX);
2143 metadata->white_point[0] = av_d2q(mastering_meta->white_x, INT_MAX);
2144 metadata->white_point[1] = av_d2q(mastering_meta->white_y, INT_MAX);
Neil Birkbeckbbda13a2016-03-01 00:41:042145 metadata->has_primaries = 1;
2146 }
2147 if (has_mastering_luminance) {
James Almer3b4e9a32019-10-03 23:52:202148 metadata->max_luminance = av_d2q(mastering_meta->max_luminance, INT_MAX);
2149 metadata->min_luminance = av_d2q(mastering_meta->min_luminance, INT_MAX);
Neil Birkbeckbbda13a2016-03-01 00:41:042150 metadata->has_luminance = 1;
2151 }
2152 }
2153 return 0;
2154}
2155
James Almer445204c2016-12-06 17:48:452156static int mkv_parse_video_projection(AVStream *st, const MatroskaTrack *track) {
2157 AVSphericalMapping *spherical;
2158 enum AVSphericalProjection projection;
2159 size_t spherical_size;
Vittorio Giovaraf20bcec2017-03-16 21:20:472160 uint32_t l = 0, t = 0, r = 0, b = 0;
2161 uint32_t padding = 0;
James Almer445204c2016-12-06 17:48:452162 int ret;
Vittorio Giovarabde96422017-02-10 21:02:222163 GetByteContext gb;
2164
2165 bytestream2_init(&gb, track->video.projection.private.data,
2166 track->video.projection.private.size);
2167
2168 if (bytestream2_get_byte(&gb) != 0) {
2169 av_log(NULL, AV_LOG_WARNING, "Unknown spherical metadata\n");
2170 return 0;
2171 }
2172
2173 bytestream2_skip(&gb, 3); // flags
James Almer445204c2016-12-06 17:48:452174
2175 switch (track->video.projection.type) {
2176 case MATROSKA_VIDEO_PROJECTION_TYPE_EQUIRECTANGULAR:
Vittorio Giovara9ae35062017-03-07 22:34:322177 if (track->video.projection.private.size == 20) {
Vittorio Giovarabde96422017-02-10 21:02:222178 t = bytestream2_get_be32(&gb);
2179 b = bytestream2_get_be32(&gb);
2180 l = bytestream2_get_be32(&gb);
2181 r = bytestream2_get_be32(&gb);
2182
2183 if (b >= UINT_MAX - t || r >= UINT_MAX - l) {
2184 av_log(NULL, AV_LOG_ERROR,
2185 "Invalid bounding rectangle coordinates "
Vittorio Giovaraf20bcec2017-03-16 21:20:472186 "%"PRIu32",%"PRIu32",%"PRIu32",%"PRIu32"\n",
Vittorio Giovarabde96422017-02-10 21:02:222187 l, t, r, b);
2188 return AVERROR_INVALIDDATA;
2189 }
Vittorio Giovara9ae35062017-03-07 22:34:322190 } else if (track->video.projection.private.size != 0) {
Vittorio Giovarabde96422017-02-10 21:02:222191 av_log(NULL, AV_LOG_ERROR, "Unknown spherical metadata\n");
2192 return AVERROR_INVALIDDATA;
2193 }
Vittorio Giovara9ae35062017-03-07 22:34:322194
2195 if (l || t || r || b)
2196 projection = AV_SPHERICAL_EQUIRECTANGULAR_TILE;
2197 else
2198 projection = AV_SPHERICAL_EQUIRECTANGULAR;
James Almer445204c2016-12-06 17:48:452199 break;
2200 case MATROSKA_VIDEO_PROJECTION_TYPE_CUBEMAP:
Vittorio Giovarabde96422017-02-10 21:02:222201 if (track->video.projection.private.size < 4) {
2202 av_log(NULL, AV_LOG_ERROR, "Missing projection private properties\n");
James Almer445204c2016-12-06 17:48:452203 return AVERROR_INVALIDDATA;
Vittorio Giovarabde96422017-02-10 21:02:222204 } else if (track->video.projection.private.size == 12) {
2205 uint32_t layout = bytestream2_get_be32(&gb);
Vittorio Giovara9ae35062017-03-07 22:34:322206 if (layout) {
Vittorio Giovarabde96422017-02-10 21:02:222207 av_log(NULL, AV_LOG_WARNING,
2208 "Unknown spherical cubemap layout %"PRIu32"\n", layout);
2209 return 0;
2210 }
Vittorio Giovara9ae35062017-03-07 22:34:322211 projection = AV_SPHERICAL_CUBEMAP;
Vittorio Giovarabde96422017-02-10 21:02:222212 padding = bytestream2_get_be32(&gb);
2213 } else {
2214 av_log(NULL, AV_LOG_ERROR, "Unknown spherical metadata\n");
2215 return AVERROR_INVALIDDATA;
2216 }
James Almer445204c2016-12-06 17:48:452217 break;
James Almer55fe72a2017-11-02 23:42:052218 case MATROSKA_VIDEO_PROJECTION_TYPE_RECTANGULAR:
2219 /* No Spherical metadata */
2220 return 0;
James Almer445204c2016-12-06 17:48:452221 default:
James Almer251849f2016-12-06 17:48:452222 av_log(NULL, AV_LOG_WARNING,
2223 "Unknown spherical metadata type %"PRIu64"\n",
2224 track->video.projection.type);
James Almer445204c2016-12-06 17:48:452225 return 0;
2226 }
2227
2228 spherical = av_spherical_alloc(&spherical_size);
2229 if (!spherical)
2230 return AVERROR(ENOMEM);
James Almer251849f2016-12-06 17:48:452231
James Almer445204c2016-12-06 17:48:452232 spherical->projection = projection;
2233
James Almer251849f2016-12-06 17:48:452234 spherical->yaw = (int32_t) (track->video.projection.yaw * (1 << 16));
2235 spherical->pitch = (int32_t) (track->video.projection.pitch * (1 << 16));
2236 spherical->roll = (int32_t) (track->video.projection.roll * (1 << 16));
James Almer445204c2016-12-06 17:48:452237
Vittorio Giovarabde96422017-02-10 21:02:222238 spherical->padding = padding;
2239
2240 spherical->bound_left = l;
2241 spherical->bound_top = t;
2242 spherical->bound_right = r;
2243 spherical->bound_bottom = b;
2244
James Almer445204c2016-12-06 17:48:452245 ret = av_stream_add_side_data(st, AV_PKT_DATA_SPHERICAL, (uint8_t *)spherical,
2246 spherical_size);
James Almer8396d542016-12-08 04:21:112247 if (ret < 0) {
2248 av_freep(&spherical);
James Almer445204c2016-12-06 17:48:452249 return ret;
James Almer8396d542016-12-08 04:21:112250 }
James Almer445204c2016-12-06 17:48:452251
2252 return 0;
2253}
2254
Mats Peterson71f73ee2016-01-10 02:59:212255static int get_qt_codec(MatroskaTrack *track, uint32_t *fourcc, enum AVCodecID *codec_id)
2256{
2257 const AVCodecTag *codec_tags;
2258
2259 codec_tags = track->type == MATROSKA_TRACK_TYPE_VIDEO ?
2260 ff_codec_movvideo_tags : ff_codec_movaudio_tags;
2261
2262 /* Normalize noncompliant private data that starts with the fourcc
2263 * by expanding/shifting the data by 4 bytes and storing the data
2264 * size at the start. */
2265 if (ff_codec_get_id(codec_tags, AV_RL32(track->codec_priv.data))) {
James Almera6188662018-04-04 17:12:542266 int ret = av_buffer_realloc(&track->codec_priv.buf,
2267 track->codec_priv.size + 4 + AV_INPUT_BUFFER_PADDING_SIZE);
2268 if (ret < 0)
2269 return ret;
2270
2271 track->codec_priv.data = track->codec_priv.buf->data;
2272 memmove(track->codec_priv.data + 4, track->codec_priv.data, track->codec_priv.size);
Mats Peterson71f73ee2016-01-10 02:59:212273 track->codec_priv.size += 4;
2274 AV_WB32(track->codec_priv.data, track->codec_priv.size);
2275 }
2276
2277 *fourcc = AV_RL32(track->codec_priv.data + 4);
2278 *codec_id = ff_codec_get_id(codec_tags, *fourcc);
2279
2280 return 0;
2281}
2282
Anton Khirnov6df478b2014-05-25 07:07:322283static int matroska_parse_tracks(AVFormatContext *s)
David Conradb061d892007-06-04 22:10:542284{
2285 MatroskaDemuxContext *matroska = s->priv_data;
Anton Khirnov6df478b2014-05-25 07:07:322286 MatroskaTrack *tracks = matroska->tracks.elem;
Aurelien Jacobs9a9a3b02008-08-05 00:40:492287 AVStream *st;
Anton Khirnov4efdadc2014-05-25 12:05:512288 int i, j, ret;
Michael Niedermayer69de2292014-05-28 10:41:352289 int k;
David Conradb061d892007-06-04 22:10:542290
Keiji Costantini84cfce92014-03-01 16:28:152291 for (i = 0; i < matroska->tracks.nb_elem; i++) {
Aurelien Jacobsd88d8062008-08-05 00:40:522292 MatroskaTrack *track = &tracks[i];
Anton Khirnov36ef5362012-08-05 09:11:042293 enum AVCodecID codec_id = AV_CODEC_ID_NONE;
Aurelien Jacobsdc6c36c2011-08-17 22:21:212294 EbmlList *encodings_list = &track->encodings;
Aurelien Jacobs9c25baf2008-08-05 00:40:552295 MatroskaTrackEncoding *encodings = encodings_list->elem;
Aurelien Jacobsd88d8062008-08-05 00:40:522296 uint8_t *extradata = NULL;
2297 int extradata_size = 0;
2298 int extradata_offset = 0;
Aurelien Jacobs5fec3a22011-06-13 23:58:112299 uint32_t fourcc = 0;
Anton Khirnov471fe572011-02-20 10:04:122300 AVIOContext b;
Frank Galliganb8531032013-03-07 16:11:382301 char* key_id_base64 = NULL;
Carl Eugen Hoyos96fc2902014-02-25 23:02:512302 int bit_depth = -1;
David Conradb061d892007-06-04 22:10:542303
Aurelien Jacobsd88d8062008-08-05 00:40:522304 /* Apply some sanity checks. */
Aurelien Jacobs9c25baf2008-08-05 00:40:552305 if (track->type != MATROSKA_TRACK_TYPE_VIDEO &&
2306 track->type != MATROSKA_TRACK_TYPE_AUDIO &&
Matthew Heaney818ebe92013-08-08 22:40:032307 track->type != MATROSKA_TRACK_TYPE_SUBTITLE &&
2308 track->type != MATROSKA_TRACK_TYPE_METADATA) {
Aurelien Jacobs9c25baf2008-08-05 00:40:552309 av_log(matroska->ctx, AV_LOG_INFO,
2310 "Unknown or unsupported track type %"PRIu64"\n",
2311 track->type);
2312 continue;
2313 }
Gabriel Dumef929ab02014-08-14 20:31:242314 if (!track->codec_id)
Aurelien Jacobsd88d8062008-08-05 00:40:522315 continue;
David Conradb061d892007-06-04 22:10:542316
Andreas Cadhalpun5b76c822015-06-15 18:59:222317 if (track->audio.samplerate < 0 || track->audio.samplerate > INT_MAX ||
2318 isnan(track->audio.samplerate)) {
2319 av_log(matroska->ctx, AV_LOG_WARNING,
2320 "Invalid sample rate %f, defaulting to 8000 instead.\n",
2321 track->audio.samplerate);
2322 track->audio.samplerate = 8000;
2323 }
2324
Aurelien Jacobs9c25baf2008-08-05 00:40:552325 if (track->type == MATROSKA_TRACK_TYPE_VIDEO) {
Nikolas Bowee07649e2018-01-18 23:21:562326 if (!track->default_duration && track->video.frame_rate > 0) {
2327 double default_duration = 1000000000 / track->video.frame_rate;
2328 if (default_duration > UINT64_MAX || default_duration < 0) {
2329 av_log(matroska->ctx, AV_LOG_WARNING,
2330 "Invalid frame rate %e. Cannot calculate default duration.\n",
2331 track->video.frame_rate);
2332 } else {
2333 track->default_duration = default_duration;
2334 }
2335 }
Michael Niedermayerf51ce342013-04-03 21:40:132336 if (track->video.display_width == -1)
Aurelien Jacobs9c25baf2008-08-05 00:40:552337 track->video.display_width = track->video.pixel_width;
Michael Niedermayerf51ce342013-04-03 21:40:132338 if (track->video.display_height == -1)
Aurelien Jacobs9c25baf2008-08-05 00:40:552339 track->video.display_height = track->video.pixel_height;
Aurelien Jacobsfdb5e022011-06-14 00:00:062340 if (track->video.color_space.size == 4)
2341 fourcc = AV_RL32(track->video.color_space.data);
Aurelien Jacobs9c25baf2008-08-05 00:40:552342 } else if (track->type == MATROSKA_TRACK_TYPE_AUDIO) {
2343 if (!track->audio.out_samplerate)
2344 track->audio.out_samplerate = track->audio.samplerate;
2345 }
2346 if (encodings_list->nb_elem > 1) {
2347 av_log(matroska->ctx, AV_LOG_ERROR,
Dustin Brodyd7d2f0e2011-09-15 07:34:382348 "Multiple combined encodings not supported");
Aurelien Jacobs9c25baf2008-08-05 00:40:552349 } else if (encodings_list->nb_elem == 1) {
Frank Galliganb8531032013-03-07 16:11:382350 if (encodings[0].type) {
2351 if (encodings[0].encryption.key_id.size > 0) {
2352 /* Save the encryption key id to be stored later as a
2353 metadata tag. */
2354 const int b64_size = AV_BASE64_SIZE(encodings[0].encryption.key_id.size);
2355 key_id_base64 = av_malloc(b64_size);
2356 if (key_id_base64 == NULL)
2357 return AVERROR(ENOMEM);
2358
2359 av_base64_encode(key_id_base64, b64_size,
2360 encodings[0].encryption.key_id.data,
2361 encodings[0].encryption.key_id.size);
2362 } else {
2363 encodings[0].scope = 0;
2364 av_log(matroska->ctx, AV_LOG_ERROR,
2365 "Unsupported encoding type");
2366 }
2367 } else if (
Aurelien Jacobsb250f9c2009-01-13 23:44:162368#if CONFIG_ZLIB
Keiji Costantini84cfce92014-03-01 16:28:152369 encodings[0].compression.algo != MATROSKA_TRACK_ENCODING_COMP_ZLIB &&
Aurelien Jacobs9c25baf2008-08-05 00:40:552370#endif
Aurelien Jacobsb250f9c2009-01-13 23:44:162371#if CONFIG_BZLIB
Aurelien Jacobs9c25baf2008-08-05 00:40:552372 encodings[0].compression.algo != MATROSKA_TRACK_ENCODING_COMP_BZLIB &&
2373#endif
Diego Biurrun2a91ada2012-10-18 17:48:272374#if CONFIG_LZO
Keiji Costantini84cfce92014-03-01 16:28:152375 encodings[0].compression.algo != MATROSKA_TRACK_ENCODING_COMP_LZO &&
Diego Biurrun2a91ada2012-10-18 17:48:272376#endif
Frank Galliganb8531032013-03-07 16:11:382377 encodings[0].compression.algo != MATROSKA_TRACK_ENCODING_COMP_HEADERSTRIP) {
Aurelien Jacobs9c25baf2008-08-05 00:40:552378 encodings[0].scope = 0;
2379 av_log(matroska->ctx, AV_LOG_ERROR,
2380 "Unsupported encoding type");
Keiji Costantini84cfce92014-03-01 16:28:152381 } else if (track->codec_priv.size && encodings[0].scope & 2) {
Aurelien Jacobs9c25baf2008-08-05 00:40:552382 uint8_t *codec_priv = track->codec_priv.data;
Luca Barbato8d4dd552012-09-14 16:51:492383 int ret = matroska_decode_buffer(&track->codec_priv.data,
2384 &track->codec_priv.size,
2385 track);
2386 if (ret < 0) {
Aurelien Jacobs9c25baf2008-08-05 00:40:552387 track->codec_priv.data = NULL;
2388 track->codec_priv.size = 0;
2389 av_log(matroska->ctx, AV_LOG_ERROR,
2390 "Failed to decode codec private data\n");
Aurelien Jacobs9c25baf2008-08-05 00:40:552391 }
Luca Barbato8d4dd552012-09-14 16:51:492392
James Almera6188662018-04-04 17:12:542393 if (codec_priv != track->codec_priv.data) {
2394 av_buffer_unref(&track->codec_priv.buf);
2395 if (track->codec_priv.data) {
2396 track->codec_priv.buf = av_buffer_create(track->codec_priv.data,
2397 track->codec_priv.size + AV_INPUT_BUFFER_PADDING_SIZE,
2398 NULL, NULL, 0);
2399 if (!track->codec_priv.buf) {
2400 av_freep(&track->codec_priv.data);
2401 track->codec_priv.size = 0;
2402 return AVERROR(ENOMEM);
2403 }
2404 }
2405 }
Aurelien Jacobs9c25baf2008-08-05 00:40:552406 }
2407 }
2408
Keiji Costantini84cfce92014-03-01 16:28:152409 for (j = 0; ff_mkv_codec_tags[j].id != AV_CODEC_ID_NONE; j++) {
2410 if (!strncmp(ff_mkv_codec_tags[j].str, track->codec_id,
2411 strlen(ff_mkv_codec_tags[j].str))) {
2412 codec_id = ff_mkv_codec_tags[j].id;
Aurelien Jacobsd88d8062008-08-05 00:40:522413 break;
David Conradb061d892007-06-04 22:10:542414 }
Aurelien Jacobsd88d8062008-08-05 00:40:522415 }
David Conradb061d892007-06-04 22:10:542416
Anton Khirnov3b3bbdd2011-06-18 09:43:242417 st = track->stream = avformat_new_stream(s, NULL);
Michael Niedermayerfb33bff2014-08-15 18:33:212418 if (!st) {
Frank Galliganb8531032013-03-07 16:11:382419 av_free(key_id_base64);
Aurelien Jacobsd88d8062008-08-05 00:40:522420 return AVERROR(ENOMEM);
Frank Galliganb8531032013-03-07 16:11:382421 }
2422
2423 if (key_id_base64) {
2424 /* export encryption key id as base64 metadata tag */
Andreas Rheinhardt40d9cbd2019-11-10 04:07:312425 av_dict_set(&st->metadata, "enc_key_id", key_id_base64,
2426 AV_DICT_DONT_STRDUP_VAL);
Frank Galliganb8531032013-03-07 16:11:382427 }
Aurelien Jacobsd88d8062008-08-05 00:40:522428
Keiji Costantini84cfce92014-03-01 16:28:152429 if (!strcmp(track->codec_id, "V_MS/VFW/FOURCC") &&
Michael Niedermayerb3d9ab12014-03-07 22:46:372430 track->codec_priv.size >= 40 &&
Gabriel Dume4b1f5e52014-08-14 20:31:252431 track->codec_priv.data) {
Keiji Costantini84cfce92014-03-01 16:28:152432 track->ms_compat = 1;
Michael Niedermayerb3d9ab12014-03-07 22:46:372433 bit_depth = AV_RL16(track->codec_priv.data + 14);
2434 fourcc = AV_RL32(track->codec_priv.data + 16);
Keiji Costantini84cfce92014-03-01 16:28:152435 codec_id = ff_codec_get_id(ff_codec_bmp_tags,
Michael Niedermayerb3d9ab12014-03-07 22:46:372436 fourcc);
Carl Eugen Hoyosade58512014-04-27 07:34:132437 if (!codec_id)
2438 codec_id = ff_codec_get_id(ff_codec_movvideo_tags,
2439 fourcc);
Keiji Costantini84cfce92014-03-01 16:28:152440 extradata_offset = 40;
2441 } else if (!strcmp(track->codec_id, "A_MS/ACM") &&
2442 track->codec_priv.size >= 14 &&
Gabriel Dume4b1f5e52014-08-14 20:31:252443 track->codec_priv.data) {
Max Hornca402f32011-04-12 15:44:202444 int ret;
Keiji Costantini84cfce92014-03-01 16:28:152445 ffio_init_context(&b, track->codec_priv.data,
2446 track->codec_priv.size,
Michael Niedermayerd0b45042013-01-04 12:00:142447 0, NULL, NULL, NULL, NULL);
Derek Buitenhuis6f69f7a2016-04-10 19:58:152448 ret = ff_get_wav_header(s, &b, st->codecpar, track->codec_priv.size, 0);
Max Hornca402f32011-04-12 15:44:202449 if (ret < 0)
2450 return ret;
Anton Khirnov92005142014-06-18 18:42:522451 codec_id = st->codecpar->codec_id;
Derek Buitenhuis6f69f7a2016-04-10 19:58:152452 fourcc = st->codecpar->codec_tag;
Aurelien Jacobs038146e2009-10-01 21:14:052453 extradata_offset = FFMIN(track->codec_priv.size, 18);
Michael Niedermayer48218582014-01-19 17:35:332454 } else if (!strcmp(track->codec_id, "A_QUICKTIME")
Mats Peterson71f73ee2016-01-10 02:59:212455 /* Normally 36, but allow noncompliant private data */
2456 && (track->codec_priv.size >= 32)
Michael Niedermayer81a663f2014-08-15 19:31:592457 && (track->codec_priv.data)) {
Mats Peterson535d09a2016-01-15 22:25:382458 uint16_t sample_size;
Mats Peterson71f73ee2016-01-10 02:59:212459 int ret = get_qt_codec(track, &fourcc, &codec_id);
2460 if (ret < 0)
2461 return ret;
Mats Peterson535d09a2016-01-15 22:25:382462 sample_size = AV_RB16(track->codec_priv.data + 26);
Mats Peterson6f1466d2016-01-08 11:55:592463 if (fourcc == 0) {
Mats Peterson535d09a2016-01-15 22:25:382464 if (sample_size == 8) {
Mats Peterson6f1466d2016-01-08 11:55:592465 fourcc = MKTAG('r','a','w',' ');
2466 codec_id = ff_codec_get_id(ff_codec_movaudio_tags, fourcc);
Mats Peterson535d09a2016-01-15 22:25:382467 } else if (sample_size == 16) {
Mats Peterson6f1466d2016-01-08 11:55:592468 fourcc = MKTAG('t','w','o','s');
2469 codec_id = ff_codec_get_id(ff_codec_movaudio_tags, fourcc);
2470 }
2471 }
Mats Peterson535d09a2016-01-15 22:25:382472 if ((fourcc == MKTAG('t','w','o','s') ||
2473 fourcc == MKTAG('s','o','w','t')) &&
2474 sample_size == 8)
2475 codec_id = AV_CODEC_ID_PCM_S8;
Keiji Costantini84cfce92014-03-01 16:28:152476 } else if (!strcmp(track->codec_id, "V_QUICKTIME") &&
Michael Niedermayerb3d9ab12014-03-07 22:46:372477 (track->codec_priv.size >= 21) &&
Gabriel Dume4b1f5e52014-08-14 20:31:252478 (track->codec_priv.data)) {
Mats Peterson71f73ee2016-01-10 02:59:212479 int ret = get_qt_codec(track, &fourcc, &codec_id);
2480 if (ret < 0)
2481 return ret;
Mats Peterson6a975cb2016-01-06 03:16:322482 if (codec_id == AV_CODEC_ID_NONE && AV_RL32(track->codec_priv.data+4) == AV_RL32("SMI ")) {
2483 fourcc = MKTAG('S','V','Q','3');
2484 codec_id = ff_codec_get_id(ff_codec_movvideo_tags, fourcc);
2485 }
Clément Bœschcd4d6cb2017-03-26 23:31:522486 if (codec_id == AV_CODEC_ID_NONE)
Vittorio Giovara8fc11ab2015-05-11 16:23:432487 av_log(matroska->ctx, AV_LOG_ERROR,
Clément Bœschcd4d6cb2017-03-26 23:31:522488 "mov FourCC not found %s.\n", av_fourcc2str(fourcc));
Mats Peterson79736032015-12-27 20:28:092489 if (track->codec_priv.size >= 86) {
2490 bit_depth = AV_RB16(track->codec_priv.data + 82);
2491 ffio_init_context(&b, track->codec_priv.data,
2492 track->codec_priv.size,
2493 0, NULL, NULL, NULL, NULL);
Mats Peterson6aac43f2016-02-24 17:14:052494 if (ff_get_qtpalette(codec_id, &b, track->palette)) {
Mats Peterson79736032015-12-27 20:28:092495 bit_depth &= 0x1F;
Mats Peterson6aac43f2016-02-24 17:14:052496 track->has_palette = 1;
Mats Peterson79736032015-12-27 20:28:092497 }
2498 }
Anton Khirnov36ef5362012-08-05 09:11:042499 } else if (codec_id == AV_CODEC_ID_PCM_S16BE) {
Aurelien Jacobseb9cf502008-08-20 00:49:452500 switch (track->audio.bitdepth) {
Keiji Costantini84cfce92014-03-01 16:28:152501 case 8:
2502 codec_id = AV_CODEC_ID_PCM_U8;
2503 break;
2504 case 24:
2505 codec_id = AV_CODEC_ID_PCM_S24BE;
2506 break;
2507 case 32:
2508 codec_id = AV_CODEC_ID_PCM_S32BE;
2509 break;
Aurelien Jacobseb9cf502008-08-20 00:49:452510 }
Anton Khirnov36ef5362012-08-05 09:11:042511 } else if (codec_id == AV_CODEC_ID_PCM_S16LE) {
Aurelien Jacobseb9cf502008-08-20 00:49:452512 switch (track->audio.bitdepth) {
Keiji Costantini84cfce92014-03-01 16:28:152513 case 8:
2514 codec_id = AV_CODEC_ID_PCM_U8;
2515 break;
2516 case 24:
2517 codec_id = AV_CODEC_ID_PCM_S24LE;
2518 break;
2519 case 32:
2520 codec_id = AV_CODEC_ID_PCM_S32LE;
2521 break;
Aurelien Jacobseb9cf502008-08-20 00:49:452522 }
Keiji Costantini84cfce92014-03-01 16:28:152523 } else if (codec_id == AV_CODEC_ID_PCM_F32LE &&
2524 track->audio.bitdepth == 64) {
Anton Khirnov36ef5362012-08-05 09:11:042525 codec_id = AV_CODEC_ID_PCM_F64LE;
2526 } else if (codec_id == AV_CODEC_ID_AAC && !track->codec_priv.size) {
Aurelien Jacobsd88d8062008-08-05 00:40:522527 int profile = matroska_aac_profile(track->codec_id);
Keiji Costantini84cfce92014-03-01 16:28:152528 int sri = matroska_aac_sri(track->audio.samplerate);
Vittorio Giovara059a9342015-06-29 21:48:342529 extradata = av_mallocz(5 + AV_INPUT_BUFFER_PADDING_SIZE);
Gabriel Dumef929ab02014-08-14 20:31:242530 if (!extradata)
Aurelien Jacobs28f450a2008-08-05 00:40:092531 return AVERROR(ENOMEM);
Keiji Costantini84cfce92014-03-01 16:28:152532 extradata[0] = (profile << 3) | ((sri & 0x0E) >> 1);
2533 extradata[1] = ((sri & 0x01) << 7) | (track->audio.channels << 3);
Aurelien Jacobsd88d8062008-08-05 00:40:522534 if (strstr(track->codec_id, "SBR")) {
Keiji Costantini84cfce92014-03-01 16:28:152535 sri = matroska_aac_sri(track->audio.out_samplerate);
2536 extradata[2] = 0x56;
2537 extradata[3] = 0xE5;
2538 extradata[4] = 0x80 | (sri << 3);
Aurelien Jacobsd88d8062008-08-05 00:40:522539 extradata_size = 5;
Aurelien Jacobs16f97ab2008-08-05 00:41:102540 } else
Aurelien Jacobsd88d8062008-08-05 00:40:522541 extradata_size = 2;
Michael Niedermayer29d147c2015-07-27 20:53:162542 } else if (codec_id == AV_CODEC_ID_ALAC && track->codec_priv.size && track->codec_priv.size < INT_MAX - 12 - AV_INPUT_BUFFER_PADDING_SIZE) {
Paul B Mahol9644fc92013-06-07 10:06:152543 /* Only ALAC's magic cookie is stored in Matroska's track headers.
Keiji Costantini84cfce92014-03-01 16:28:152544 * Create the "atom size", "tag", and "tag version" fields the
2545 * decoder expects manually. */
Paul B Mahol9644fc92013-06-07 10:06:152546 extradata_size = 12 + track->codec_priv.size;
Keiji Costantini84cfce92014-03-01 16:28:152547 extradata = av_mallocz(extradata_size +
Vittorio Giovara059a9342015-06-29 21:48:342548 AV_INPUT_BUFFER_PADDING_SIZE);
Gabriel Dumef929ab02014-08-14 20:31:242549 if (!extradata)
Paul B Mahol9644fc92013-06-07 10:06:152550 return AVERROR(ENOMEM);
2551 AV_WB32(extradata, extradata_size);
2552 memcpy(&extradata[4], "alac", 4);
2553 AV_WB32(&extradata[8], 0);
2554 memcpy(&extradata[12], track->codec_priv.data,
Keiji Costantini84cfce92014-03-01 16:28:152555 track->codec_priv.size);
Anton Khirnov36ef5362012-08-05 09:11:042556 } else if (codec_id == AV_CODEC_ID_TTA) {
Andreas Rheinhardt668490a2019-12-03 17:09:052557 uint8_t *ptr;
Andreas Rheinhardtf7bf59b2019-12-03 17:09:032558 if (track->audio.channels > UINT16_MAX ||
2559 track->audio.bitdepth > UINT16_MAX) {
2560 av_log(matroska->ctx, AV_LOG_WARNING,
2561 "Too large audio channel number %"PRIu64
2562 " or bitdepth %"PRIu64". Skipping track.\n",
2563 track->audio.channels, track->audio.bitdepth);
2564 if (matroska->ctx->error_recognition & AV_EF_EXPLODE)
2565 return AVERROR_INVALIDDATA;
2566 else
2567 continue;
2568 }
2569 if (track->audio.out_samplerate < 0 || track->audio.out_samplerate > INT_MAX)
2570 return AVERROR_INVALIDDATA;
Andreas Rheinhardteec26b52019-12-03 17:09:042571 extradata_size = 22;
Michael Niedermayer29d147c2015-07-27 20:53:162572 extradata = av_mallocz(extradata_size + AV_INPUT_BUFFER_PADDING_SIZE);
Gabriel Dumef929ab02014-08-14 20:31:242573 if (!extradata)
Aurelien Jacobsd88d8062008-08-05 00:40:522574 return AVERROR(ENOMEM);
Andreas Rheinhardt668490a2019-12-03 17:09:052575 ptr = extradata;
2576 bytestream_put_be32(&ptr, AV_RB32("TTA1"));
2577 bytestream_put_le16(&ptr, 1);
2578 bytestream_put_le16(&ptr, track->audio.channels);
2579 bytestream_put_le16(&ptr, track->audio.bitdepth);
2580 bytestream_put_le32(&ptr, track->audio.out_samplerate);
2581 bytestream_put_le32(&ptr, av_rescale(matroska->duration * matroska->time_scale,
2582 track->audio.out_samplerate,
2583 AV_TIME_BASE * 1000));
Keiji Costantini84cfce92014-03-01 16:28:152584 } else if (codec_id == AV_CODEC_ID_RV10 ||
2585 codec_id == AV_CODEC_ID_RV20 ||
2586 codec_id == AV_CODEC_ID_RV30 ||
2587 codec_id == AV_CODEC_ID_RV40) {
Aurelien Jacobsd88d8062008-08-05 00:40:522588 extradata_offset = 26;
Anton Khirnov36ef5362012-08-05 09:11:042589 } else if (codec_id == AV_CODEC_ID_RA_144) {
Aurelien Jacobsd88d8062008-08-05 00:40:522590 track->audio.out_samplerate = 8000;
Keiji Costantini84cfce92014-03-01 16:28:152591 track->audio.channels = 1;
Michael Niedermayerb3d9ab12014-03-07 22:46:372592 } else if ((codec_id == AV_CODEC_ID_RA_288 ||
2593 codec_id == AV_CODEC_ID_COOK ||
2594 codec_id == AV_CODEC_ID_ATRAC3 ||
2595 codec_id == AV_CODEC_ID_SIPR)
2596 && track->codec_priv.data) {
Aurelien Jacobs6b102282010-03-12 23:49:062597 int flavor;
Michael Niedermayer0b271362012-04-14 17:33:242598
Keiji Costantini84cfce92014-03-01 16:28:152599 ffio_init_context(&b, track->codec_priv.data,
2600 track->codec_priv.size,
2601 0, NULL, NULL, NULL, NULL);
Anton Khirnov45a8a022011-03-15 08:14:382602 avio_skip(&b, 22);
Anton Khirnove63a3622011-02-21 15:43:012603 flavor = avio_rb16(&b);
2604 track->audio.coded_framesize = avio_rb32(&b);
Anton Khirnov45a8a022011-03-15 08:14:382605 avio_skip(&b, 12);
Anton Khirnove63a3622011-02-21 15:43:012606 track->audio.sub_packet_h = avio_rb16(&b);
2607 track->audio.frame_size = avio_rb16(&b);
2608 track->audio.sub_packet_size = avio_rb16(&b);
Andreas Rheinhardt8287c202019-12-02 09:41:122609 if (track->audio.coded_framesize <= 0 ||
Keiji Costantini84cfce92014-03-01 16:28:152610 track->audio.sub_packet_h <= 0 ||
Andreas Rheinhardtc91e3692020-04-20 05:47:062611 track->audio.frame_size <= 0)
Martin Storsjö569d18a2013-09-16 12:36:242612 return AVERROR_INVALIDDATA;
Andreas Rheinhardt8287c202019-12-02 09:41:122613
Anton Khirnov36ef5362012-08-05 09:11:042614 if (codec_id == AV_CODEC_ID_RA_288) {
Andreas Rheinhardt4f5c6c12020-04-21 22:15:542615 if ((int64_t)track->audio.sub_packet_h * track->audio.coded_framesize
2616 > (2 + (track->audio.sub_packet_h & 1)) * track->audio.frame_size)
2617 return AVERROR_INVALIDDATA;
Anton Khirnov92005142014-06-18 18:42:522618 st->codecpar->block_align = track->audio.coded_framesize;
Aurelien Jacobsd88d8062008-08-05 00:40:522619 track->codec_priv.size = 0;
2620 } else {
Andreas Rheinhardt8287c202019-12-02 09:41:122621 if (codec_id == AV_CODEC_ID_SIPR) {
Michael Niedermayer62cf5c12013-08-04 19:18:492622 static const int sipr_bit_rate[4] = { 6504, 8496, 5000, 16000 };
Andreas Rheinhardt8287c202019-12-02 09:41:122623 if (flavor > 3)
2624 return AVERROR_INVALIDDATA;
Aurelien Jacobs6b102282010-03-12 23:49:062625 track->audio.sub_packet_size = ff_sipr_subpk_size[flavor];
Anton Khirnov92005142014-06-18 18:42:522626 st->codecpar->bit_rate = sipr_bit_rate[flavor];
Andreas Rheinhardtc91e3692020-04-20 05:47:062627 } else if (track->audio.sub_packet_size <= 0)
2628 return AVERROR_INVALIDDATA;
Anton Khirnov92005142014-06-18 18:42:522629 st->codecpar->block_align = track->audio.sub_packet_size;
Keiji Costantini84cfce92014-03-01 16:28:152630 extradata_offset = 78;
David Conradb061d892007-06-04 22:10:542631 }
Andreas Rheinhardt8287c202019-12-02 09:41:122632 track->audio.buf = av_malloc_array(track->audio.sub_packet_h,
2633 track->audio.frame_size);
2634 if (!track->audio.buf)
2635 return AVERROR(ENOMEM);
Anton Khirnov4efdadc2014-05-25 12:05:512636 } else if (codec_id == AV_CODEC_ID_FLAC && track->codec_priv.size) {
2637 ret = matroska_parse_flac(s, track, &extradata_offset);
2638 if (ret < 0)
2639 return ret;
Andreas Rheinhardt048bc3f2019-12-14 00:36:542640 } else if (codec_id == AV_CODEC_ID_WAVPACK && track->codec_priv.size < 2) {
2641 av_log(matroska->ctx, AV_LOG_INFO, "Assuming WavPack version 4.10 "
2642 "in absence of valid CodecPrivate.\n");
2643 extradata_size = 2;
2644 extradata = av_mallocz(2 + AV_INPUT_BUFFER_PADDING_SIZE);
2645 if (!extradata)
2646 return AVERROR(ENOMEM);
2647 AV_WL16(extradata, 0x410);
Carl Eugen Hoyos3d5c8592014-04-06 18:54:482648 } else if (codec_id == AV_CODEC_ID_PRORES && track->codec_priv.size == 4) {
2649 fourcc = AV_RL32(track->codec_priv.data);
James Almeracdea9e2018-01-13 19:04:212650 } else if (codec_id == AV_CODEC_ID_VP9 && track->codec_priv.size) {
2651 /* we don't need any value stored in CodecPrivate.
2652 make sure that it's not exported as extradata. */
2653 track->codec_priv.size = 0;
James Almer8d5604a2018-08-16 21:01:442654 } else if (codec_id == AV_CODEC_ID_AV1 && track->codec_priv.size) {
2655 /* For now, propagate only the OBUs, if any. Once libavcodec is
2656 updated to handle isobmff style extradata this can be removed. */
2657 extradata_offset = 4;
David Conradb061d892007-06-04 22:10:542658 }
Aurelien Jacobse2644402009-08-24 13:40:302659 track->codec_priv.size -= extradata_offset;
Aurelien Jacobsd88d8062008-08-05 00:40:522660
Anton Khirnov36ef5362012-08-05 09:11:042661 if (codec_id == AV_CODEC_ID_NONE)
Aurelien Jacobsd88d8062008-08-05 00:40:522662 av_log(matroska->ctx, AV_LOG_INFO,
Anton Khirnov36ef5362012-08-05 09:11:042663 "Unknown/unsupported AVCodecID %s.\n", track->codec_id);
Aurelien Jacobsd88d8062008-08-05 00:40:522664
Aurelien Jacobs3fc9d7c2008-09-09 11:23:482665 if (track->time_scale < 0.01)
2666 track->time_scale = 1.0;
Keiji Costantini84cfce92014-03-01 16:28:152667 avpriv_set_pts_info(st, 64, matroska->time_scale * track->time_scale,
2668 1000 * 1000 * 1000); /* 64 bit pts in ns */
Aurelien Jacobsd88d8062008-08-05 00:40:522669
Anton Khirnoveb3b5502014-04-29 10:03:132670 /* convert the delay from ns to the track timebase */
Michael Niedermayerb5bc4362016-06-06 02:23:162671 track->codec_delay_in_track_tb = av_rescale_q(track->codec_delay,
Anton Khirnoveb3b5502014-04-29 10:03:132672 (AVRational){ 1, 1000000000 },
2673 st->time_base);
2674
Anton Khirnov92005142014-06-18 18:42:522675 st->codecpar->codec_id = codec_id;
Alex Sukhanov251c96a2013-12-23 09:41:352676
Aurelien Jacobsd88d8062008-08-05 00:40:522677 if (strcmp(track->language, "und"))
Anton Khirnovd2d67e42011-05-22 10:46:292678 av_dict_set(&st->metadata, "language", track->language, 0);
2679 av_dict_set(&st->metadata, "title", track->name, 0);
Aurelien Jacobsd88d8062008-08-05 00:40:522680
2681 if (track->flag_default)
2682 st->disposition |= AV_DISPOSITION_DEFAULT;
Aurelien Jacobs7a617a82010-07-02 16:38:442683 if (track->flag_forced)
2684 st->disposition |= AV_DISPOSITION_FORCED;
Aurelien Jacobsd88d8062008-08-05 00:40:522685
Anton Khirnov92005142014-06-18 18:42:522686 if (!st->codecpar->extradata) {
Keiji Costantini84cfce92014-03-01 16:28:152687 if (extradata) {
Anton Khirnov92005142014-06-18 18:42:522688 st->codecpar->extradata = extradata;
2689 st->codecpar->extradata_size = extradata_size;
Keiji Costantini84cfce92014-03-01 16:28:152690 } else if (track->codec_priv.data && track->codec_priv.size > 0) {
Derek Buitenhuis6f69f7a2016-04-10 19:58:152691 if (ff_alloc_extradata(st->codecpar, track->codec_priv.size))
Aurelien Jacobs553e9f72009-10-01 21:15:362692 return AVERROR(ENOMEM);
Anton Khirnov92005142014-06-18 18:42:522693 memcpy(st->codecpar->extradata,
Aurelien Jacobs553e9f72009-10-01 21:15:362694 track->codec_priv.data + extradata_offset,
2695 track->codec_priv.size);
2696 }
Aurelien Jacobsff0d5a72009-10-01 21:14:462697 }
Aurelien Jacobsd88d8062008-08-05 00:40:522698
2699 if (track->type == MATROSKA_TRACK_TYPE_VIDEO) {
Aurelien Jacobs4c509fe2011-05-23 23:09:242700 MatroskaTrackPlane *planes = track->operation.combine_planes.elem;
Aaron Colwellfebfb492015-12-02 23:13:182701 int display_width_mul = 1;
Aaron Colwellec83efd2015-11-23 20:06:142702 int display_height_mul = 1;
Aurelien Jacobs4c509fe2011-05-23 23:09:242703
Anton Khirnov92005142014-06-18 18:42:522704 st->codecpar->codec_type = AVMEDIA_TYPE_VIDEO;
Derek Buitenhuis6f69f7a2016-04-10 19:58:152705 st->codecpar->codec_tag = fourcc;
Carl Eugen Hoyos96fc2902014-02-25 23:02:512706 if (bit_depth >= 0)
Derek Buitenhuis6f69f7a2016-04-10 19:58:152707 st->codecpar->bits_per_coded_sample = bit_depth;
Anton Khirnov92005142014-06-18 18:42:522708 st->codecpar->width = track->video.pixel_width;
2709 st->codecpar->height = track->video.pixel_height;
Aaron Colwellec83efd2015-11-23 20:06:142710
Luca Barbato5f022662016-03-28 18:29:542711 if (track->video.interlaced == MATROSKA_VIDEO_INTERLACE_FLAG_INTERLACED)
James Almer1273bc62016-10-13 17:22:072712 st->codecpar->field_order = mkv_field_order(matroska, track->video.field_order);
James Almer29b6c2b2016-09-27 17:48:332713 else if (track->video.interlaced == MATROSKA_VIDEO_INTERLACE_FLAG_PROGRESSIVE)
2714 st->codecpar->field_order = AV_FIELD_PROGRESSIVE;
Luca Barbato5f022662016-03-28 18:29:542715
Aaron Colwellec83efd2015-11-23 20:06:142716 if (track->video.stereo_mode && track->video.stereo_mode < MATROSKA_VIDEO_STEREOMODE_TYPE_NB)
2717 mkv_stereo_mode_display_mul(track->video.stereo_mode, &display_width_mul, &display_height_mul);
2718
James Almer8b59ce02016-10-16 13:13:452719 if (track->video.display_unit < MATROSKA_VIDEO_DISPLAYUNIT_UNKNOWN) {
James Almerbad8bbc2016-10-15 21:01:502720 av_reduce(&st->sample_aspect_ratio.num,
2721 &st->sample_aspect_ratio.den,
2722 st->codecpar->height * track->video.display_width * display_width_mul,
2723 st->codecpar->width * track->video.display_height * display_height_mul,
2724 255);
2725 }
Derek Buitenhuis6f69f7a2016-04-10 19:58:152726 if (st->codecpar->codec_id != AV_CODEC_ID_HEVC)
Yusuke Nakamura16b68392013-10-12 09:55:462727 st->need_parsing = AVSTREAM_PARSE_HEADERS;
Michael Niedermayer0fbeeb92013-11-01 16:57:572728
Luca Barbatoac97d472012-04-17 23:32:072729 if (track->default_duration) {
Anton Khirnovaba232c2012-06-26 11:10:012730 av_reduce(&st->avg_frame_rate.num, &st->avg_frame_rate.den,
Luca Barbatoac97d472012-04-17 23:32:072731 1000000000, track->default_duration, 30000);
Anton Khirnovaba232c2012-06-26 11:10:012732#if FF_API_R_FRAME_RATE
Michael Niedermayerfc3cdb02015-02-01 18:34:522733 if ( st->avg_frame_rate.num < st->avg_frame_rate.den * 1000LL
2734 && st->avg_frame_rate.num > st->avg_frame_rate.den * 5LL)
Michael Niedermayer6853e402013-10-05 22:07:282735 st->r_frame_rate = st->avg_frame_rate;
Anton Khirnovaba232c2012-06-26 11:10:012736#endif
Luca Barbatoac97d472012-04-17 23:32:072737 }
Kirill Gavrilove6ec9212011-05-21 15:14:142738
Aurelien Jacobs4c509fe2011-05-23 23:09:242739 /* export stereo mode flag as metadata tag */
Michael Niedermayer37520a92014-08-28 23:26:522740 if (track->video.stereo_mode && track->video.stereo_mode < MATROSKA_VIDEO_STEREOMODE_TYPE_NB)
Clément Bœschca81e3b2012-09-16 00:58:402741 av_dict_set(&st->metadata, "stereo_mode", ff_matroska_video_stereo_mode[track->video.stereo_mode], 0);
Kirill Gavrilove6ec9212011-05-21 15:14:142742
Vignesh Venkatasubramaniance6a8e52013-02-04 23:17:522743 /* export alpha mode flag as metadata tag */
2744 if (track->video.alpha_mode)
2745 av_dict_set(&st->metadata, "alpha_mode", "1", 0);
2746
Aurelien Jacobs4c509fe2011-05-23 23:09:242747 /* if we have virtual track, mark the real tracks */
2748 for (j=0; j < track->operation.combine_planes.nb_elem; j++) {
2749 char buf[32];
Aurelien Jacobsb44bbf92011-05-24 21:26:242750 if (planes[j].type >= MATROSKA_VIDEO_STEREO_PLANE_COUNT)
Aurelien Jacobs4c509fe2011-05-23 23:09:242751 continue;
2752 snprintf(buf, sizeof(buf), "%s_%d",
Clément Bœschca81e3b2012-09-16 00:58:402753 ff_matroska_video_stereo_plane[planes[j].type], i);
Aurelien Jacobs4c509fe2011-05-23 23:09:242754 for (k=0; k < matroska->tracks.nb_elem; k++)
Michael Niedermayer5d309d32015-05-04 13:47:542755 if (planes[j].uid == tracks[k].uid && tracks[k].stream) {
2756 av_dict_set(&tracks[k].stream->metadata,
Aurelien Jacobse6ba3d42011-06-13 17:02:502757 "stereo_mode", buf, 0);
Kirill Gavrilove6ec9212011-05-21 15:14:142758 break;
2759 }
Kirill Gavrilove6ec9212011-05-21 15:14:142760 }
Vittorio Giovarad4ae8ac2014-08-12 21:28:492761 // add stream level stereo3d side data if it is a supported format
2762 if (track->video.stereo_mode < MATROSKA_VIDEO_STEREOMODE_TYPE_NB &&
2763 track->video.stereo_mode != 10 && track->video.stereo_mode != 12) {
2764 int ret = ff_mkv_stereo3d_conv(st, track->video.stereo_mode);
2765 if (ret < 0)
2766 return ret;
2767 }
Neil Birkbeckbbda13a2016-03-01 00:41:042768
James Almeredb4f5d2016-12-05 02:27:542769 ret = mkv_parse_video_color(st, track);
2770 if (ret < 0)
2771 return ret;
James Almer445204c2016-12-06 17:48:452772 ret = mkv_parse_video_projection(st, track);
2773 if (ret < 0)
2774 return ret;
Aurelien Jacobsd88d8062008-08-05 00:40:522775 } else if (track->type == MATROSKA_TRACK_TYPE_AUDIO) {
Anton Khirnov92005142014-06-18 18:42:522776 st->codecpar->codec_type = AVMEDIA_TYPE_AUDIO;
Derek Buitenhuis6f69f7a2016-04-10 19:58:152777 st->codecpar->codec_tag = fourcc;
Anton Khirnov92005142014-06-18 18:42:522778 st->codecpar->sample_rate = track->audio.out_samplerate;
2779 st->codecpar->channels = track->audio.channels;
Derek Buitenhuis6f69f7a2016-04-10 19:58:152780 if (!st->codecpar->bits_per_coded_sample)
2781 st->codecpar->bits_per_coded_sample = track->audio.bitdepth;
James Almer63b5d042018-01-30 01:59:522782 if (st->codecpar->codec_id == AV_CODEC_ID_MP3 ||
2783 st->codecpar->codec_id == AV_CODEC_ID_MLP ||
2784 st->codecpar->codec_id == AV_CODEC_ID_TRUEHD)
Rodger Combsb4b27172015-08-16 08:06:042785 st->need_parsing = AVSTREAM_PARSE_FULL;
Derek Buitenhuis6f69f7a2016-04-10 19:58:152786 else if (st->codecpar->codec_id != AV_CODEC_ID_AAC)
Keiji Costantini84cfce92014-03-01 16:28:152787 st->need_parsing = AVSTREAM_PARSE_HEADERS;
Vignesh Venkatasubramaniand6f86d72013-10-14 17:42:082788 if (track->codec_delay > 0) {
Derek Buitenhuis6f69f7a2016-04-10 19:58:152789 st->codecpar->initial_padding = av_rescale_q(track->codec_delay,
Michael Niedermayerb5bc4362016-06-06 02:23:162790 (AVRational){1, 1000000000},
James Almer49b02462016-06-06 04:14:112791 (AVRational){1, st->codecpar->codec_id == AV_CODEC_ID_OPUS ?
2792 48000 : st->codecpar->sample_rate});
Vignesh Venkatasubramaniand6f86d72013-10-14 17:42:082793 }
2794 if (track->seek_preroll > 0) {
Derek Buitenhuis6f69f7a2016-04-10 19:58:152795 st->codecpar->seek_preroll = av_rescale_q(track->seek_preroll,
2796 (AVRational){1, 1000000000},
2797 (AVRational){1, st->codecpar->sample_rate});
Vignesh Venkatasubramaniand6f86d72013-10-14 17:42:082798 }
Matthew Heaney818ebe92013-08-08 22:40:032799 } else if (codec_id == AV_CODEC_ID_WEBVTT) {
Derek Buitenhuis6f69f7a2016-04-10 19:58:152800 st->codecpar->codec_type = AVMEDIA_TYPE_SUBTITLE;
Matthew Heaney818ebe92013-08-08 22:40:032801
2802 if (!strcmp(track->codec_id, "D_WEBVTT/CAPTIONS")) {
2803 st->disposition |= AV_DISPOSITION_CAPTIONS;
2804 } else if (!strcmp(track->codec_id, "D_WEBVTT/DESCRIPTIONS")) {
2805 st->disposition |= AV_DISPOSITION_DESCRIPTIONS;
2806 } else if (!strcmp(track->codec_id, "D_WEBVTT/METADATA")) {
2807 st->disposition |= AV_DISPOSITION_METADATA;
2808 }
Aurelien Jacobsd88d8062008-08-05 00:40:522809 } else if (track->type == MATROSKA_TRACK_TYPE_SUBTITLE) {
Anton Khirnov92005142014-06-18 18:42:522810 st->codecpar->codec_type = AVMEDIA_TYPE_SUBTITLE;
Aurelien Jacobsd88d8062008-08-05 00:40:522811 }
David Conradb061d892007-06-04 22:10:542812 }
2813
Anton Khirnov6df478b2014-05-25 07:07:322814 return 0;
2815}
2816
2817static int matroska_read_header(AVFormatContext *s)
2818{
2819 MatroskaDemuxContext *matroska = s->priv_data;
2820 EbmlList *attachments_list = &matroska->attachments;
2821 EbmlList *chapters_list = &matroska->chapters;
2822 MatroskaAttachment *attachments;
2823 MatroskaChapter *chapters;
2824 uint64_t max_start = 0;
2825 int64_t pos;
2826 Ebml ebml = { 0 };
2827 int i, j, res;
2828
2829 matroska->ctx = s;
wm4cac22952015-02-09 19:39:002830 matroska->cues_parsing_deferred = 1;
Anton Khirnov6df478b2014-05-25 07:07:322831
2832 /* First read the EBML header. */
Thomas Guillemb8d7f312015-04-10 17:04:512833 if (ebml_parse(matroska, ebml_syntax, &ebml) || !ebml.doctype) {
2834 av_log(matroska->ctx, AV_LOG_ERROR, "EBML header parsing failed\n");
2835 ebml_free(ebml_syntax, &ebml);
2836 return AVERROR_INVALIDDATA;
2837 }
2838 if (ebml.version > EBML_VERSION ||
Anton Khirnov6df478b2014-05-25 07:07:322839 ebml.max_size > sizeof(uint64_t) ||
2840 ebml.id_length > sizeof(uint32_t) ||
Michael Niedermayer0cab0932015-04-19 14:45:242841 ebml.doctype_version > 3) {
Diego Biurrun67deba82015-12-16 17:01:342842 avpriv_report_missing_feature(matroska->ctx,
2843 "EBML version %"PRIu64", doctype %s, doc version %"PRIu64,
2844 ebml.version, ebml.doctype, ebml.doctype_version);
Anton Khirnov6df478b2014-05-25 07:07:322845 ebml_free(ebml_syntax, &ebml);
2846 return AVERROR_PATCHWELCOME;
Michael Niedermayer69de2292014-05-28 10:41:352847 } else if (ebml.doctype_version == 3) {
2848 av_log(matroska->ctx, AV_LOG_WARNING,
2849 "EBML header using unsupported features\n"
2850 "(EBML version %"PRIu64", doctype %s, doc version %"PRIu64")\n",
2851 ebml.version, ebml.doctype, ebml.doctype_version);
Anton Khirnov6df478b2014-05-25 07:07:322852 }
2853 for (i = 0; i < FF_ARRAY_ELEMS(matroska_doctypes); i++)
2854 if (!strcmp(ebml.doctype, matroska_doctypes[i]))
2855 break;
2856 if (i >= FF_ARRAY_ELEMS(matroska_doctypes)) {
2857 av_log(s, AV_LOG_WARNING, "Unknown EBML doctype '%s'\n", ebml.doctype);
2858 if (matroska->ctx->error_recognition & AV_EF_EXPLODE) {
2859 ebml_free(ebml_syntax, &ebml);
2860 return AVERROR_INVALIDDATA;
2861 }
2862 }
2863 ebml_free(ebml_syntax, &ebml);
2864
2865 /* The next thing is a segment. */
2866 pos = avio_tell(matroska->ctx->pb);
2867 res = ebml_parse(matroska, matroska_segments, matroska);
Andreas Rheinhardt60f75c92019-05-16 22:30:132868 // Try resyncing until we find an EBML_STOP type element.
Anton Khirnov6df478b2014-05-25 07:07:322869 while (res != 1) {
2870 res = matroska_resync(matroska, pos);
2871 if (res < 0)
Michael Niedermayerf573acc2016-06-24 16:26:462872 goto fail;
Anton Khirnov6df478b2014-05-25 07:07:322873 pos = avio_tell(matroska->ctx->pb);
2874 res = ebml_parse(matroska, matroska_segment, matroska);
2875 }
Andreas Rheinhardt43c3ceb2019-05-16 22:29:512876 /* Set data_offset as it might be needed later by seek_frame_generic. */
2877 if (matroska->current_id == MATROSKA_ID_CLUSTER)
2878 s->internal->data_offset = avio_tell(matroska->ctx->pb) - 4;
Anton Khirnov6df478b2014-05-25 07:07:322879 matroska_execute_seekhead(matroska);
2880
2881 if (!matroska->time_scale)
2882 matroska->time_scale = 1000000;
2883 if (matroska->duration)
2884 matroska->ctx->duration = matroska->duration * matroska->time_scale *
2885 1000 / AV_TIME_BASE;
2886 av_dict_set(&s->metadata, "title", matroska->title, 0);
Michael Niedermayer69de2292014-05-28 10:41:352887 av_dict_set(&s->metadata, "encoder", matroska->muxingapp, 0);
2888
2889 if (matroska->date_utc.size == 8)
2890 matroska_metadata_creation_time(&s->metadata, AV_RB64(matroska->date_utc.data));
Anton Khirnov6df478b2014-05-25 07:07:322891
2892 res = matroska_parse_tracks(s);
2893 if (res < 0)
Michael Niedermayerf573acc2016-06-24 16:26:462894 goto fail;
Anton Khirnov6df478b2014-05-25 07:07:322895
Diego Biurrunf69befe2014-03-07 12:54:182896 attachments = attachments_list->elem;
2897 for (j = 0; j < attachments_list->nb_elem; j++) {
2898 if (!(attachments[j].filename && attachments[j].mime &&
2899 attachments[j].bin.data && attachments[j].bin.size > 0)) {
Aurelien Jacobs9c25baf2008-08-05 00:40:552900 av_log(matroska->ctx, AV_LOG_ERROR, "incomplete attachment\n");
2901 } else {
Anton Khirnov3b3bbdd2011-06-18 09:43:242902 AVStream *st = avformat_new_stream(s, NULL);
Gabriel Dumef929ab02014-08-14 20:31:242903 if (!st)
Aurelien Jacobs9c25baf2008-08-05 00:40:552904 break;
Diego Biurrunf69befe2014-03-07 12:54:182905 av_dict_set(&st->metadata, "filename", attachments[j].filename, 0);
2906 av_dict_set(&st->metadata, "mimetype", attachments[j].mime, 0);
Anton Khirnov92005142014-06-18 18:42:522907 st->codecpar->codec_id = AV_CODEC_ID_NONE;
Aurelien Jacobs9c25baf2008-08-05 00:40:552908
Andreas Rheinhardt67e957b2020-04-16 01:39:052909 for (i = 0; mkv_image_mime_tags[i].id != AV_CODEC_ID_NONE; i++) {
2910 if (!strncmp(mkv_image_mime_tags[i].str, attachments[j].mime,
2911 strlen(mkv_image_mime_tags[i].str))) {
2912 st->codecpar->codec_id = mkv_image_mime_tags[i].id;
Aurelien Jacobs9c25baf2008-08-05 00:40:552913 break;
2914 }
2915 }
wm4511585c2015-04-03 14:11:532916
Diego Biurrunf69befe2014-03-07 12:54:182917 attachments[j].stream = st;
wm4c4d37cd2015-04-03 14:11:532918
Anton Khirnov92005142014-06-18 18:42:522919 if (st->codecpar->codec_id != AV_CODEC_ID_NONE) {
Andreas Rheinhardt07d40562019-05-16 22:29:522920 AVPacket *pkt = &st->attached_pic;
2921
Anton Khirnov92005142014-06-18 18:42:522922 st->disposition |= AV_DISPOSITION_ATTACHED_PIC;
2923 st->codecpar->codec_type = AVMEDIA_TYPE_VIDEO;
wm4511585c2015-04-03 14:11:532924
Andreas Rheinhardt07d40562019-05-16 22:29:522925 av_init_packet(pkt);
2926 pkt->buf = av_buffer_ref(attachments[j].bin.buf);
2927 if (!pkt->buf)
2928 return AVERROR(ENOMEM);
2929 pkt->data = attachments[j].bin.data;
2930 pkt->size = attachments[j].bin.size;
2931 pkt->stream_index = st->index;
2932 pkt->flags |= AV_PKT_FLAG_KEY;
wm4511585c2015-04-03 14:11:532933 } else {
Anton Khirnov92005142014-06-18 18:42:522934 st->codecpar->codec_type = AVMEDIA_TYPE_ATTACHMENT;
Derek Buitenhuis6f69f7a2016-04-10 19:58:152935 if (ff_alloc_extradata(st->codecpar, attachments[j].bin.size))
wm4511585c2015-04-03 14:11:532936 break;
Anton Khirnov92005142014-06-18 18:42:522937 memcpy(st->codecpar->extradata, attachments[j].bin.data,
wm4c4d37cd2015-04-03 14:11:532938 attachments[j].bin.size);
wm4511585c2015-04-03 14:11:532939
Andreas Rheinhardt67e957b2020-04-16 01:39:052940 for (i = 0; mkv_mime_tags[i].id != AV_CODEC_ID_NONE; i++) {
2941 if (!strncmp(mkv_mime_tags[i].str, attachments[j].mime,
2942 strlen(mkv_mime_tags[i].str))) {
2943 st->codecpar->codec_id = mkv_mime_tags[i].id;
wm4511585c2015-04-03 14:11:532944 break;
2945 }
2946 }
wm4511585c2015-04-03 14:11:532947 }
Aurelien Jacobs9c25baf2008-08-05 00:40:552948 }
2949 }
2950
2951 chapters = chapters_list->elem;
Keiji Costantini84cfce92014-03-01 16:28:152952 for (i = 0; i < chapters_list->nb_elem; i++)
2953 if (chapters[i].start != AV_NOPTS_VALUE && chapters[i].uid &&
2954 (max_start == 0 || chapters[i].start > max_start)) {
Aurelien Jacobs6cb6e152009-02-15 15:25:142955 chapters[i].chapter =
Keiji Costantini84cfce92014-03-01 16:28:152956 avpriv_new_chapter(s, chapters[i].uid,
2957 (AVRational) { 1, 1000000000 },
2958 chapters[i].start, chapters[i].end,
2959 chapters[i].title);
Aurelien Jacobse0e4be52009-01-15 00:42:572960 max_start = chapters[i].start;
2961 }
Aurelien Jacobs9c25baf2008-08-05 00:40:552962
Aaron Colwell6c4cc0f2011-09-22 14:51:002963 matroska_add_index_entries(matroska);
2964
Aurelien Jacobs929e9de2009-02-15 15:53:552965 matroska_convert_tags(s);
2966
Aurelien Jacobsce6f28b2008-08-05 00:40:582967 return 0;
Michael Niedermayerf573acc2016-06-24 16:26:462968fail:
2969 matroska_read_close(s);
2970 return res;
David Conradb061d892007-06-04 22:10:542971}
2972
Aurelien Jacobs737c40d2008-08-05 00:42:392973/*
Aurelien Jacobs737c40d2008-08-05 00:42:392974 * Put one packet in an application-supplied AVPacket struct.
2975 * Returns 0 on success or -1 on failure.
2976 */
2977static int matroska_deliver_packet(MatroskaDemuxContext *matroska,
2978 AVPacket *pkt)
2979{
James Almer78b96be2018-03-26 18:02:372980 if (matroska->queue) {
Mats Peterson6aac43f2016-02-24 17:14:052981 MatroskaTrack *tracks = matroska->tracks.elem;
2982 MatroskaTrack *track;
James Almer78b96be2018-03-26 18:02:372983
2984 ff_packet_list_get(&matroska->queue, &matroska->queue_end, pkt);
Mats Peterson6aac43f2016-02-24 17:14:052985 track = &tracks[pkt->stream_index];
2986 if (track->has_palette) {
Mats Peterson79736032015-12-27 20:28:092987 uint8_t *pal = av_packet_new_side_data(pkt, AV_PKT_DATA_PALETTE, AVPALETTE_SIZE);
2988 if (!pal) {
2989 av_log(matroska->ctx, AV_LOG_ERROR, "Cannot append palette to packet\n");
2990 } else {
Mats Peterson6aac43f2016-02-24 17:14:052991 memcpy(pal, track->palette, AVPALETTE_SIZE);
Mats Peterson79736032015-12-27 20:28:092992 }
Mats Peterson6aac43f2016-02-24 17:14:052993 track->has_palette = 0;
Mats Peterson79736032015-12-27 20:28:092994 }
Aurelien Jacobs737c40d2008-08-05 00:42:392995 return 0;
2996 }
2997
2998 return -1;
2999}
3000
3001/*
3002 * Free all packets in our internal queue.
3003 */
3004static void matroska_clear_queue(MatroskaDemuxContext *matroska)
3005{
James Almer78b96be2018-03-26 18:02:373006 ff_packet_list_free(&matroska->queue, &matroska->queue_end);
Aurelien Jacobs737c40d2008-08-05 00:42:393007}
3008
Luca Barbato2d0e7712012-09-16 23:58:323009static int matroska_parse_laces(MatroskaDemuxContext *matroska, uint8_t **buf,
Andreas Rheinhardtd5274f82019-12-03 17:09:103010 int size, int type, AVIOContext *pb,
Andreas Rheinhardt9ad1a6d2019-12-03 17:09:063011 uint32_t lace_size[256], int *laces)
Luca Barbato2d0e7712012-09-16 23:58:323012{
Andreas Rheinhardtf74eaa12019-12-03 17:09:083013 int n;
Luca Barbato2d0e7712012-09-16 23:58:323014 uint8_t *data = *buf;
Luca Barbato2d0e7712012-09-16 23:58:323015
3016 if (!type) {
Keiji Costantini84cfce92014-03-01 16:28:153017 *laces = 1;
Andreas Rheinhardt9ad1a6d2019-12-03 17:09:063018 lace_size[0] = size;
Luca Barbato2d0e7712012-09-16 23:58:323019 return 0;
3020 }
3021
Michael Niedermayer8c51ea52012-09-20 18:37:263022 av_assert0(size > 0);
Keiji Costantini84cfce92014-03-01 16:28:153023 *laces = *data + 1;
3024 data += 1;
3025 size -= 1;
Luca Barbato2d0e7712012-09-16 23:58:323026
3027 switch (type) {
Keiji Costantini84cfce92014-03-01 16:28:153028 case 0x1: /* Xiph lacing */
3029 {
Luca Barbato2d0e7712012-09-16 23:58:323030 uint8_t temp;
3031 uint32_t total = 0;
Andreas Rheinhardta69f92a2019-12-03 17:09:073032 for (n = 0; n < *laces - 1; n++) {
Andreas Rheinhardt1215b3a2019-05-16 22:29:483033 lace_size[n] = 0;
3034
Luca Barbato2d0e7712012-09-16 23:58:323035 while (1) {
Michael Niedermayer115c3bc2013-04-04 13:17:573036 if (size <= total) {
Andreas Rheinhardta69f92a2019-12-03 17:09:073037 return AVERROR_INVALIDDATA;
Luca Barbato2d0e7712012-09-16 23:58:323038 }
Keiji Costantini84cfce92014-03-01 16:28:153039 temp = *data;
Michael Niedermayerb3d9ab12014-03-07 22:46:373040 total += temp;
Luca Barbato2d0e7712012-09-16 23:58:323041 lace_size[n] += temp;
Keiji Costantini84cfce92014-03-01 16:28:153042 data += 1;
3043 size -= 1;
Luca Barbato2d0e7712012-09-16 23:58:323044 if (temp != 0xff)
3045 break;
3046 }
Luca Barbato2d0e7712012-09-16 23:58:323047 }
3048 if (size <= total) {
Andreas Rheinhardta69f92a2019-12-03 17:09:073049 return AVERROR_INVALIDDATA;
Luca Barbato2d0e7712012-09-16 23:58:323050 }
3051
3052 lace_size[n] = size - total;
3053 break;
3054 }
3055
3056 case 0x2: /* fixed-size lacing */
Anton Khirnov87b017a2012-09-20 18:04:563057 if (size % (*laces)) {
Andreas Rheinhardta69f92a2019-12-03 17:09:073058 return AVERROR_INVALIDDATA;
Luca Barbato2d0e7712012-09-16 23:58:323059 }
3060 for (n = 0; n < *laces; n++)
3061 lace_size[n] = size / *laces;
3062 break;
3063
Keiji Costantini84cfce92014-03-01 16:28:153064 case 0x3: /* EBML lacing */
3065 {
Luca Barbato2d0e7712012-09-16 23:58:323066 uint64_t num;
Luca Barbato8a96df72013-03-28 10:52:523067 uint64_t total;
Andreas Rheinhardtd5274f82019-12-03 17:09:103068 int offset;
3069
3070 avio_skip(pb, 4);
3071
3072 n = ebml_read_num(matroska, pb, 8, &num, 1);
Andreas Rheinhardtdbe3be62019-12-03 17:09:093073 if (n < 0)
3074 return n;
3075 if (num > INT_MAX)
3076 return AVERROR_INVALIDDATA;
Andreas Rheinhardtd5274f82019-12-03 17:09:103077
Luca Barbato2d0e7712012-09-16 23:58:323078 total = lace_size[0] = num;
Andreas Rheinhardtd5274f82019-12-03 17:09:103079 offset = n;
Andreas Rheinhardta69f92a2019-12-03 17:09:073080 for (n = 1; n < *laces - 1; n++) {
Luca Barbato2d0e7712012-09-16 23:58:323081 int64_t snum;
3082 int r;
Andreas Rheinhardtd5274f82019-12-03 17:09:103083 r = matroska_ebmlnum_sint(matroska, pb, &snum);
Andreas Rheinhardtdbe3be62019-12-03 17:09:093084 if (r < 0)
3085 return r;
3086 if (lace_size[n - 1] + snum > (uint64_t)INT_MAX)
3087 return AVERROR_INVALIDDATA;
Andreas Rheinhardtd5274f82019-12-03 17:09:103088
Luca Barbato2d0e7712012-09-16 23:58:323089 lace_size[n] = lace_size[n - 1] + snum;
Keiji Costantini84cfce92014-03-01 16:28:153090 total += lace_size[n];
Andreas Rheinhardtd5274f82019-12-03 17:09:103091 offset += r;
Luca Barbato2d0e7712012-09-16 23:58:323092 }
Andreas Rheinhardtd5274f82019-12-03 17:09:103093 data += offset;
3094 size -= offset;
Luca Barbato2d0e7712012-09-16 23:58:323095 if (size <= total) {
Andreas Rheinhardta69f92a2019-12-03 17:09:073096 return AVERROR_INVALIDDATA;
Luca Barbato2d0e7712012-09-16 23:58:323097 }
3098 lace_size[*laces - 1] = size - total;
3099 break;
3100 }
3101 }
3102
3103 *buf = data;
Luca Barbato2d0e7712012-09-16 23:58:323104
Andreas Rheinhardta69f92a2019-12-03 17:09:073105 return 0;
Luca Barbato2d0e7712012-09-16 23:58:323106}
3107
Luca Barbatoc831ebf2012-09-16 23:28:133108static int matroska_parse_rm_audio(MatroskaDemuxContext *matroska,
Keiji Costantini84cfce92014-03-01 16:28:153109 MatroskaTrack *track, AVStream *st,
3110 uint8_t *data, int size, uint64_t timecode,
Luca Barbatoc831ebf2012-09-16 23:28:133111 int64_t pos)
3112{
Anton Khirnov92005142014-06-18 18:42:523113 int a = st->codecpar->block_align;
Luca Barbatoc831ebf2012-09-16 23:28:133114 int sps = track->audio.sub_packet_size;
3115 int cfs = track->audio.coded_framesize;
Keiji Costantini84cfce92014-03-01 16:28:153116 int h = track->audio.sub_packet_h;
3117 int y = track->audio.sub_packet_cnt;
3118 int w = track->audio.frame_size;
Luca Barbatoc831ebf2012-09-16 23:28:133119 int x;
3120
3121 if (!track->audio.pkt_cnt) {
3122 if (track->audio.sub_packet_cnt == 0)
3123 track->audio.buf_timecode = timecode;
Anton Khirnov92005142014-06-18 18:42:523124 if (st->codecpar->codec_id == AV_CODEC_ID_RA_288) {
Luca Barbatoc831ebf2012-09-16 23:28:133125 if (size < cfs * h / 2) {
3126 av_log(matroska->ctx, AV_LOG_ERROR,
3127 "Corrupt int4 RM-style audio packet size\n");
3128 return AVERROR_INVALIDDATA;
3129 }
Keiji Costantini84cfce92014-03-01 16:28:153130 for (x = 0; x < h / 2; x++)
3131 memcpy(track->audio.buf + x * 2 * w + y * cfs,
3132 data + x * cfs, cfs);
Anton Khirnov92005142014-06-18 18:42:523133 } else if (st->codecpar->codec_id == AV_CODEC_ID_SIPR) {
Luca Barbatoc831ebf2012-09-16 23:28:133134 if (size < w) {
3135 av_log(matroska->ctx, AV_LOG_ERROR,
3136 "Corrupt sipr RM-style audio packet size\n");
3137 return AVERROR_INVALIDDATA;
3138 }
Keiji Costantini84cfce92014-03-01 16:28:153139 memcpy(track->audio.buf + y * w, data, w);
Luca Barbatoc831ebf2012-09-16 23:28:133140 } else {
Michael Niedermayera1ed1c22014-01-10 22:10:473141 if (size < sps * w / sps || h<=0 || w%sps) {
Luca Barbatoc831ebf2012-09-16 23:28:133142 av_log(matroska->ctx, AV_LOG_ERROR,
3143 "Corrupt generic RM-style audio packet size\n");
3144 return AVERROR_INVALIDDATA;
3145 }
Keiji Costantini84cfce92014-03-01 16:28:153146 for (x = 0; x < w / sps; x++)
3147 memcpy(track->audio.buf +
3148 sps * (h * x + ((h + 1) / 2) * (y & 1) + (y >> 1)),
3149 data + x * sps, sps);
Luca Barbatoc831ebf2012-09-16 23:28:133150 }
3151
3152 if (++track->audio.sub_packet_cnt >= h) {
Anton Khirnov92005142014-06-18 18:42:523153 if (st->codecpar->codec_id == AV_CODEC_ID_SIPR)
Luca Barbatoc831ebf2012-09-16 23:28:133154 ff_rm_reorder_sipr_data(track->audio.buf, h, w);
3155 track->audio.sub_packet_cnt = 0;
Keiji Costantini84cfce92014-03-01 16:28:153156 track->audio.pkt_cnt = h * w / a;
Luca Barbatoc831ebf2012-09-16 23:28:133157 }
3158 }
3159
3160 while (track->audio.pkt_cnt) {
Vittorio Giovarae0caa1e2014-10-23 23:05:533161 int ret;
James Almer4f55b942018-04-04 16:53:123162 AVPacket pktl, *pkt = &pktl;
Vittorio Giovarae0caa1e2014-10-23 23:05:533163
3164 ret = av_new_packet(pkt, a);
3165 if (ret < 0) {
Vittorio Giovarae0caa1e2014-10-23 23:05:533166 return ret;
Michael Niedermayer11164912012-10-20 14:55:453167 }
Keiji Costantini84cfce92014-03-01 16:28:153168 memcpy(pkt->data,
3169 track->audio.buf + a * (h * w / a - track->audio.pkt_cnt--),
3170 a);
3171 pkt->pts = track->audio.buf_timecode;
Luca Barbatoc831ebf2012-09-16 23:28:133172 track->audio.buf_timecode = AV_NOPTS_VALUE;
Keiji Costantini84cfce92014-03-01 16:28:153173 pkt->pos = pos;
3174 pkt->stream_index = st->index;
James Almer78b96be2018-03-26 18:02:373175 ret = ff_packet_list_put(&matroska->queue, &matroska->queue_end, pkt, 0);
3176 if (ret < 0) {
James Almer4f55b942018-04-04 16:53:123177 av_packet_unref(pkt);
James Almer78b96be2018-03-26 18:02:373178 return AVERROR(ENOMEM);
3179 }
Luca Barbatoc831ebf2012-09-16 23:28:133180 }
3181
3182 return 0;
3183}
Anton Khirnov9b6f47c2013-05-27 07:44:273184
3185/* reconstruct full wavpack blocks from mangled matroska ones */
3186static int matroska_parse_wavpack(MatroskaTrack *track, uint8_t *src,
3187 uint8_t **pdst, int *size)
3188{
3189 uint8_t *dst = NULL;
3190 int dstlen = 0;
3191 int srclen = *size;
3192 uint32_t samples;
3193 uint16_t ver;
3194 int ret, offset = 0;
3195
Andreas Rheinhardt048bc3f2019-12-14 00:36:543196 if (srclen < 12)
Anton Khirnov9b6f47c2013-05-27 07:44:273197 return AVERROR_INVALIDDATA;
3198
Andreas Rheinhardt048bc3f2019-12-14 00:36:543199 av_assert1(track->stream->codecpar->extradata_size >= 2);
Anton Khirnov92005142014-06-18 18:42:523200 ver = AV_RL16(track->stream->codecpar->extradata);
Anton Khirnov9b6f47c2013-05-27 07:44:273201
3202 samples = AV_RL32(src);
3203 src += 4;
3204 srclen -= 4;
3205
3206 while (srclen >= 8) {
3207 int multiblock;
3208 uint32_t blocksize;
3209 uint8_t *tmp;
3210
3211 uint32_t flags = AV_RL32(src);
3212 uint32_t crc = AV_RL32(src + 4);
3213 src += 8;
3214 srclen -= 8;
3215
3216 multiblock = (flags & 0x1800) != 0x1800;
3217 if (multiblock) {
3218 if (srclen < 4) {
3219 ret = AVERROR_INVALIDDATA;
3220 goto fail;
3221 }
3222 blocksize = AV_RL32(src);
Keiji Costantini84cfce92014-03-01 16:28:153223 src += 4;
3224 srclen -= 4;
Anton Khirnov9b6f47c2013-05-27 07:44:273225 } else
3226 blocksize = srclen;
3227
3228 if (blocksize > srclen) {
3229 ret = AVERROR_INVALIDDATA;
3230 goto fail;
3231 }
3232
James Almer9703b7d2018-04-04 21:12:533233 tmp = av_realloc(dst, dstlen + blocksize + 32 + AV_INPUT_BUFFER_PADDING_SIZE);
Anton Khirnov9b6f47c2013-05-27 07:44:273234 if (!tmp) {
3235 ret = AVERROR(ENOMEM);
3236 goto fail;
3237 }
3238 dst = tmp;
3239 dstlen += blocksize + 32;
3240
Keiji Costantini84cfce92014-03-01 16:28:153241 AV_WL32(dst + offset, MKTAG('w', 'v', 'p', 'k')); // tag
3242 AV_WL32(dst + offset + 4, blocksize + 24); // blocksize - 8
3243 AV_WL16(dst + offset + 8, ver); // version
3244 AV_WL16(dst + offset + 10, 0); // track/index_no
3245 AV_WL32(dst + offset + 12, 0); // total samples
3246 AV_WL32(dst + offset + 16, 0); // block index
3247 AV_WL32(dst + offset + 20, samples); // number of samples
3248 AV_WL32(dst + offset + 24, flags); // flags
3249 AV_WL32(dst + offset + 28, crc); // crc
3250 memcpy(dst + offset + 32, src, blocksize); // block data
Anton Khirnov9b6f47c2013-05-27 07:44:273251
3252 src += blocksize;
3253 srclen -= blocksize;
3254 offset += blocksize + 32;
3255 }
3256
James Almer9703b7d2018-04-04 21:12:533257 memset(dst + dstlen, 0, AV_INPUT_BUFFER_PADDING_SIZE);
3258
Anton Khirnov9b6f47c2013-05-27 07:44:273259 *pdst = dst;
3260 *size = dstlen;
3261
3262 return 0;
3263
3264fail:
3265 av_freep(&dst);
3266 return ret;
3267}
3268
James Almerb8e75a22018-04-04 19:07:363269static int matroska_parse_prores(MatroskaTrack *track, uint8_t *src,
3270 uint8_t **pdst, int *size)
3271{
Andreas Rheinhardtaf50f0a2019-12-06 23:16:193272 uint8_t *dst;
3273 int dstlen = *size + 8;
Andreas Rheinhardt581419e2019-09-28 17:54:253274
3275 dst = av_malloc(dstlen + AV_INPUT_BUFFER_PADDING_SIZE);
James Almerb8e75a22018-04-04 19:07:363276 if (!dst)
3277 return AVERROR(ENOMEM);
3278
3279 AV_WB32(dst, dstlen);
3280 AV_WB32(dst + 4, MKBETAG('i', 'c', 'p', 'f'));
Andreas Rheinhardt581419e2019-09-28 17:54:253281 memcpy(dst + 8, src, dstlen - 8);
3282 memset(dst + dstlen, 0, AV_INPUT_BUFFER_PADDING_SIZE);
James Almerb8e75a22018-04-04 19:07:363283
3284 *pdst = dst;
3285 *size = dstlen;
3286
3287 return 0;
3288}
3289
Matthew Heaney818ebe92013-08-08 22:40:033290static int matroska_parse_webvtt(MatroskaDemuxContext *matroska,
3291 MatroskaTrack *track,
3292 AVStream *st,
3293 uint8_t *data, int data_len,
3294 uint64_t timecode,
3295 uint64_t duration,
3296 int64_t pos)
3297{
James Almer4f55b942018-04-04 16:53:123298 AVPacket pktl, *pkt = &pktl;
Matthew Heaney818ebe92013-08-08 22:40:033299 uint8_t *id, *settings, *text, *buf;
3300 int id_len, settings_len, text_len;
3301 uint8_t *p, *q;
3302 int err;
3303
3304 if (data_len <= 0)
3305 return AVERROR_INVALIDDATA;
3306
3307 p = data;
3308 q = data + data_len;
3309
3310 id = p;
3311 id_len = -1;
3312 while (p < q) {
3313 if (*p == '\r' || *p == '\n') {
3314 id_len = p - id;
3315 if (*p == '\r')
3316 p++;
3317 break;
3318 }
3319 p++;
3320 }
3321
3322 if (p >= q || *p != '\n')
3323 return AVERROR_INVALIDDATA;
3324 p++;
3325
3326 settings = p;
3327 settings_len = -1;
3328 while (p < q) {
3329 if (*p == '\r' || *p == '\n') {
3330 settings_len = p - settings;
3331 if (*p == '\r')
3332 p++;
3333 break;
3334 }
3335 p++;
3336 }
3337
3338 if (p >= q || *p != '\n')
3339 return AVERROR_INVALIDDATA;
3340 p++;
3341
3342 text = p;
3343 text_len = q - p;
3344 while (text_len > 0) {
3345 const int len = text_len - 1;
3346 const uint8_t c = p[len];
3347 if (c != '\r' && c != '\n')
3348 break;
3349 text_len = len;
3350 }
3351
3352 if (text_len <= 0)
3353 return AVERROR_INVALIDDATA;
3354
Matthew Heaney818ebe92013-08-08 22:40:033355 err = av_new_packet(pkt, text_len);
3356 if (err < 0) {
James Almerf4f39582018-02-20 13:26:213357 return err;
Matthew Heaney818ebe92013-08-08 22:40:033358 }
3359
3360 memcpy(pkt->data, text, text_len);
3361
3362 if (id_len > 0) {
3363 buf = av_packet_new_side_data(pkt,
3364 AV_PKT_DATA_WEBVTT_IDENTIFIER,
3365 id_len);
Michael Niedermayerfb33bff2014-08-15 18:33:213366 if (!buf) {
James Almer88eb3682018-02-20 13:25:543367 av_packet_unref(pkt);
Matthew Heaney818ebe92013-08-08 22:40:033368 return AVERROR(ENOMEM);
3369 }
3370 memcpy(buf, id, id_len);
3371 }
3372
3373 if (settings_len > 0) {
3374 buf = av_packet_new_side_data(pkt,
3375 AV_PKT_DATA_WEBVTT_SETTINGS,
3376 settings_len);
Michael Niedermayerfb33bff2014-08-15 18:33:213377 if (!buf) {
James Almer88eb3682018-02-20 13:25:543378 av_packet_unref(pkt);
Matthew Heaney818ebe92013-08-08 22:40:033379 return AVERROR(ENOMEM);
3380 }
3381 memcpy(buf, settings, settings_len);
3382 }
3383
3384 // Do we need this for subtitles?
3385 // pkt->flags = AV_PKT_FLAG_KEY;
3386
3387 pkt->stream_index = st->index;
3388 pkt->pts = timecode;
3389
3390 // Do we need this for subtitles?
3391 // pkt->dts = timecode;
3392
3393 pkt->duration = duration;
3394 pkt->pos = pos;
3395
James Almer78b96be2018-03-26 18:02:373396 err = ff_packet_list_put(&matroska->queue, &matroska->queue_end, pkt, 0);
3397 if (err < 0) {
James Almer4f55b942018-04-04 16:53:123398 av_packet_unref(pkt);
James Almer78b96be2018-03-26 18:02:373399 return AVERROR(ENOMEM);
3400 }
Matthew Heaney818ebe92013-08-08 22:40:033401
3402 return 0;
3403}
3404
Luca Barbatoc831ebf2012-09-16 23:28:133405static int matroska_parse_frame(MatroskaDemuxContext *matroska,
Keiji Costantini84cfce92014-03-01 16:28:153406 MatroskaTrack *track, AVStream *st,
James Almer9703b7d2018-04-04 21:12:533407 AVBufferRef *buf, uint8_t *data, int pkt_size,
Michael Niedermayer8c51ea52012-09-20 18:37:263408 uint64_t timecode, uint64_t lace_duration,
Vignesh Venkatasubramanian30c5c452013-02-13 21:51:483409 int64_t pos, int is_keyframe,
Vignesh Venkatasubramanian7b0a8392013-09-10 18:12:213410 uint8_t *additional, uint64_t additional_id, int additional_size,
Jan Gerberf4b1ca92013-11-14 11:58:283411 int64_t discard_padding)
Luca Barbatoc831ebf2012-09-16 23:28:133412{
3413 MatroskaTrackEncoding *encodings = track->encodings.elem;
3414 uint8_t *pkt_data = data;
James Almerb8e75a22018-04-04 19:07:363415 int res;
James Almer2f0e0de2018-04-04 13:54:143416 AVPacket pktl, *pkt = &pktl;
Luca Barbatoc831ebf2012-09-16 23:28:133417
Frank Galliganb8531032013-03-07 16:11:383418 if (encodings && !encodings->type && encodings->scope & 1) {
Luca Barbatoc831ebf2012-09-16 23:28:133419 res = matroska_decode_buffer(&pkt_data, &pkt_size, track);
3420 if (res < 0)
3421 return res;
3422 }
3423
Anton Khirnov92005142014-06-18 18:42:523424 if (st->codecpar->codec_id == AV_CODEC_ID_WAVPACK) {
Anton Khirnov9b6f47c2013-05-27 07:44:273425 uint8_t *wv_data;
3426 res = matroska_parse_wavpack(track, pkt_data, &wv_data, &pkt_size);
3427 if (res < 0) {
Keiji Costantini84cfce92014-03-01 16:28:153428 av_log(matroska->ctx, AV_LOG_ERROR,
3429 "Error parsing a wavpack block.\n");
Anton Khirnov9b6f47c2013-05-27 07:44:273430 goto fail;
3431 }
3432 if (pkt_data != data)
3433 av_freep(&pkt_data);
3434 pkt_data = wv_data;
3435 }
3436
Andreas Rheinhardtaf50f0a2019-12-06 23:16:193437 if (st->codecpar->codec_id == AV_CODEC_ID_PRORES &&
3438 AV_RB32(pkt_data + 4) != MKBETAG('i', 'c', 'p', 'f')) {
James Almerb8e75a22018-04-04 19:07:363439 uint8_t *pr_data;
3440 res = matroska_parse_prores(track, pkt_data, &pr_data, &pkt_size);
3441 if (res < 0) {
3442 av_log(matroska->ctx, AV_LOG_ERROR,
3443 "Error parsing a prores block.\n");
3444 goto fail;
3445 }
3446 if (pkt_data != data)
3447 av_freep(&pkt_data);
3448 pkt_data = pr_data;
3449 }
Luca Barbatoc831ebf2012-09-16 23:28:133450
James Almer9703b7d2018-04-04 21:12:533451 av_init_packet(pkt);
3452 if (pkt_data != data)
3453 pkt->buf = av_buffer_create(pkt_data, pkt_size + AV_INPUT_BUFFER_PADDING_SIZE,
3454 NULL, NULL, 0);
3455 else
3456 pkt->buf = av_buffer_ref(buf);
3457
3458 if (!pkt->buf) {
Michael Niedermayer2fe4b622013-06-03 14:07:063459 res = AVERROR(ENOMEM);
3460 goto fail;
Luca Barbatoc831ebf2012-09-16 23:28:133461 }
3462
James Almer9703b7d2018-04-04 21:12:533463 pkt->data = pkt_data;
3464 pkt->size = pkt_size;
Keiji Costantini84cfce92014-03-01 16:28:153465 pkt->flags = is_keyframe;
Luca Barbatoc831ebf2012-09-16 23:28:133466 pkt->stream_index = st->index;
3467
Vignesh Venkatasubramanian30c5c452013-02-13 21:51:483468 if (additional_size > 0) {
3469 uint8_t *side_data = av_packet_new_side_data(pkt,
3470 AV_PKT_DATA_MATROSKA_BLOCKADDITIONAL,
Michael Niedermayera08ebf02013-02-13 23:55:253471 additional_size + 8);
Michael Niedermayerfb33bff2014-08-15 18:33:213472 if (!side_data) {
Hendrik Leppkesc2f861c2015-10-27 13:35:303473 av_packet_unref(pkt);
Vignesh Venkatasubramanian30c5c452013-02-13 21:51:483474 return AVERROR(ENOMEM);
3475 }
Michael Niedermayera08ebf02013-02-13 23:55:253476 AV_WB64(side_data, additional_id);
Vignesh Venkatasubramanian30c5c452013-02-13 21:51:483477 memcpy(side_data + 8, additional, additional_size);
3478 }
3479
Vignesh Venkatasubramanian7b0a8392013-09-10 18:12:213480 if (discard_padding) {
3481 uint8_t *side_data = av_packet_new_side_data(pkt,
3482 AV_PKT_DATA_SKIP_SAMPLES,
3483 10);
Michael Niedermayerfb33bff2014-08-15 18:33:213484 if (!side_data) {
Hendrik Leppkesc2f861c2015-10-27 13:35:303485 av_packet_unref(pkt);
Vignesh Venkatasubramanian7b0a8392013-09-10 18:12:213486 return AVERROR(ENOMEM);
3487 }
James Almer70c6a1b2016-11-05 20:46:523488 discard_padding = av_rescale_q(discard_padding,
Vignesh Venkatasubramanian7b0a8392013-09-10 18:12:213489 (AVRational){1, 1000000000},
James Almer70c6a1b2016-11-05 20:46:523490 (AVRational){1, st->codecpar->sample_rate});
3491 if (discard_padding > 0) {
3492 AV_WL32(side_data + 4, discard_padding);
3493 } else {
3494 AV_WL32(side_data, -discard_padding);
3495 }
Vignesh Venkatasubramanian7b0a8392013-09-10 18:12:213496 }
3497
Luca Barbatoc831ebf2012-09-16 23:28:133498 if (track->ms_compat)
3499 pkt->dts = timecode;
3500 else
3501 pkt->pts = timecode;
3502 pkt->pos = pos;
Hendrik Leppkesb01891a2015-09-29 13:14:593503 pkt->duration = lace_duration;
3504
wm4948f3c12015-09-26 16:13:553505#if FF_API_CONVERGENCE_DURATION
3506FF_DISABLE_DEPRECATION_WARNINGS
Derek Buitenhuis6f69f7a2016-04-10 19:58:153507 if (st->codecpar->codec_id == AV_CODEC_ID_SUBRIP) {
Michael Niedermayer8c51ea52012-09-20 18:37:263508 pkt->convergence_duration = lace_duration;
3509 }
wm4948f3c12015-09-26 16:13:553510FF_ENABLE_DEPRECATION_WARNINGS
3511#endif
Luca Barbatoc831ebf2012-09-16 23:28:133512
James Almer78b96be2018-03-26 18:02:373513 res = ff_packet_list_put(&matroska->queue, &matroska->queue_end, pkt, 0);
3514 if (res < 0) {
James Almer2f0e0de2018-04-04 13:54:143515 av_packet_unref(pkt);
James Almer78b96be2018-03-26 18:02:373516 return AVERROR(ENOMEM);
3517 }
Luca Barbatoc831ebf2012-09-16 23:28:133518
3519 return 0;
Keiji Costantini84cfce92014-03-01 16:28:153520
Anton Khirnov9b6f47c2013-05-27 07:44:273521fail:
3522 if (pkt_data != data)
3523 av_freep(&pkt_data);
3524 return res;
Luca Barbatoc831ebf2012-09-16 23:28:133525}
3526
James Almer9703b7d2018-04-04 21:12:533527static int matroska_parse_block(MatroskaDemuxContext *matroska, AVBufferRef *buf, uint8_t *data,
Aurelien Jacobsf7b96872008-08-05 00:42:053528 int size, int64_t pos, uint64_t cluster_time,
Luca Barbato7d843102012-09-17 00:48:023529 uint64_t block_duration, int is_keyframe,
Vignesh Venkatasubramanian30c5c452013-02-13 21:51:483530 uint8_t *additional, uint64_t additional_id, int additional_size,
Jan Gerberf4b1ca92013-11-14 11:58:283531 int64_t cluster_pos, int64_t discard_padding)
David Conradb061d892007-06-04 22:10:543532{
Aurelien Jacobsf14a2012008-09-09 11:54:353533 uint64_t timecode = AV_NOPTS_VALUE;
Aurelien Jacobs009ecd52008-08-05 00:40:123534 MatroskaTrack *track;
Andreas Rheinhardtd5274f82019-12-03 17:09:103535 AVIOContext pb;
Aurelien Jacobsa3467f82008-09-06 23:44:293536 int res = 0;
David Conradb061d892007-06-04 22:10:543537 AVStream *st;
David Conradb061d892007-06-04 22:10:543538 int16_t block_time;
Andreas Rheinhardt9ad1a6d2019-12-03 17:09:063539 uint32_t lace_size[256];
David Conradb061d892007-06-04 22:10:543540 int n, flags, laces = 0;
3541 uint64_t num;
Michael Niedermayer6158a3b2013-07-15 15:13:453542 int trust_default_duration = 1;
David Conradb061d892007-06-04 22:10:543543
Andreas Rheinhardtd5274f82019-12-03 17:09:103544 ffio_init_context(&pb, data, size, 0, NULL, NULL, NULL, NULL);
3545
3546 if ((n = ebml_read_num(matroska, &pb, 8, &num, 1)) < 0)
Luca Barbato721af292012-04-30 00:39:313547 return n;
David Conradb061d892007-06-04 22:10:543548 data += n;
3549 size -= n;
3550
David Conradb061d892007-06-04 22:10:543551 track = matroska_find_track_by_num(matroska, num);
Ronald S. Bultjed31fb1a2011-10-29 23:17:513552 if (!track || !track->stream) {
David Conradb061d892007-06-04 22:10:543553 av_log(matroska->ctx, AV_LOG_INFO,
Andreas Rheinhardtf767c682019-05-16 22:29:463554 "Invalid stream %"PRIu64"\n", num);
Reimar Döffingerd4931702012-02-13 22:06:193555 return AVERROR_INVALIDDATA;
Ronald S. Bultjed31fb1a2011-10-29 23:17:513556 } else if (size <= 3)
3557 return 0;
Aurelien Jacobs009ecd52008-08-05 00:40:123558 st = track->stream;
Aurelien Jacobs16f97ab2008-08-05 00:41:103559 if (st->discard >= AVDISCARD_ALL)
David Conradb061d892007-06-04 22:10:543560 return res;
Michael Niedermayer5864ce12012-09-20 19:46:353561 av_assert1(block_duration != AV_NOPTS_VALUE);
David Conradb061d892007-06-04 22:10:543562
Michael Niedermayer729fa552013-05-19 21:38:013563 block_time = sign_extend(AV_RB16(data), 16);
Keiji Costantini84cfce92014-03-01 16:28:153564 data += 2;
3565 flags = *data++;
3566 size -= 3;
David Conradb061d892007-06-04 22:10:543567 if (is_keyframe == -1)
Jean-Daniel Dupascc947f02010-03-31 12:29:583568 is_keyframe = flags & 0x80 ? AV_PKT_FLAG_KEY : 0;
David Conradb061d892007-06-04 22:10:543569
Keiji Costantini84cfce92014-03-01 16:28:153570 if (cluster_time != (uint64_t) -1 &&
3571 (block_time >= 0 || cluster_time >= -block_time)) {
Michael Niedermayerb5bc4362016-06-06 02:23:163572 timecode = cluster_time + block_time - track->codec_delay_in_track_tb;
Keiji Costantini84cfce92014-03-01 16:28:153573 if (track->type == MATROSKA_TRACK_TYPE_SUBTITLE &&
3574 timecode < track->end_timecode)
Aurelien Jacobs82360e62008-09-09 12:07:103575 is_keyframe = 0; /* overlapping subtitles are not key frame */
Michael Niedermayerb347ca92016-12-26 02:16:013576 if (is_keyframe) {
3577 ff_reduce_index(matroska->ctx, st->index);
Keiji Costantini84cfce92014-03-01 16:28:153578 av_add_index_entry(st, cluster_pos, timecode, 0, 0,
3579 AVINDEX_KEYFRAME);
Michael Niedermayerb347ca92016-12-26 02:16:013580 }
Aurelien Jacobsf14a2012008-09-09 11:54:353581 }
3582
Keiji Costantini84cfce92014-03-01 16:28:153583 if (matroska->skip_to_keyframe &&
3584 track->type != MATROSKA_TRACK_TYPE_SUBTITLE) {
Chris Cunninghamd59820f2016-07-21 19:01:453585 // Compare signed timecodes. Timecode may be negative due to codec delay
3586 // offset. We don't support timestamps greater than int64_t anyway - see
3587 // AVPacket's pts.
Chris Cunningham52ec4cc2016-07-28 01:33:303588 if ((int64_t)timecode < (int64_t)matroska->skip_to_timecode)
David Conradb061d892007-06-04 22:10:543589 return res;
Monty Montgomeryf6622f92013-09-11 06:00:313590 if (is_keyframe)
3591 matroska->skip_to_keyframe = 0;
3592 else if (!st->skip_to_keyframe) {
Reimar Döffinger4a958762012-04-13 22:17:303593 av_log(matroska->ctx, AV_LOG_ERROR, "File is broken, keyframes not correctly marked!\n");
3594 matroska->skip_to_keyframe = 0;
3595 }
David Conradb061d892007-06-04 22:10:543596 }
3597
Andreas Rheinhardtf74eaa12019-12-03 17:09:083598 res = matroska_parse_laces(matroska, &data, size, (flags & 0x06) >> 1,
Andreas Rheinhardtd5274f82019-12-03 17:09:103599 &pb, lace_size, &laces);
Andreas Rheinhardtdbe3be62019-12-03 17:09:093600 if (res < 0) {
3601 av_log(matroska->ctx, AV_LOG_ERROR, "Error parsing frame sizes.\n");
Andreas Rheinhardt9ad1a6d2019-12-03 17:09:063602 return res;
Andreas Rheinhardtdbe3be62019-12-03 17:09:093603 }
Aurelien Jacobseabb8ba2007-06-04 22:19:173604
Michael Niedermayer6158a3b2013-07-15 15:13:453605 if (track->audio.samplerate == 8000) {
3606 // If this is needed for more codecs, then add them here
Derek Buitenhuis6f69f7a2016-04-10 19:58:153607 if (st->codecpar->codec_id == AV_CODEC_ID_AC3) {
3608 if (track->audio.samplerate != st->codecpar->sample_rate || !st->codecpar->frame_size)
Michael Niedermayer6158a3b2013-07-15 15:13:453609 trust_default_duration = 0;
3610 }
3611 }
3612
3613 if (!block_duration && trust_default_duration)
Michael Niedermayer5864ce12012-09-20 19:46:353614 block_duration = track->default_duration * laces / matroska->time_scale;
Michael Niedermayer8c51ea52012-09-20 18:37:263615
3616 if (cluster_time != (uint64_t)-1 && (block_time >= 0 || cluster_time >= -block_time))
Luca Barbato7d843102012-09-17 00:48:023617 track->end_timecode =
3618 FFMAX(track->end_timecode, timecode + block_duration);
Michael Niedermayer8c51ea52012-09-20 18:37:263619
Luca Barbatoc831ebf2012-09-16 23:28:133620 for (n = 0; n < laces; n++) {
Michael Niedermayer5864ce12012-09-20 19:46:353621 int64_t lace_duration = block_duration*(n+1) / laces - block_duration*n / laces;
Michael Niedermayer8c51ea52012-09-20 18:37:263622
Andreas Rheinhardtc6f60b92019-12-02 10:04:553623 if (track->audio.buf) {
Luca Barbato25a80a92013-03-29 11:51:513624 res = matroska_parse_rm_audio(matroska, track, st, data,
3625 lace_size[n],
Michael Niedermayera6ec1e42012-09-20 21:43:203626 timecode, pos);
Luca Barbatoc831ebf2012-09-16 23:28:133627 if (res)
Andreas Rheinhardt9ad1a6d2019-12-03 17:09:063628 return res;
David Conradb061d892007-06-04 22:10:543629
Derek Buitenhuis6f69f7a2016-04-10 19:58:153630 } else if (st->codecpar->codec_id == AV_CODEC_ID_WEBVTT) {
Matthew Heaney818ebe92013-08-08 22:40:033631 res = matroska_parse_webvtt(matroska, track, st,
3632 data, lace_size[n],
3633 timecode, lace_duration,
3634 pos);
3635 if (res)
Andreas Rheinhardt9ad1a6d2019-12-03 17:09:063636 return res;
Luca Barbatoc831ebf2012-09-16 23:28:133637 } else {
James Almer9703b7d2018-04-04 21:12:533638 res = matroska_parse_frame(matroska, track, st, buf, data, lace_size[n],
Michael Niedermayerb3d9ab12014-03-07 22:46:373639 timecode, lace_duration, pos,
3640 !n ? is_keyframe : 0,
3641 additional, additional_id, additional_size,
3642 discard_padding);
Luca Barbatoc831ebf2012-09-16 23:28:133643 if (res)
Andreas Rheinhardt9ad1a6d2019-12-03 17:09:063644 return res;
David Conradb061d892007-06-04 22:10:543645 }
Luca Barbatoc831ebf2012-09-16 23:28:133646
3647 if (timecode != AV_NOPTS_VALUE)
Michael Niedermayer8c51ea52012-09-20 18:37:263648 timecode = lace_duration ? timecode + lace_duration : AV_NOPTS_VALUE;
Luca Barbatoc831ebf2012-09-16 23:28:133649 data += lace_size[n];
David Conradb061d892007-06-04 22:10:543650 }
3651
Andreas Rheinhardt9ad1a6d2019-12-03 17:09:063652 return 0;
David Conradb061d892007-06-04 22:10:543653}
3654
Andreas Rheinhardt70baf722019-05-16 22:29:583655static int matroska_parse_cluster(MatroskaDemuxContext *matroska)
Dale Curtis8336eb62012-04-19 18:12:243656{
Andreas Rheinhardtffa64a42019-05-16 22:29:593657 MatroskaCluster *cluster = &matroska->current_cluster;
3658 MatroskaBlock *block = &cluster->block;
3659 int res;
Andreas Rheinhardt865c5372019-05-16 22:30:083660
3661 av_assert0(matroska->num_levels <= 2);
3662
3663 if (matroska->num_levels == 1) {
Andreas Rheinhardt71c90882019-05-16 22:30:183664 res = ebml_parse(matroska, matroska_segment, NULL);
Andreas Rheinhardt865c5372019-05-16 22:30:083665
3666 if (res == 1) {
3667 /* Found a cluster: subtract the size of the ID already read. */
3668 cluster->pos = avio_tell(matroska->ctx->pb) - 4;
3669
3670 res = ebml_parse(matroska, matroska_cluster_enter, cluster);
3671 if (res < 0)
3672 return res;
3673 }
Dale Curtis8336eb62012-04-19 18:12:243674 }
3675
Andreas Rheinhardt865c5372019-05-16 22:30:083676 if (matroska->num_levels == 2) {
Andreas Rheinhardt865c5372019-05-16 22:30:083677 /* We are inside a cluster. */
3678 res = ebml_parse(matroska, matroska_cluster_parsing, cluster);
3679
3680 if (res >= 0 && block->bin.size > 0) {
Andreas Rheinhardtffa64a42019-05-16 22:29:593681 int is_keyframe = block->non_simple ? block->reference == INT64_MIN : -1;
3682 uint8_t* additional = block->additional.size > 0 ?
3683 block->additional.data : NULL;
Dale Curtis8336eb62012-04-19 18:12:243684
Andreas Rheinhardta9f05152019-05-16 22:30:093685 res = matroska_parse_block(matroska, block->bin.buf, block->bin.data,
Andreas Rheinhardtffa64a42019-05-16 22:29:593686 block->bin.size, block->bin.pos,
Andreas Rheinhardt865c5372019-05-16 22:30:083687 cluster->timecode, block->duration,
3688 is_keyframe, additional, block->additional_id,
3689 block->additional.size, cluster->pos,
Andreas Rheinhardtffa64a42019-05-16 22:29:593690 block->discard_padding);
Andreas Rheinhardt865c5372019-05-16 22:30:083691 }
Dale Curtis8336eb62012-04-19 18:12:243692
Andreas Rheinhardt60f75c92019-05-16 22:30:133693 ebml_free(matroska_blockgroup, block);
3694 memset(block, 0, sizeof(*block));
Andreas Rheinhardt865c5372019-05-16 22:30:083695 } else if (!matroska->num_levels) {
Andreas Rheinhardt3ed27552019-05-16 22:30:113696 if (!avio_feof(matroska->ctx->pb)) {
3697 avio_r8(matroska->ctx->pb);
3698 if (!avio_feof(matroska->ctx->pb)) {
3699 av_log(matroska->ctx, AV_LOG_WARNING, "File extends beyond "
3700 "end of segment.\n");
3701 return AVERROR_INVALIDDATA;
3702 }
3703 }
Andreas Rheinhardt865c5372019-05-16 22:30:083704 matroska->done = 1;
3705 return AVERROR_EOF;
3706 }
3707
Dale Curtis8336eb62012-04-19 18:12:243708 return res;
3709}
3710
Aurelien Jacobsf7b96872008-08-05 00:42:053711static int matroska_read_packet(AVFormatContext *s, AVPacket *pkt)
David Conradb061d892007-06-04 22:10:543712{
3713 MatroskaDemuxContext *matroska = s->priv_data;
Sophia Wang8c830622016-09-27 19:00:293714 int ret = 0;
David Conradb061d892007-06-04 22:10:543715
Andreas Rheinhardta3db9f62019-05-16 22:30:053716 if (matroska->resync_pos == -1) {
3717 // This can only happen if generic seeking has been used.
3718 matroska->resync_pos = avio_tell(s->pb);
3719 }
3720
Hendrik Leppkes8689d872011-07-06 17:57:113721 while (matroska_deliver_packet(matroska, pkt)) {
David Conradb061d892007-06-04 22:10:543722 if (matroska->done)
Sophia Wang8c830622016-09-27 19:00:293723 return (ret < 0) ? ret : AVERROR_EOF;
Andreas Rheinhardt3ed27552019-05-16 22:30:113724 if (matroska_parse_cluster(matroska) < 0 && !matroska->done)
Andreas Rheinhardta3db9f62019-05-16 22:30:053725 ret = matroska_resync(matroska, matroska->resync_pos);
David Conradb061d892007-06-04 22:10:543726 }
3727
Michael Niedermayerd1afa722019-02-06 14:29:383728 return 0;
David Conradb061d892007-06-04 22:10:543729}
3730
Aurelien Jacobsf7b96872008-08-05 00:42:053731static int matroska_read_seek(AVFormatContext *s, int stream_index,
3732 int64_t timestamp, int flags)
David Conradb061d892007-06-04 22:10:543733{
3734 MatroskaDemuxContext *matroska = s->priv_data;
Xiaohan Wang33301f02014-11-06 20:59:543735 MatroskaTrack *tracks = NULL;
David Conradb061d892007-06-04 22:10:543736 AVStream *st = s->streams[stream_index];
Andreas Rheinhardtc6bb8252019-05-16 22:29:453737 int i, index;
David Conradb061d892007-06-04 22:10:543738
Aaron Colwell31ad14c2011-07-09 05:48:433739 /* Parse the CUES now since we need the index data to seek. */
Reimar Döffinger47e015e2012-02-12 13:09:033740 if (matroska->cues_parsing_deferred > 0) {
Aaron Colwell31ad14c2011-07-09 05:48:433741 matroska->cues_parsing_deferred = 0;
Reimar Döffinger47e015e2012-02-12 13:09:033742 matroska_parse_cues(matroska);
Aaron Colwell31ad14c2011-07-09 05:48:433743 }
3744
Aurelien Jacobsa8fd7e72008-09-12 00:06:063745 if (!st->nb_index_entries)
Reimar Döffinger47e015e2012-02-12 13:09:033746 goto err;
Aurelien Jacobsa8fd7e72008-09-12 00:06:063747 timestamp = FFMAX(timestamp, st->index_entries[0].timestamp);
Aurelien Jacobsdfbbbdc2008-08-24 23:57:293748
Michael Niedermayera3920182014-10-22 02:21:393749 if ((index = av_index_search_timestamp(st, timestamp, flags)) < 0 || index == st->nb_index_entries - 1) {
Andreas Rheinhardt8a286e72019-05-16 22:30:033750 matroska_reset_status(matroska, 0, st->index_entries[st->nb_index_entries - 1].pos);
Michael Niedermayera3920182014-10-22 02:21:393751 while ((index = av_index_search_timestamp(st, timestamp, flags)) < 0 || index == st->nb_index_entries - 1) {
Aurelien Jacobs0dbddda2008-08-27 19:58:553752 matroska_clear_queue(matroska);
3753 if (matroska_parse_cluster(matroska) < 0)
3754 break;
3755 }
Aurelien Jacobs6bef5f92008-08-27 19:57:423756 }
David Conradb061d892007-06-04 22:10:543757
Aurelien Jacobs243cc4c2007-12-29 18:35:383758 matroska_clear_queue(matroska);
Reimar Döffinger47e015e2012-02-12 13:09:033759 if (index < 0 || (matroska->cues_parsing_deferred < 0 && index == st->nb_index_entries - 1))
3760 goto err;
Aurelien Jacobs243cc4c2007-12-29 18:35:383761
Xiaohan Wang33301f02014-11-06 20:59:543762 tracks = matroska->tracks.elem;
Keiji Costantini84cfce92014-03-01 16:28:153763 for (i = 0; i < matroska->tracks.nb_elem; i++) {
3764 tracks[i].audio.pkt_cnt = 0;
Reimar Döffingerb09e5062011-02-26 11:52:013765 tracks[i].audio.sub_packet_cnt = 0;
Keiji Costantini84cfce92014-03-01 16:28:153766 tracks[i].audio.buf_timecode = AV_NOPTS_VALUE;
3767 tracks[i].end_timecode = 0;
Aurelien Jacobsc1658252008-09-09 12:10:253768 }
3769
Andreas Rheinhardt8a286e72019-05-16 22:30:033770 /* We seek to a level 1 element, so set the appropriate status. */
3771 matroska_reset_status(matroska, 0, st->index_entries[index].pos);
Michael Niedermayer7c00d852013-02-07 20:34:353772 if (flags & AVSEEK_FLAG_ANY) {
3773 st->skip_to_keyframe = 0;
3774 matroska->skip_to_timecode = timestamp;
3775 } else {
3776 st->skip_to_keyframe = 1;
3777 matroska->skip_to_timecode = st->index_entries[index].timestamp;
3778 }
3779 matroska->skip_to_keyframe = 1;
Keiji Costantini84cfce92014-03-01 16:28:153780 matroska->done = 0;
Anton Khirnova2faa952011-10-16 13:03:303781 ff_update_cur_dts(s, st, st->index_entries[index].timestamp);
David Conradb061d892007-06-04 22:10:543782 return 0;
Reimar Döffinger47e015e2012-02-12 13:09:033783err:
3784 // slightly hackish but allows proper fallback to
3785 // the generic seeking code.
Andreas Rheinhardt8a286e72019-05-16 22:30:033786 matroska_reset_status(matroska, 0, -1);
Andreas Rheinhardta3db9f62019-05-16 22:30:053787 matroska->resync_pos = -1;
Reimar Döffinger47e015e2012-02-12 13:09:033788 matroska_clear_queue(matroska);
Reimar Döffinger4a958762012-04-13 22:17:303789 st->skip_to_keyframe =
Reimar Döffinger47e015e2012-02-12 13:09:033790 matroska->skip_to_keyframe = 0;
3791 matroska->done = 0;
Reimar Döffinger47e015e2012-02-12 13:09:033792 return -1;
David Conradb061d892007-06-04 22:10:543793}
3794
Aurelien Jacobsf7b96872008-08-05 00:42:053795static int matroska_read_close(AVFormatContext *s)
David Conradb061d892007-06-04 22:10:543796{
3797 MatroskaDemuxContext *matroska = s->priv_data;
Aurelien Jacobs2cbc8812008-08-05 00:40:313798 MatroskaTrack *tracks = matroska->tracks.elem;
Aurelien Jacobs70109c02008-08-05 00:41:133799 int n;
David Conradb061d892007-06-04 22:10:543800
Aurelien Jacobs34c9c1b2007-12-29 18:32:473801 matroska_clear_queue(matroska);
David Conradb061d892007-06-04 22:10:543802
Keiji Costantini84cfce92014-03-01 16:28:153803 for (n = 0; n < matroska->tracks.nb_elem; n++)
Aurelien Jacobs2cbc8812008-08-05 00:40:313804 if (tracks[n].type == MATROSKA_TRACK_TYPE_AUDIO)
Michael Niedermayer6e70e4a2015-01-06 11:48:383805 av_freep(&tracks[n].audio.buf);
Aurelien Jacobsce6f28b2008-08-05 00:40:583806 ebml_free(matroska_segment, matroska);
David Conradb061d892007-06-04 22:10:543807
3808 return 0;
3809}
3810
/* Description of the span between one Cue and the next, as filled in by
 * get_cue_desc(). All four fields are -1 when no span applies. */
typedef struct CueDesc {
    int64_t start_time_ns;  /* start time of the span */
    int64_t end_time_ns;    /* end time of the span */
    int64_t start_offset;   /* start position, relative to the segment start */
    int64_t end_offset;     /* end position, relative to the segment start */
} CueDesc;
3817
James Zern20aeee42017-04-17 17:59:313818/* This function searches all the Cues and returns the CueDesc corresponding to
Vignesh Venkatasubramanian5a206562014-07-07 19:52:373819 * the timestamp ts. Returned CueDesc will be such that start_time_ns <= ts <
3820 * end_time_ns. All 4 fields will be set to -1 if ts >= file's duration.
3821 */
3822static CueDesc get_cue_desc(AVFormatContext *s, int64_t ts, int64_t cues_start) {
3823 MatroskaDemuxContext *matroska = s->priv_data;
3824 CueDesc cue_desc;
3825 int i;
3826 int nb_index_entries = s->streams[0]->nb_index_entries;
3827 AVIndexEntry *index_entries = s->streams[0]->index_entries;
3828 if (ts >= matroska->duration * matroska->time_scale) return (CueDesc) {-1, -1, -1, -1};
3829 for (i = 1; i < nb_index_entries; i++) {
3830 if (index_entries[i - 1].timestamp * matroska->time_scale <= ts &&
3831 index_entries[i].timestamp * matroska->time_scale > ts) {
3832 break;
3833 }
3834 }
3835 --i;
3836 cue_desc.start_time_ns = index_entries[i].timestamp * matroska->time_scale;
3837 cue_desc.start_offset = index_entries[i].pos - matroska->segment_start;
3838 if (i != nb_index_entries - 1) {
3839 cue_desc.end_time_ns = index_entries[i + 1].timestamp * matroska->time_scale;
3840 cue_desc.end_offset = index_entries[i + 1].pos - matroska->segment_start;
3841 } else {
3842 cue_desc.end_time_ns = matroska->duration * matroska->time_scale;
3843 // FIXME: this needs special handling for files where Cues appear
3844 // before Clusters. the current logic assumes Cues appear after
3845 // Clusters.
3846 cue_desc.end_offset = cues_start - matroska->segment_start;
3847 }
3848 return cue_desc;
3849}
3850
3851static int webm_clusters_start_with_keyframe(AVFormatContext *s)
3852{
3853 MatroskaDemuxContext *matroska = s->priv_data;
Andreas Rheinhardt8a286e72019-05-16 22:30:033854 uint32_t id = matroska->current_id;
Vignesh Venkatasubramanian5a206562014-07-07 19:52:373855 int64_t cluster_pos, before_pos;
3856 int index, rv = 1;
3857 if (s->streams[0]->nb_index_entries <= 0) return 0;
3858 // seek to the first cluster using cues.
3859 index = av_index_search_timestamp(s->streams[0], 0, 0);
3860 if (index < 0) return 0;
3861 cluster_pos = s->streams[0]->index_entries[index].pos;
3862 before_pos = avio_tell(s->pb);
3863 while (1) {
Andreas Rheinhardt36aceb62019-05-16 22:29:493864 uint64_t cluster_id, cluster_length;
3865 int read;
Vignesh Venkatasubramanian5a206562014-07-07 19:52:373866 AVPacket *pkt;
3867 avio_seek(s->pb, cluster_pos, SEEK_SET);
3868 // read cluster id and length
Andreas Rheinhardt239c7362019-06-25 01:08:563869 read = ebml_read_num(matroska, matroska->ctx->pb, 4, &cluster_id, 1);
Andreas Rheinhardt36aceb62019-05-16 22:29:493870 if (read < 0 || cluster_id != 0xF43B675) // done with all clusters
Vignesh Venkatasubramanian5a206562014-07-07 19:52:373871 break;
Andreas Rheinhardt36aceb62019-05-16 22:29:493872 read = ebml_read_length(matroska, matroska->ctx->pb, &cluster_length);
3873 if (read < 0)
3874 break;
Andreas Rheinhardt8a286e72019-05-16 22:30:033875
3876 matroska_reset_status(matroska, 0, cluster_pos);
Vignesh Venkatasubramanian5a206562014-07-07 19:52:373877 matroska_clear_queue(matroska);
3878 if (matroska_parse_cluster(matroska) < 0 ||
James Almer78b96be2018-03-26 18:02:373879 !matroska->queue) {
Vignesh Venkatasubramanian5a206562014-07-07 19:52:373880 break;
3881 }
James Almer78b96be2018-03-26 18:02:373882 pkt = &matroska->queue->pkt;
Andreas Rheinhardt36aceb62019-05-16 22:29:493883 // 4 + read is the length of the cluster id and the cluster length field.
3884 cluster_pos += 4 + read + cluster_length;
Vignesh Venkatasubramanian5a206562014-07-07 19:52:373885 if (!(pkt->flags & AV_PKT_FLAG_KEY)) {
3886 rv = 0;
3887 break;
3888 }
3889 }
Andreas Rheinhardt8a286e72019-05-16 22:30:033890
3891 /* Restore the status after matroska_read_header: */
3892 matroska_reset_status(matroska, id, before_pos);
3893
Vignesh Venkatasubramanian5a206562014-07-07 19:52:373894 return rv;
3895}
3896
3897static int buffer_size_after_time_downloaded(int64_t time_ns, double search_sec, int64_t bps,
3898 double min_buffer, double* buffer,
3899 double* sec_to_download, AVFormatContext *s,
3900 int64_t cues_start)
3901{
3902 double nano_seconds_per_second = 1000000000.0;
3903 double time_sec = time_ns / nano_seconds_per_second;
3904 int rv = 0;
3905 int64_t time_to_search_ns = (int64_t)(search_sec * nano_seconds_per_second);
3906 int64_t end_time_ns = time_ns + time_to_search_ns;
3907 double sec_downloaded = 0.0;
3908 CueDesc desc_curr = get_cue_desc(s, time_ns, cues_start);
3909 if (desc_curr.start_time_ns == -1)
3910 return -1;
3911 *sec_to_download = 0.0;
3912
3913 // Check for non cue start time.
3914 if (time_ns > desc_curr.start_time_ns) {
3915 int64_t cue_nano = desc_curr.end_time_ns - time_ns;
3916 double percent = (double)(cue_nano) / (desc_curr.end_time_ns - desc_curr.start_time_ns);
3917 double cueBytes = (desc_curr.end_offset - desc_curr.start_offset) * percent;
3918 double timeToDownload = (cueBytes * 8.0) / bps;
3919
3920 sec_downloaded += (cue_nano / nano_seconds_per_second) - timeToDownload;
3921 *sec_to_download += timeToDownload;
3922
3923 // Check if the search ends within the first cue.
3924 if (desc_curr.end_time_ns >= end_time_ns) {
3925 double desc_end_time_sec = desc_curr.end_time_ns / nano_seconds_per_second;
3926 double percent_to_sub = search_sec / (desc_end_time_sec - time_sec);
3927 sec_downloaded = percent_to_sub * sec_downloaded;
3928 *sec_to_download = percent_to_sub * *sec_to_download;
3929 }
3930
3931 if ((sec_downloaded + *buffer) <= min_buffer) {
3932 return 1;
3933 }
3934
3935 // Get the next Cue.
3936 desc_curr = get_cue_desc(s, desc_curr.end_time_ns, cues_start);
3937 }
3938
3939 while (desc_curr.start_time_ns != -1) {
3940 int64_t desc_bytes = desc_curr.end_offset - desc_curr.start_offset;
3941 int64_t desc_ns = desc_curr.end_time_ns - desc_curr.start_time_ns;
3942 double desc_sec = desc_ns / nano_seconds_per_second;
3943 double bits = (desc_bytes * 8.0);
3944 double time_to_download = bits / bps;
3945
3946 sec_downloaded += desc_sec - time_to_download;
3947 *sec_to_download += time_to_download;
3948
3949 if (desc_curr.end_time_ns >= end_time_ns) {
3950 double desc_end_time_sec = desc_curr.end_time_ns / nano_seconds_per_second;
3951 double percent_to_sub = search_sec / (desc_end_time_sec - time_sec);
3952 sec_downloaded = percent_to_sub * sec_downloaded;
3953 *sec_to_download = percent_to_sub * *sec_to_download;
3954
3955 if ((sec_downloaded + *buffer) <= min_buffer)
3956 rv = 1;
3957 break;
3958 }
3959
3960 if ((sec_downloaded + *buffer) <= min_buffer) {
3961 rv = 1;
3962 break;
3963 }
3964
3965 desc_curr = get_cue_desc(s, desc_curr.end_time_ns, cues_start);
3966 }
3967 *buffer = *buffer + sec_downloaded;
3968 return rv;
3969}
3970
3971/* This function computes the bandwidth of the WebM file with the help of
3972 * buffer_size_after_time_downloaded() function. Both of these functions are
3973 * adapted from WebM Tools project and are adapted to work with FFmpeg's
3974 * Matroska parsing mechanism.
3975 *
3976 * Returns the bandwidth of the file on success; -1 on error.
3977 * */
3978static int64_t webm_dash_manifest_compute_bandwidth(AVFormatContext *s, int64_t cues_start)
3979{
3980 MatroskaDemuxContext *matroska = s->priv_data;
3981 AVStream *st = s->streams[0];
3982 double bandwidth = 0.0;
Michael Niedermayere240d012014-07-15 22:06:153983 int i;
3984
3985 for (i = 0; i < st->nb_index_entries; i++) {
Vignesh Venkatasubramanian5a206562014-07-07 19:52:373986 int64_t prebuffer_ns = 1000000000;
3987 int64_t time_ns = st->index_entries[i].timestamp * matroska->time_scale;
3988 double nano_seconds_per_second = 1000000000.0;
3989 int64_t prebuffered_ns = time_ns + prebuffer_ns;
3990 double prebuffer_bytes = 0.0;
3991 int64_t temp_prebuffer_ns = prebuffer_ns;
3992 int64_t pre_bytes, pre_ns;
3993 double pre_sec, prebuffer, bits_per_second;
3994 CueDesc desc_beg = get_cue_desc(s, time_ns, cues_start);
3995
3996 // Start with the first Cue.
3997 CueDesc desc_end = desc_beg;
3998
3999 // Figure out how much data we have downloaded for the prebuffer. This will
4000 // be used later to adjust the bits per sample to try.
4001 while (desc_end.start_time_ns != -1 && desc_end.end_time_ns < prebuffered_ns) {
4002 // Prebuffered the entire Cue.
4003 prebuffer_bytes += desc_end.end_offset - desc_end.start_offset;
4004 temp_prebuffer_ns -= desc_end.end_time_ns - desc_end.start_time_ns;
4005 desc_end = get_cue_desc(s, desc_end.end_time_ns, cues_start);
4006 }
4007 if (desc_end.start_time_ns == -1) {
4008 // The prebuffer is larger than the duration.
Vignesh Venkatasubramanianb1071db2014-10-01 17:13:314009 if (matroska->duration * matroska->time_scale >= prebuffered_ns)
4010 return -1;
4011 bits_per_second = 0.0;
4012 } else {
4013 // The prebuffer ends in the last Cue. Estimate how much data was
4014 // prebuffered.
4015 pre_bytes = desc_end.end_offset - desc_end.start_offset;
4016 pre_ns = desc_end.end_time_ns - desc_end.start_time_ns;
4017 pre_sec = pre_ns / nano_seconds_per_second;
4018 prebuffer_bytes +=
4019 pre_bytes * ((temp_prebuffer_ns / nano_seconds_per_second) / pre_sec);
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374020
Vignesh Venkatasubramanianb1071db2014-10-01 17:13:314021 prebuffer = prebuffer_ns / nano_seconds_per_second;
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374022
Vignesh Venkatasubramanianb1071db2014-10-01 17:13:314023 // Set this to 0.0 in case our prebuffer buffers the entire video.
4024 bits_per_second = 0.0;
4025 do {
4026 int64_t desc_bytes = desc_end.end_offset - desc_beg.start_offset;
4027 int64_t desc_ns = desc_end.end_time_ns - desc_beg.start_time_ns;
4028 double desc_sec = desc_ns / nano_seconds_per_second;
4029 double calc_bits_per_second = (desc_bytes * 8) / desc_sec;
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374030
Vignesh Venkatasubramanianb1071db2014-10-01 17:13:314031 // Drop the bps by the percentage of bytes buffered.
4032 double percent = (desc_bytes - prebuffer_bytes) / desc_bytes;
4033 double mod_bits_per_second = calc_bits_per_second * percent;
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374034
Vignesh Venkatasubramanianb1071db2014-10-01 17:13:314035 if (prebuffer < desc_sec) {
4036 double search_sec =
4037 (double)(matroska->duration * matroska->time_scale) / nano_seconds_per_second;
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374038
Vignesh Venkatasubramanianb1071db2014-10-01 17:13:314039 // Add 1 so the bits per second should be a little bit greater than file
4040 // datarate.
4041 int64_t bps = (int64_t)(mod_bits_per_second) + 1;
4042 const double min_buffer = 0.0;
4043 double buffer = prebuffer;
4044 double sec_to_download = 0.0;
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374045
Vignesh Venkatasubramanianb1071db2014-10-01 17:13:314046 int rv = buffer_size_after_time_downloaded(prebuffered_ns, search_sec, bps,
4047 min_buffer, &buffer, &sec_to_download,
4048 s, cues_start);
4049 if (rv < 0) {
4050 return -1;
4051 } else if (rv == 0) {
4052 bits_per_second = (double)(bps);
4053 break;
4054 }
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374055 }
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374056
Vignesh Venkatasubramanianb1071db2014-10-01 17:13:314057 desc_end = get_cue_desc(s, desc_end.end_time_ns, cues_start);
4058 } while (desc_end.start_time_ns != -1);
4059 }
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374060 if (bandwidth < bits_per_second) bandwidth = bits_per_second;
4061 }
4062 return (int64_t)bandwidth;
4063}
4064
Derek Buitenhuis6ba1c9b2017-04-21 15:40:354065static int webm_dash_manifest_cues(AVFormatContext *s, int64_t init_range)
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374066{
4067 MatroskaDemuxContext *matroska = s->priv_data;
4068 EbmlList *seekhead_list = &matroska->seekhead;
4069 MatroskaSeekhead *seekhead = seekhead_list->elem;
4070 char *buf;
Vignesh Venkatasubramanian080acf72014-08-25 16:15:134071 int64_t cues_start = -1, cues_end = -1, before_pos, bandwidth;
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374072 int i;
Derek Buitenhuis8e6b9ef2017-04-20 14:02:544073 int end = 0;
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374074
4075 // determine cues start and end positions
4076 for (i = 0; i < seekhead_list->nb_elem; i++)
4077 if (seekhead[i].id == MATROSKA_ID_CUES)
4078 break;
4079
4080 if (i >= seekhead_list->nb_elem) return -1;
4081
4082 before_pos = avio_tell(matroska->ctx->pb);
4083 cues_start = seekhead[i].pos + matroska->segment_start;
4084 if (avio_seek(matroska->ctx->pb, cues_start, SEEK_SET) == cues_start) {
Vignesh Venkatasubramanian8acb7652014-10-01 17:13:304085 // cues_end is computed as cues_start + cues_length + length of the
Andreas Rheinhardta27e5392019-05-16 22:29:544086 // Cues element ID (i.e. 4) + EBML length of the Cues element.
4087 // cues_end is inclusive and the above sum is reduced by 1.
4088 uint64_t cues_length, cues_id;
4089 int bytes_read;
Andreas Rheinhardt239c7362019-06-25 01:08:564090 bytes_read = ebml_read_num (matroska, matroska->ctx->pb, 4, &cues_id, 1);
Andreas Rheinhardta27e5392019-05-16 22:29:544091 if (bytes_read < 0 || cues_id != (MATROSKA_ID_CUES & 0xfffffff))
4092 return bytes_read < 0 ? bytes_read : AVERROR_INVALIDDATA;
4093 bytes_read = ebml_read_length(matroska, matroska->ctx->pb, &cues_length);
4094 if (bytes_read < 0)
4095 return bytes_read;
4096 cues_end = cues_start + 4 + bytes_read + cues_length - 1;
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374097 }
4098 avio_seek(matroska->ctx->pb, before_pos, SEEK_SET);
Vignesh Venkatasubramanian080acf72014-08-25 16:15:134099 if (cues_start == -1 || cues_end == -1) return -1;
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374100
4101 // parse the cues
4102 matroska_parse_cues(matroska);
4103
4104 // cues start
Reimar Döffingera0941c82014-07-29 19:10:394105 av_dict_set_int(&s->streams[0]->metadata, CUES_START, cues_start, 0);
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374106
4107 // cues end
Reimar Döffingera0941c82014-07-29 19:10:394108 av_dict_set_int(&s->streams[0]->metadata, CUES_END, cues_end, 0);
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374109
Andreas Rheinhardt60f75c92019-05-16 22:30:134110 // if the file has cues at the start, fix up the init range so that
Derek Buitenhuis6ba1c9b2017-04-21 15:40:354111 // it does not include it
4112 if (cues_start <= init_range)
4113 av_dict_set_int(&s->streams[0]->metadata, INITIALIZATION_RANGE, cues_start - 1, 0);
4114
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374115 // bandwidth
4116 bandwidth = webm_dash_manifest_compute_bandwidth(s, cues_start);
4117 if (bandwidth < 0) return -1;
Reimar Döffingera0941c82014-07-29 19:10:394118 av_dict_set_int(&s->streams[0]->metadata, BANDWIDTH, bandwidth, 0);
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374119
4120 // check if all clusters start with key frames
Reimar Döffingera0941c82014-07-29 19:10:394121 av_dict_set_int(&s->streams[0]->metadata, CLUSTER_KEYFRAME, webm_clusters_start_with_keyframe(s), 0);
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374122
4123 // store cue point timestamps as a comma separated list for checking subsegment alignment in
4124 // the muxer. assumes that each timestamp cannot be more than 20 characters long.
Carl Eugen Hoyos6871c172018-09-03 12:18:024125 buf = av_malloc_array(s->streams[0]->nb_index_entries, 20);
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374126 if (!buf) return -1;
4127 strcpy(buf, "");
4128 for (i = 0; i < s->streams[0]->nb_index_entries; i++) {
Carl Eugen Hoyos6871c172018-09-03 12:18:024129 int ret = snprintf(buf + end, 20,
Carl Eugen Hoyos73abde62018-12-10 00:55:154130 "%" PRId64"%s", s->streams[0]->index_entries[i].timestamp,
4131 i != s->streams[0]->nb_index_entries - 1 ? "," : "");
Derek Buitenhuis8e6b9ef2017-04-20 14:02:544132 if (ret <= 0 || (ret == 20 && i == s->streams[0]->nb_index_entries - 1)) {
4133 av_log(s, AV_LOG_ERROR, "timestamp too long.\n");
Steven Liucc25a882017-05-07 03:29:084134 av_free(buf);
Derek Buitenhuis8e6b9ef2017-04-20 14:02:544135 return AVERROR_INVALIDDATA;
4136 }
4137 end += ret;
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374138 }
Andreas Rheinhardt40d9cbd2019-11-10 04:07:314139 av_dict_set(&s->streams[0]->metadata, CUE_TIMESTAMPS,
4140 buf, AV_DICT_DONT_STRDUP_VAL);
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374141
4142 return 0;
4143}
4144
4145static int webm_dash_manifest_read_header(AVFormatContext *s)
4146{
4147 char *buf;
4148 int ret = matroska_read_header(s);
Derek Buitenhuis6ba1c9b2017-04-21 15:40:354149 int64_t init_range;
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374150 MatroskaTrack *tracks;
4151 MatroskaDemuxContext *matroska = s->priv_data;
4152 if (ret) {
4153 av_log(s, AV_LOG_ERROR, "Failed to read file headers\n");
4154 return -1;
4155 }
Andreas Cadhalpunff100c92016-11-07 23:42:234156 if (!s->nb_streams) {
4157 matroska_read_close(s);
4158 av_log(s, AV_LOG_ERROR, "No streams found\n");
4159 return AVERROR_INVALIDDATA;
4160 }
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374161
Vignesh Venkatasubramanian2171b7c2015-03-31 23:51:574162 if (!matroska->is_live) {
4163 buf = av_asprintf("%g", matroska->duration);
4164 if (!buf) return AVERROR(ENOMEM);
Andreas Rheinhardt40d9cbd2019-11-10 04:07:314165 av_dict_set(&s->streams[0]->metadata, DURATION,
4166 buf, AV_DICT_DONT_STRDUP_VAL);
Vignesh Venkatasubramanian2171b7c2015-03-31 23:51:574167
4168 // initialization range
4169 // 5 is the offset of Cluster ID.
Derek Buitenhuis6ba1c9b2017-04-21 15:40:354170 init_range = avio_tell(s->pb) - 5;
4171 av_dict_set_int(&s->streams[0]->metadata, INITIALIZATION_RANGE, init_range, 0);
Vignesh Venkatasubramanian2171b7c2015-03-31 23:51:574172 }
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374173
4174 // basename of the file
Marton Balint18ac6422017-12-29 22:30:144175 buf = strrchr(s->url, '/');
4176 av_dict_set(&s->streams[0]->metadata, FILENAME, buf ? ++buf : s->url, 0);
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374177
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374178 // track number
4179 tracks = matroska->tracks.elem;
Reimar Döffingera0941c82014-07-29 19:10:394180 av_dict_set_int(&s->streams[0]->metadata, TRACK_NUMBER, tracks[0].num, 0);
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374181
4182 // parse the cues and populate Cue related fields
Vignesh Venkatasubramanian62c27fd2017-04-12 04:33:284183 if (!matroska->is_live) {
Derek Buitenhuis6ba1c9b2017-04-21 15:40:354184 ret = webm_dash_manifest_cues(s, init_range);
Vignesh Venkatasubramanian62c27fd2017-04-12 04:33:284185 if (ret < 0) {
4186 av_log(s, AV_LOG_ERROR, "Error parsing Cues\n");
4187 return ret;
4188 }
4189 }
4190
4191 // use the bandwidth from the command line if it was provided
4192 if (matroska->bandwidth > 0) {
4193 av_dict_set_int(&s->streams[0]->metadata, BANDWIDTH,
4194 matroska->bandwidth, 0);
4195 }
4196 return 0;
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374197}
4198
4199static int webm_dash_manifest_read_packet(AVFormatContext *s, AVPacket *pkt)
4200{
4201 return AVERROR_EOF;
4202}
4203
Vignesh Venkatasubramanian2171b7c2015-03-31 23:51:574204#define OFFSET(x) offsetof(MatroskaDemuxContext, x)
4205static const AVOption options[] = {
Clément Bœsch43ecec02015-11-21 21:05:074206 { "live", "flag indicating that the input is a live file that only has the headers.", OFFSET(is_live), AV_OPT_TYPE_BOOL, {.i64 = 0}, 0, 1, AV_OPT_FLAG_DECODING_PARAM },
Vignesh Venkatasubramanian62c27fd2017-04-12 04:33:284207 { "bandwidth", "bandwidth of this stream to be specified in the DASH manifest.", OFFSET(bandwidth), AV_OPT_TYPE_INT, {.i64 = 0}, 0, INT_MAX, AV_OPT_FLAG_DECODING_PARAM },
Vignesh Venkatasubramanian2171b7c2015-03-31 23:51:574208 { NULL },
4209};
4210
4211static const AVClass webm_dash_class = {
4212 .class_name = "WebM DASH Manifest demuxer",
4213 .item_name = av_default_item_name,
4214 .option = options,
4215 .version = LIBAVUTIL_VERSION_INT,
4216};
4217
Diego Elio Pettenò66355be2011-01-25 22:03:284218AVInputFormat ff_matroska_demuxer = {
Anton Khirnovdfc2c4d2011-07-16 20:18:124219 .name = "matroska,webm",
Diego Biurrun67742472012-07-24 21:51:414220 .long_name = NULL_IF_CONFIG_SMALL("Matroska / WebM"),
Vittorio Giovaraf2583bc2014-07-23 08:49:244221 .extensions = "mkv,mk3d,mka,mks",
Anton Khirnovdfc2c4d2011-07-16 20:18:124222 .priv_data_size = sizeof(MatroskaDemuxContext),
4223 .read_probe = matroska_probe,
4224 .read_header = matroska_read_header,
4225 .read_packet = matroska_read_packet,
4226 .read_close = matroska_read_close,
4227 .read_seek = matroska_read_seek,
Luca Barbatofa385732014-03-13 21:14:434228 .mime_type = "audio/webm,audio/x-matroska,video/webm,video/x-matroska"
David Conradb061d892007-06-04 22:10:544229};
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374230
4231AVInputFormat ff_webm_dash_manifest_demuxer = {
4232 .name = "webm_dash_manifest",
4233 .long_name = NULL_IF_CONFIG_SMALL("WebM DASH Manifest"),
4234 .priv_data_size = sizeof(MatroskaDemuxContext),
4235 .read_header = webm_dash_manifest_read_header,
4236 .read_packet = webm_dash_manifest_read_packet,
4237 .read_close = matroska_read_close,
Vignesh Venkatasubramanian2171b7c2015-03-31 23:51:574238 .priv_class = &webm_dash_class,
Vignesh Venkatasubramanian5a206562014-07-07 19:52:374239};