FFmpeg
wavdec.c
Go to the documentation of this file.
1 /*
2  * WAV demuxer
3  * Copyright (c) 2001, 2002 Fabrice Bellard
4  *
5  * Sony Wave64 demuxer
6  * RF64 demuxer
7  * Copyright (c) 2009 Daniel Verkamp
8  *
9  * BW64 demuxer
10  *
11  * This file is part of FFmpeg.
12  *
13  * FFmpeg is free software; you can redistribute it and/or
14  * modify it under the terms of the GNU Lesser General Public
15  * License as published by the Free Software Foundation; either
16  * version 2.1 of the License, or (at your option) any later version.
17  *
18  * FFmpeg is distributed in the hope that it will be useful,
19  * but WITHOUT ANY WARRANTY; without even the implied warranty of
20  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
21  * Lesser General Public License for more details.
22  *
23  * You should have received a copy of the GNU Lesser General Public
24  * License along with FFmpeg; if not, write to the Free Software
25  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
26  */
27 
28 #include <stdint.h>
29 
30 #include "config_components.h"
31 #include "libavutil/avassert.h"
32 #include "libavutil/dict.h"
33 #include "libavutil/intreadwrite.h"
34 #include "libavutil/log.h"
35 #include "libavutil/mathematics.h"
36 #include "libavutil/opt.h"
37 #include "libavcodec/internal.h"
38 #include "avformat.h"
39 #include "avio.h"
40 #include "avio_internal.h"
41 #include "demux.h"
42 #include "id3v2.h"
43 #include "internal.h"
44 #include "metadata.h"
45 #include "pcm.h"
46 #include "riff.h"
47 #include "w64.h"
48 #include "spdif.h"
49 
50 typedef struct WAVDemuxContext {
51  const AVClass *class;
52  int64_t data_end;
53  int w64;
55  int64_t smv_data_ofs;
58  int smv_block;
60  int smv_eof;
61  int audio_eof;
63  int max_size;
64  int spdif;
66  int unaligned; // e.g. if an odd number of bytes ID3 tag was prepended
67  int rifx; // RIFX: integer byte order for parameters is big endian
69 
70 #define OFFSET(x) offsetof(WAVDemuxContext, x)
71 #define DEC AV_OPT_FLAG_DECODING_PARAM
72 static const AVOption demux_options[] = {
73 #define W64_DEMUXER_OPTIONS_OFFSET (1 * CONFIG_WAV_DEMUXER)
74 #if CONFIG_WAV_DEMUXER
75  { "ignore_length", "Ignore length", OFFSET(ignore_length), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, DEC },
76 #endif
77  { "max_size", "max size of single packet", OFFSET(max_size), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1 << 22, DEC },
78  { NULL },
79 };
80 
81 static void set_max_size(AVStream *st, WAVDemuxContext *wav)
82 {
83  if (wav->max_size <= 0) {
84  int max_size = ff_pcm_default_packet_size(st->codecpar);
85  wav->max_size = max_size < 0 ? 4096 : max_size;
86  }
87 }
88 
90 {
91  if (CONFIG_SPDIF_DEMUXER && s->streams[0]->codecpar->codec_tag == 1) {
92  enum AVCodecID codec;
93  int len = 1<<16;
94  int ret = ffio_ensure_seekback(s->pb, len);
95 
96  if (ret >= 0) {
97  uint8_t *buf = av_malloc(len + AV_INPUT_BUFFER_PADDING_SIZE);
98  if (!buf) {
99  ret = AVERROR(ENOMEM);
100  } else {
101  int64_t pos = avio_tell(s->pb);
102  len = ret = avio_read(s->pb, buf, len);
103  if (len >= 0) {
104  ret = ff_spdif_probe(buf, len, &codec);
106  s->streams[0]->codecpar->codec_id = codec;
107  wav->spdif = 1;
108  }
109  }
110  avio_seek(s->pb, pos, SEEK_SET);
111  av_free(buf);
112  }
113  }
114 
115  if (ret < 0)
116  av_log(s, AV_LOG_WARNING, "Cannot check for SPDIF\n");
117  }
118 }
119 
120 #if CONFIG_WAV_DEMUXER
121 
122 static int64_t next_tag(AVIOContext *pb, uint32_t *tag, int big_endian)
123 {
124  *tag = avio_rl32(pb);
125  if (!big_endian) {
126  return avio_rl32(pb);
127  } else {
128  return avio_rb32(pb);
129  }
130 }
131 
132 /* RIFF chunks are always at even offsets relative to where they start. */
133 static int64_t wav_seek_tag(WAVDemuxContext * wav, AVIOContext *s, int64_t offset, int whence)
134 {
135  offset += offset < INT64_MAX && offset + wav->unaligned & 1;
136 
137  return avio_seek(s, offset, whence);
138 }
139 
140 /* return the size of the found tag */
141 static int64_t find_tag(WAVDemuxContext * wav, AVIOContext *pb, uint32_t tag1)
142 {
143  unsigned int tag;
144  int64_t size;
145 
146  for (;;) {
147  if (avio_feof(pb))
148  return AVERROR_EOF;
149  size = next_tag(pb, &tag, wav->rifx);
150  if (tag == tag1)
151  break;
152  wav_seek_tag(wav, pb, size, SEEK_CUR);
153  }
154  return size;
155 }
156 
157 static int wav_probe(const AVProbeData *p)
158 {
159  /* check file header */
160  if (p->buf_size <= 32)
161  return 0;
162  if (!memcmp(p->buf + 8, "WAVE", 4)) {
163  if (!memcmp(p->buf, "RIFF", 4) || !memcmp(p->buf, "RIFX", 4))
164  /* Since the ACT demuxer has a standard WAV header at the top of
165  * its own, the returned score is decreased to avoid a probe
166  * conflict between ACT and WAV. */
167  return AVPROBE_SCORE_MAX - 1;
168  else if ((!memcmp(p->buf, "RF64", 4) ||
169  !memcmp(p->buf, "BW64", 4)) &&
170  !memcmp(p->buf + 12, "ds64", 4))
171  return AVPROBE_SCORE_MAX;
172  }
173  return 0;
174 }
175 
176 static void handle_stream_probing(AVStream *st)
177 {
179  FFStream *const sti = ffstream(st);
181  sti->probe_packets = FFMIN(sti->probe_packets, 32);
182  }
183 }
184 
185 static int wav_parse_fmt_tag(AVFormatContext *s, int64_t size, AVStream *st)
186 {
187  AVIOContext *pb = s->pb;
188  WAVDemuxContext *wav = s->priv_data;
189  int ret;
190 
191  /* parse fmt header */
192  ret = ff_get_wav_header(s, pb, st->codecpar, size, wav->rifx);
193  if (ret < 0)
194  return ret;
195  handle_stream_probing(st);
196 
198 
199  avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
200 
201  return 0;
202 }
203 
204 static int wav_parse_xma2_tag(AVFormatContext *s, int64_t size, AVStream *st)
205 {
206  AVIOContext *pb = s->pb;
207  int version, num_streams, i, channels = 0, ret;
208 
209  if (size < 36)
210  return AVERROR_INVALIDDATA;
211 
215 
216  version = avio_r8(pb);
217  if (version != 3 && version != 4)
218  return AVERROR_INVALIDDATA;
219  num_streams = avio_r8(pb);
220  if (size != (32 + ((version==3)?0:8) + 4*num_streams))
221  return AVERROR_INVALIDDATA;
222  avio_skip(pb, 10);
223  st->codecpar->sample_rate = avio_rb32(pb);
224  if (version == 4)
225  avio_skip(pb, 8);
226  avio_skip(pb, 4);
227  st->duration = avio_rb32(pb);
228  avio_skip(pb, 8);
229 
230  for (i = 0; i < num_streams; i++) {
231  channels += avio_r8(pb);
232  avio_skip(pb, 3);
233  }
237 
238  if (st->codecpar->ch_layout.nb_channels <= 0 || st->codecpar->sample_rate <= 0)
239  return AVERROR_INVALIDDATA;
240 
241  avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
242 
243  avio_seek(pb, -size, SEEK_CUR);
244  if ((ret = ff_get_extradata(s, st->codecpar, pb, size)) < 0)
245  return ret;
246 
247  return 0;
248 }
249 
250 static inline int wav_parse_bext_string(AVFormatContext *s, const char *key,
251  int length)
252 {
253  char temp[257];
254  int ret;
255 
256  av_assert0(length < sizeof(temp));
257  if ((ret = ffio_read_size(s->pb, temp, length)) < 0)
258  return ret;
259 
260  temp[length] = 0;
261 
262  if (strlen(temp))
263  return av_dict_set(&s->metadata, key, temp, 0);
264 
265  return 0;
266 }
267 
268 static int wav_parse_bext_tag(AVFormatContext *s, int64_t size)
269 {
270  char temp[131], *coding_history;
271  int ret, x;
272  uint64_t time_reference;
273  int64_t umid_parts[8], umid_mask = 0;
274 
275  if ((ret = wav_parse_bext_string(s, "description", 256)) < 0 ||
276  (ret = wav_parse_bext_string(s, "originator", 32)) < 0 ||
277  (ret = wav_parse_bext_string(s, "originator_reference", 32)) < 0 ||
278  (ret = wav_parse_bext_string(s, "origination_date", 10)) < 0 ||
279  (ret = wav_parse_bext_string(s, "origination_time", 8)) < 0)
280  return ret;
281 
282  time_reference = avio_rl64(s->pb);
283  snprintf(temp, sizeof(temp), "%"PRIu64, time_reference);
284  if ((ret = av_dict_set(&s->metadata, "time_reference", temp, 0)) < 0)
285  return ret;
286 
287  /* check if version is >= 1, in which case an UMID may be present */
288  if (avio_rl16(s->pb) >= 1) {
289  for (x = 0; x < 8; x++)
290  umid_mask |= umid_parts[x] = avio_rb64(s->pb);
291 
292  if (umid_mask) {
293  /* the string formatting below is per SMPTE 330M-2004 Annex C */
294  if (umid_parts[4] == 0 && umid_parts[5] == 0 &&
295  umid_parts[6] == 0 && umid_parts[7] == 0) {
296  /* basic UMID */
297  snprintf(temp, sizeof(temp),
298  "0x%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64,
299  umid_parts[0], umid_parts[1],
300  umid_parts[2], umid_parts[3]);
301  } else {
302  /* extended UMID */
303  snprintf(temp, sizeof(temp),
304  "0x%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64
305  "%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64,
306  umid_parts[0], umid_parts[1],
307  umid_parts[2], umid_parts[3],
308  umid_parts[4], umid_parts[5],
309  umid_parts[6], umid_parts[7]);
310  }
311 
312  if ((ret = av_dict_set(&s->metadata, "umid", temp, 0)) < 0)
313  return ret;
314  }
315 
316  avio_skip(s->pb, 190);
317  } else
318  avio_skip(s->pb, 254);
319 
320  if (size > 602) {
321  /* CodingHistory present */
322  size -= 602;
323 
324  if (!(coding_history = av_malloc(size + 1)))
325  return AVERROR(ENOMEM);
326 
327  if ((ret = ffio_read_size(s->pb, coding_history, size)) < 0) {
328  av_free(coding_history);
329  return ret;
330  }
331 
332  coding_history[size] = 0;
333  if ((ret = av_dict_set(&s->metadata, "coding_history", coding_history,
335  return ret;
336  }
337 
338  return 0;
339 }
340 
341 static const AVMetadataConv wav_metadata_conv[] = {
342  { "description", "comment" },
343  { "originator", "encoded_by" },
344  { "origination_date", "date" },
345  { "origination_time", "creation_time" },
346  { 0 },
347 };
348 
349 /* wav input */
350 static int wav_read_header(AVFormatContext *s)
351 {
352  int64_t size, av_uninit(data_size);
353  int64_t sample_count = 0;
354  int rf64 = 0, bw64 = 0;
355  uint32_t tag;
356  AVIOContext *pb = s->pb;
357  AVStream *st = NULL;
358  WAVDemuxContext *wav = s->priv_data;
359  int ret, got_fmt = 0, got_xma2 = 0;
360  int64_t next_tag_ofs, data_ofs = -1;
361 
362  wav->unaligned = avio_tell(s->pb) & 1;
363 
364  wav->smv_data_ofs = -1;
365 
366  /* read chunk ID */
367  tag = avio_rl32(pb);
368  switch (tag) {
369  case MKTAG('R', 'I', 'F', 'F'):
370  break;
371  case MKTAG('R', 'I', 'F', 'X'):
372  wav->rifx = 1;
373  break;
374  case MKTAG('R', 'F', '6', '4'):
375  rf64 = 1;
376  break;
377  case MKTAG('B', 'W', '6', '4'):
378  bw64 = 1;
379  break;
380  default:
381  av_log(s, AV_LOG_ERROR, "invalid start code %s in RIFF header\n",
382  av_fourcc2str(tag));
383  return AVERROR_INVALIDDATA;
384  }
385 
386  /* read chunk size */
387  avio_rl32(pb);
388 
389  /* read format */
390  if (avio_rl32(pb) != MKTAG('W', 'A', 'V', 'E')) {
391  av_log(s, AV_LOG_ERROR, "invalid format in RIFF header\n");
392  return AVERROR_INVALIDDATA;
393  }
394 
395  if (rf64 || bw64) {
396  if (avio_rl32(pb) != MKTAG('d', 's', '6', '4'))
397  return AVERROR_INVALIDDATA;
398  size = avio_rl32(pb);
399  if (size < 24)
400  return AVERROR_INVALIDDATA;
401  avio_rl64(pb); /* RIFF size */
402 
403  data_size = avio_rl64(pb);
404  sample_count = avio_rl64(pb);
405 
406  if (data_size < 0 || sample_count < 0) {
407  av_log(s, AV_LOG_ERROR, "negative data_size and/or sample_count in "
408  "ds64: data_size = %"PRId64", sample_count = %"PRId64"\n",
409  data_size, sample_count);
410  return AVERROR_INVALIDDATA;
411  }
412  avio_skip(pb, size - 24); /* skip rest of ds64 chunk */
413 
414  }
415 
416  /* Create the audio stream now so that its index is always zero */
417  st = avformat_new_stream(s, NULL);
418  if (!st)
419  return AVERROR(ENOMEM);
420 
421  for (;;) {
422  AVStream *vst;
423  size = next_tag(pb, &tag, wav->rifx);
424  next_tag_ofs = avio_tell(pb) + size;
425 
426  if (avio_feof(pb))
427  break;
428 
429  switch (tag) {
430  case MKTAG('f', 'm', 't', ' '):
431  /* only parse the first 'fmt ' tag found */
432  if (!got_xma2 && !got_fmt && (ret = wav_parse_fmt_tag(s, size, st)) < 0) {
433  return ret;
434  } else if (got_fmt)
435  av_log(s, AV_LOG_WARNING, "found more than one 'fmt ' tag\n");
436 
437  got_fmt = 1;
438  break;
439  case MKTAG('X', 'M', 'A', '2'):
440  /* only parse the first 'XMA2' tag found */
441  if (!got_fmt && !got_xma2 && (ret = wav_parse_xma2_tag(s, size, st)) < 0) {
442  return ret;
443  } else if (got_xma2)
444  av_log(s, AV_LOG_WARNING, "found more than one 'XMA2' tag\n");
445 
446  got_xma2 = 1;
447  break;
448  case MKTAG('d', 'a', 't', 'a'):
449  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL) && !got_fmt && !got_xma2) {
451  "found no 'fmt ' tag before the 'data' tag\n");
452  return AVERROR_INVALIDDATA;
453  }
454 
455  if (rf64 || bw64) {
456  next_tag_ofs = wav->data_end = av_sat_add64(avio_tell(pb), data_size);
457  } else if (size != 0xFFFFFFFF) {
458  data_size = size;
459  next_tag_ofs = wav->data_end = size ? next_tag_ofs : INT64_MAX;
460  } else {
461  av_log(s, AV_LOG_WARNING, "Ignoring maximum wav data size, "
462  "file may be invalid\n");
463  data_size = 0;
464  next_tag_ofs = wav->data_end = INT64_MAX;
465  }
466 
467  data_ofs = avio_tell(pb);
468 
469  /* don't look for footer metadata if we can't seek or if we don't
470  * know where the data tag ends
471  */
472  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL) || (!(rf64 && !bw64) && !size))
473  goto break_loop;
474  break;
475  case MKTAG('f', 'a', 'c', 't'):
476  if (!sample_count)
477  sample_count = (!wav->rifx ? avio_rl32(pb) : avio_rb32(pb));
478  break;
479  case MKTAG('b', 'e', 'x', 't'):
480  if ((ret = wav_parse_bext_tag(s, size)) < 0)
481  return ret;
482  break;
483  case MKTAG('S','M','V','0'):
484  if (!got_fmt) {
485  av_log(s, AV_LOG_ERROR, "found no 'fmt ' tag before the 'SMV0' tag\n");
486  return AVERROR_INVALIDDATA;
487  }
488  // SMV file, a wav file with video appended.
489  if (size != MKTAG('0','2','0','0')) {
490  av_log(s, AV_LOG_ERROR, "Unknown SMV version found\n");
491  goto break_loop;
492  }
493  av_log(s, AV_LOG_DEBUG, "Found SMV data\n");
494  wav->smv_given_first = 0;
495  vst = avformat_new_stream(s, NULL);
496  if (!vst)
497  return AVERROR(ENOMEM);
498  wav->vst = vst;
499  avio_r8(pb);
500  vst->id = 1;
503  vst->codecpar->width = avio_rl24(pb);
504  vst->codecpar->height = avio_rl24(pb);
505  if ((ret = ff_alloc_extradata(vst->codecpar, 4)) < 0) {
506  av_log(s, AV_LOG_ERROR, "Could not allocate extradata.\n");
507  return ret;
508  }
509  size = avio_rl24(pb);
510  wav->smv_data_ofs = avio_tell(pb) + (size - 5) * 3;
511  avio_rl24(pb);
512  wav->smv_block_size = avio_rl24(pb);
513  if (!wav->smv_block_size)
514  return AVERROR_INVALIDDATA;
515  avpriv_set_pts_info(vst, 32, 1, avio_rl24(pb));
516  vst->duration = avio_rl24(pb);
517  avio_rl24(pb);
518  avio_rl24(pb);
519  wav->smv_frames_per_jpeg = avio_rl24(pb);
520  if (wav->smv_frames_per_jpeg > 65536) {
521  av_log(s, AV_LOG_ERROR, "too many frames per jpeg\n");
522  return AVERROR_INVALIDDATA;
523  }
525  goto break_loop;
526  case MKTAG('L', 'I', 'S', 'T'):
527  case MKTAG('l', 'i', 's', 't'):
528  if (size < 4) {
529  av_log(s, AV_LOG_ERROR, "too short LIST tag\n");
530  return AVERROR_INVALIDDATA;
531  }
532  switch (avio_rl32(pb)) {
533  case MKTAG('I', 'N', 'F', 'O'):
534  ff_read_riff_info(s, size - 4);
535  break;
536  case MKTAG('a', 'd', 't', 'l'):
537  if (s->nb_chapters > 0) {
538  while (avio_tell(pb) < next_tag_ofs &&
539  !avio_feof(pb)) {
540  char cue_label[512];
541  unsigned id, sub_size;
542 
543  if (avio_rl32(pb) != MKTAG('l', 'a', 'b', 'l'))
544  break;
545 
546  sub_size = avio_rl32(pb);
547  if (sub_size < 5)
548  break;
549  id = avio_rl32(pb);
550  avio_get_str(pb, sub_size - 4, cue_label, sizeof(cue_label));
551  avio_skip(pb, avio_tell(pb) & 1);
552 
553  for (int i = 0; i < s->nb_chapters; i++) {
554  if (s->chapters[i]->id == id) {
555  av_dict_set(&s->chapters[i]->metadata, "title", cue_label, 0);
556  break;
557  }
558  }
559  }
560  }
561  break;
562  }
563  break;
564  case MKTAG('I', 'D', '3', ' '):
565  case MKTAG('i', 'd', '3', ' '): {
566  ID3v2ExtraMeta *id3v2_extra_meta;
567  ff_id3v2_read(s, ID3v2_DEFAULT_MAGIC, &id3v2_extra_meta, 0);
568  if (id3v2_extra_meta) {
569  ff_id3v2_parse_apic(s, id3v2_extra_meta);
570  ff_id3v2_parse_chapters(s, id3v2_extra_meta);
571  ff_id3v2_parse_priv(s, id3v2_extra_meta);
572  }
573  ff_id3v2_free_extra_meta(&id3v2_extra_meta);
574  }
575  break;
576  case MKTAG('c', 'u', 'e', ' '):
577  if (size >= 4 && got_fmt && st->codecpar->sample_rate > 0) {
578  AVRational tb = {1, st->codecpar->sample_rate};
579  unsigned nb_cues = avio_rl32(pb);
580 
581  if (size >= nb_cues * 24LL + 4LL) {
582  for (int i = 0; i < nb_cues; i++) {
583  unsigned offset, id = avio_rl32(pb);
584 
585  if (avio_feof(pb))
586  return AVERROR_INVALIDDATA;
587 
588  avio_skip(pb, 16);
589  offset = avio_rl32(pb);
590 
592  return AVERROR(ENOMEM);
593  }
594  }
595  }
596  break;
597  }
598 
599  /* seek to next tag unless we know that we'll run into EOF */
600  if ((avio_size(pb) > 0 && next_tag_ofs >= avio_size(pb)) ||
601  wav_seek_tag(wav, pb, next_tag_ofs, SEEK_SET) < 0) {
602  break;
603  }
604  }
605 
606 break_loop:
607  if (!got_fmt && !got_xma2) {
608  av_log(s, AV_LOG_ERROR, "no 'fmt ' or 'XMA2' tag found\n");
609  return AVERROR_INVALIDDATA;
610  }
611 
612  if (data_ofs < 0) {
613  av_log(s, AV_LOG_ERROR, "no 'data' tag found\n");
614  return AVERROR_INVALIDDATA;
615  }
616 
617  avio_seek(pb, data_ofs, SEEK_SET);
618 
619  if (data_size > (INT64_MAX>>3)) {
620  av_log(s, AV_LOG_WARNING, "Data size %"PRId64" is too large\n", data_size);
621  data_size = 0;
622  }
623 
624  if ( st->codecpar->bit_rate > 0 && data_size > 0
625  && st->codecpar->sample_rate > 0
626  && sample_count > 0 && st->codecpar->ch_layout.nb_channels > 1
627  && sample_count % st->codecpar->ch_layout.nb_channels == 0) {
628  if (fabs(8.0 * data_size * st->codecpar->ch_layout.nb_channels * st->codecpar->sample_rate /
629  sample_count /st->codecpar->bit_rate - 1.0) < 0.3)
630  sample_count /= st->codecpar->ch_layout.nb_channels;
631  }
632 
633  if (data_size > 0 && sample_count && st->codecpar->ch_layout.nb_channels &&
634  (data_size << 3) / sample_count / st->codecpar->ch_layout.nb_channels > st->codecpar->bits_per_coded_sample + 1) {
635  av_log(s, AV_LOG_WARNING, "ignoring wrong sample_count %"PRId64"\n", sample_count);
636  sample_count = 0;
637  }
638 
639  /* G.729 hack (for Ticket4577)
640  * FIXME: Come up with cleaner, more general solution */
641  if (st->codecpar->codec_id == AV_CODEC_ID_G729 && sample_count && (data_size << 3) > sample_count) {
642  av_log(s, AV_LOG_WARNING, "ignoring wrong sample_count %"PRId64"\n", sample_count);
643  sample_count = 0;
644  }
645 
646  if (!sample_count || av_get_exact_bits_per_sample(st->codecpar->codec_id) > 0)
647  if ( st->codecpar->ch_layout.nb_channels
648  && data_size
650  && wav->data_end <= avio_size(pb))
651  sample_count = (data_size << 3)
652  /
654 
655  if (sample_count)
656  st->duration = sample_count;
657 
660  st->codecpar->bits_per_coded_sample == 32 &&
661  st->codecpar->extradata_size == 2 &&
662  AV_RL16(st->codecpar->extradata) == 1) {
665  } else if (st->codecpar->codec_id == AV_CODEC_ID_PCM_S24LE &&
667  st->codecpar->bits_per_coded_sample == 24) {
669  } else if (st->codecpar->codec_id == AV_CODEC_ID_XMA1 ||
671  st->codecpar->block_align = 2048;
672  } else if (st->codecpar->codec_id == AV_CODEC_ID_ADPCM_MS && st->codecpar->ch_layout.nb_channels > 2 &&
673  st->codecpar->block_align < INT_MAX / st->codecpar->ch_layout.nb_channels) {
675  }
676 
677  ff_metadata_conv_ctx(s, NULL, wav_metadata_conv);
679 
680  set_spdif(s, wav);
681  set_max_size(st, wav);
682 
683  return 0;
684 }
685 
686 /**
687  * Find chunk with w64 GUID by skipping over other chunks.
688  * @return the size of the found chunk
689  */
690 static int64_t find_guid(AVIOContext *pb, const uint8_t guid1[16])
691 {
692  uint8_t guid[16];
693  int64_t size;
694 
695  while (!avio_feof(pb)) {
696  avio_read(pb, guid, 16);
697  size = avio_rl64(pb);
698  if (size <= 24 || size > INT64_MAX - 8)
699  return AVERROR_INVALIDDATA;
700  if (!memcmp(guid, guid1, 16))
701  return size;
702  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 24);
703  }
704  return AVERROR_EOF;
705 }
706 
707 static int wav_read_packet(AVFormatContext *s, AVPacket *pkt)
708 {
709  int ret, size;
710  int64_t left;
711  WAVDemuxContext *wav = s->priv_data;
712  AVStream *st = s->streams[0];
713 
714  if (CONFIG_SPDIF_DEMUXER && wav->spdif == 1)
715  return ff_spdif_read_packet(s, pkt);
716 
717  if (wav->smv_data_ofs > 0) {
718  int64_t audio_dts, video_dts;
719  AVStream *vst = wav->vst;
720 smv_retry:
723 
725  /*We always return a video frame first to get the pixel format first*/
726  wav->smv_last_stream = wav->smv_given_first ?
728  audio_dts, st->time_base) > 0 : 0;
729  wav->smv_given_first = 1;
730  }
731  wav->smv_last_stream = !wav->smv_last_stream;
732  wav->smv_last_stream |= wav->audio_eof;
733  wav->smv_last_stream &= !wav->smv_eof;
734  if (wav->smv_last_stream) {
735  uint64_t old_pos = avio_tell(s->pb);
736  uint64_t new_pos = wav->smv_data_ofs +
737  wav->smv_block * (int64_t)wav->smv_block_size;
738  if (avio_seek(s->pb, new_pos, SEEK_SET) < 0) {
739  ret = AVERROR_EOF;
740  goto smv_out;
741  }
742  size = avio_rl24(s->pb);
743  if (size > wav->smv_block_size) {
744  ret = AVERROR_EOF;
745  goto smv_out;
746  }
747  ret = av_get_packet(s->pb, pkt, size);
748  if (ret < 0)
749  goto smv_out;
750  pkt->pos -= 3;
751  pkt->pts = wav->smv_block * wav->smv_frames_per_jpeg;
753  wav->smv_block++;
754 
755  pkt->stream_index = vst->index;
756 smv_out:
757  avio_seek(s->pb, old_pos, SEEK_SET);
758  if (ret == AVERROR_EOF) {
759  wav->smv_eof = 1;
760  goto smv_retry;
761  }
762  return ret;
763  }
764  }
765 
766  left = wav->data_end - avio_tell(s->pb);
767  if (wav->ignore_length)
768  left = INT_MAX;
769  if (left <= 0) {
770  if (CONFIG_W64_DEMUXER && wav->w64)
771  left = find_guid(s->pb, ff_w64_guid_data) - 24;
772  else
773  left = find_tag(wav, s->pb, MKTAG('d', 'a', 't', 'a'));
774  if (left < 0) {
775  wav->audio_eof = 1;
776  if (wav->smv_data_ofs > 0 && !wav->smv_eof)
777  goto smv_retry;
778  return AVERROR_EOF;
779  }
780  if (INT64_MAX - left < avio_tell(s->pb))
781  return AVERROR_INVALIDDATA;
782  wav->data_end = avio_tell(s->pb) + left;
783  }
784 
785  size = wav->max_size;
786  if (st->codecpar->block_align > 1) {
787  if (size < st->codecpar->block_align)
788  size = st->codecpar->block_align;
789  size = (size / st->codecpar->block_align) * st->codecpar->block_align;
790  }
791  size = FFMIN(size, left);
792  ret = av_get_packet(s->pb, pkt, size);
793  if (ret < 0)
794  return ret;
795  pkt->stream_index = 0;
796 
797  return ret;
798 }
799 
800 static int wav_read_seek(AVFormatContext *s,
801  int stream_index, int64_t timestamp, int flags)
802 {
803  WAVDemuxContext *wav = s->priv_data;
804  AVStream *ast = s->streams[0], *vst = wav->vst;
805  wav->smv_eof = 0;
806  wav->audio_eof = 0;
807 
808  if (stream_index != 0 && (!vst || stream_index != vst->index))
809  return AVERROR(EINVAL);
810  if (wav->smv_data_ofs > 0) {
811  int64_t smv_timestamp = timestamp;
812  if (stream_index == 0)
813  smv_timestamp = av_rescale_q(timestamp, ast->time_base, vst->time_base);
814  else
815  timestamp = av_rescale_q(smv_timestamp, vst->time_base, ast->time_base);
816  if (wav->smv_frames_per_jpeg > 0) {
817  wav->smv_block = smv_timestamp / wav->smv_frames_per_jpeg;
818  }
819  }
820 
821  switch (ast->codecpar->codec_id) {
822  case AV_CODEC_ID_MP2:
823  case AV_CODEC_ID_MP3:
824  case AV_CODEC_ID_AC3:
825  case AV_CODEC_ID_DTS:
826  case AV_CODEC_ID_XMA2:
827  /* use generic seeking with dynamically generated indexes */
828  return -1;
829  default:
830  break;
831  }
832  return ff_pcm_read_seek(s, 0, timestamp, flags);
833 }
834 
835 static const AVClass wav_demuxer_class = {
836  .class_name = "WAV demuxer",
837  .item_name = av_default_item_name,
838  .option = demux_options,
839  .version = LIBAVUTIL_VERSION_INT,
840 };
842  .p.name = "wav",
843  .p.long_name = NULL_IF_CONFIG_SMALL("WAV / WAVE (Waveform Audio)"),
844  .p.flags = AVFMT_GENERIC_INDEX,
845  .p.codec_tag = ff_wav_codec_tags_list,
846  .p.priv_class = &wav_demuxer_class,
847  .priv_data_size = sizeof(WAVDemuxContext),
848  .read_probe = wav_probe,
849  .read_header = wav_read_header,
850  .read_packet = wav_read_packet,
851  .read_seek = wav_read_seek,
852 };
853 #endif /* CONFIG_WAV_DEMUXER */
854 
855 #if CONFIG_W64_DEMUXER
856 static int w64_probe(const AVProbeData *p)
857 {
858  if (p->buf_size <= 40)
859  return 0;
860  if (!memcmp(p->buf, ff_w64_guid_riff, 16) &&
861  !memcmp(p->buf + 24, ff_w64_guid_wave, 16))
862  return AVPROBE_SCORE_MAX;
863  else
864  return 0;
865 }
866 
867 static int w64_read_header(AVFormatContext *s)
868 {
869  int64_t size, data_ofs = 0;
870  AVIOContext *pb = s->pb;
871  WAVDemuxContext *wav = s->priv_data;
872  AVStream *st;
873  uint8_t guid[16];
874  int ret;
875 
876  avio_read(pb, guid, 16);
877  if (memcmp(guid, ff_w64_guid_riff, 16))
878  return AVERROR_INVALIDDATA;
879 
880  /* riff + wave + fmt + sizes */
881  if (avio_rl64(pb) < 16 + 8 + 16 + 8 + 16 + 8)
882  return AVERROR_INVALIDDATA;
883 
884  avio_read(pb, guid, 16);
885  if (memcmp(guid, ff_w64_guid_wave, 16)) {
886  av_log(s, AV_LOG_ERROR, "could not find wave guid\n");
887  return AVERROR_INVALIDDATA;
888  }
889 
890  wav->w64 = 1;
891 
892  st = avformat_new_stream(s, NULL);
893  if (!st)
894  return AVERROR(ENOMEM);
895 
896  while (!avio_feof(pb)) {
897  if (avio_read(pb, guid, 16) != 16)
898  break;
899  size = avio_rl64(pb);
900  if (size <= 24 || INT64_MAX - size < avio_tell(pb)) {
901  if (data_ofs)
902  break;
903  return AVERROR_INVALIDDATA;
904  }
905 
906  if (!memcmp(guid, ff_w64_guid_fmt, 16)) {
907  /* subtract chunk header size - normal wav file doesn't count it */
908  ret = ff_get_wav_header(s, pb, st->codecpar, size - 24, 0);
909  if (ret < 0)
910  return ret;
911  avio_skip(pb, FFALIGN(size, INT64_C(8)) - size);
912  if (st->codecpar->block_align &&
914  st->codecpar->bits_per_coded_sample < 128) {
915  int block_align = st->codecpar->block_align;
916 
917  block_align = FFMAX(block_align,
918  ((st->codecpar->bits_per_coded_sample + 7) / 8) *
920  if (block_align > st->codecpar->block_align) {
921  av_log(s, AV_LOG_WARNING, "invalid block_align: %d, broken file.\n",
922  st->codecpar->block_align);
923  st->codecpar->block_align = block_align;
924  }
925  }
926  avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
927  } else if (!memcmp(guid, ff_w64_guid_fact, 16)) {
928  int64_t samples;
929 
930  samples = avio_rl64(pb);
931  if (samples > 0)
932  st->duration = samples;
933  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 32);
934  } else if (!memcmp(guid, ff_w64_guid_data, 16)) {
935  wav->data_end = avio_tell(pb) + size - 24;
936 
937  data_ofs = avio_tell(pb);
938  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL))
939  break;
940 
941  avio_skip(pb, size - 24);
942  } else if (!memcmp(guid, ff_w64_guid_summarylist, 16)) {
943  int64_t start, end, cur;
944  uint32_t count, chunk_size, i;
945  int64_t filesize = avio_size(s->pb);
946 
947  start = avio_tell(pb);
948  end = start + FFALIGN(size, INT64_C(8)) - 24;
949  count = avio_rl32(pb);
950 
951  for (i = 0; i < count; i++) {
952  char chunk_key[5], *value;
953 
954  if (avio_feof(pb) || (cur = avio_tell(pb)) < 0 || cur > end - 8 /* = tag + size */)
955  break;
956 
957  chunk_key[4] = 0;
958  avio_read(pb, chunk_key, 4);
959  chunk_size = avio_rl32(pb);
960  if (chunk_size == UINT32_MAX || (filesize >= 0 && chunk_size > filesize))
961  return AVERROR_INVALIDDATA;
962 
963  value = av_malloc(chunk_size + 1);
964  if (!value)
965  return AVERROR(ENOMEM);
966 
967  ret = avio_get_str16le(pb, chunk_size, value, chunk_size);
968  if (ret < 0) {
969  av_free(value);
970  return ret;
971  }
972  avio_skip(pb, chunk_size - ret);
973 
974  av_dict_set(&s->metadata, chunk_key, value, AV_DICT_DONT_STRDUP_VAL);
975  }
976 
977  avio_skip(pb, end - avio_tell(pb));
978  } else {
979  av_log(s, AV_LOG_DEBUG, "unknown guid: "FF_PRI_GUID"\n", FF_ARG_GUID(guid));
980  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 24);
981  }
982  }
983 
984  if (!data_ofs)
985  return AVERROR_EOF;
986 
987  ff_metadata_conv_ctx(s, NULL, wav_metadata_conv);
989 
990  handle_stream_probing(st);
992 
993  avio_seek(pb, data_ofs, SEEK_SET);
994 
995  set_spdif(s, wav);
996  set_max_size(st, wav);
997 
998  return 0;
999 }
1000 
1001 static const AVClass w64_demuxer_class = {
1002  .class_name = "W64 demuxer",
1003  .item_name = av_default_item_name,
1005  .version = LIBAVUTIL_VERSION_INT,
1006 };
1007 
1008 const FFInputFormat ff_w64_demuxer = {
1009  .p.name = "w64",
1010  .p.long_name = NULL_IF_CONFIG_SMALL("Sony Wave64"),
1011  .p.flags = AVFMT_GENERIC_INDEX,
1012  .p.codec_tag = ff_wav_codec_tags_list,
1013  .p.priv_class = &w64_demuxer_class,
1014  .priv_data_size = sizeof(WAVDemuxContext),
1015  .read_probe = w64_probe,
1016  .read_header = w64_read_header,
1017  .read_packet = wav_read_packet,
1018  .read_seek = wav_read_seek,
1019 };
1020 #endif /* CONFIG_W64_DEMUXER */
avpriv_new_chapter
AVChapter * avpriv_new_chapter(AVFormatContext *s, int64_t id, AVRational time_base, int64_t start, int64_t end, const char *title)
Add a new chapter.
Definition: demux_utils.c:42
WAVDemuxContext
Definition: wavdec.c:50
AV_CODEC_ID_PCM_S16LE
@ AV_CODEC_ID_PCM_S16LE
Definition: codec_id.h:328
WAVDemuxContext::unaligned
int unaligned
Definition: wavdec.c:66
WAVDemuxContext::smv_block
int smv_block
Definition: wavdec.c:58
AV_LOG_WARNING
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:186
AV_CODEC_ID_ADPCM_MS
@ AV_CODEC_ID_ADPCM_MS
Definition: codec_id.h:373
AVCodecParameters::extradata
uint8_t * extradata
Extra binary data needed for initializing the decoder, codec-dependent.
Definition: codec_par.h:69
AV_CODEC_ID_AC3
@ AV_CODEC_ID_AC3
Definition: codec_id.h:443
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
opt.h
pcm.h
AVCodecParameters::codec_type
enum AVMediaType codec_type
General type of the encoded data.
Definition: codec_par.h:51
AV_WL32
#define AV_WL32(p, v)
Definition: intreadwrite.h:424
av_compare_ts
int av_compare_ts(int64_t ts_a, AVRational tb_a, int64_t ts_b, AVRational tb_b)
Compare two timestamps each in its own time base.
Definition: mathematics.c:147
W64_DEMUXER_OPTIONS_OFFSET
#define W64_DEMUXER_OPTIONS_OFFSET
avformat_new_stream
AVStream * avformat_new_stream(AVFormatContext *s, const struct AVCodec *c)
Add a new stream to a media file.
AVERROR_EOF
#define AVERROR_EOF
End of file.
Definition: error.h:57
WAVDemuxContext::smv_data_ofs
int64_t smv_data_ofs
Definition: wavdec.c:55
audio_dts
int64_t audio_dts
Definition: movenc.c:61
WAVDemuxContext::smv_frames_per_jpeg
int smv_frames_per_jpeg
Definition: wavdec.c:57
id3v2.h
WAVDemuxContext::max_size
int max_size
Definition: wavdec.c:63
internal.h
AVOption
AVOption.
Definition: opt.h:346
ff_id3v2_read
void ff_id3v2_read(AVFormatContext *s, const char *magic, ID3v2ExtraMeta **extra_meta, unsigned int max_search_size)
Read an ID3v2 tag, including supported extra metadata.
Definition: id3v2.c:1139
AVMetadataConv
Definition: metadata.h:34
ff_get_wav_header
int ff_get_wav_header(void *logctx, AVIOContext *pb, AVCodecParameters *par, int size, int big_endian)
Definition: riffdec.c:94
AVPacket::duration
int64_t duration
Duration of this packet in AVStream->time_base units, 0 if unknown.
Definition: packet.h:540
mathematics.h
AVProbeData::buf_size
int buf_size
Size of buf except extra allocated bytes.
Definition: avformat.h:454
AVChannelLayout::order
enum AVChannelOrder order
Channel order used in this layout.
Definition: channel_layout.h:308
FFMAX
#define FFMAX(a, b)
Definition: macros.h:47
AVChannelLayout::nb_channels
int nb_channels
Number of channels in this layout.
Definition: channel_layout.h:313
avio_size
int64_t avio_size(AVIOContext *s)
Get the filesize.
Definition: aviobuf.c:322
sample_rate
sample_rate
Definition: ffmpeg_filter.c:410
WAVDemuxContext::data_end
int64_t data_end
Definition: wavdec.c:52
video_dts
int64_t video_dts
Definition: movenc.c:61
av_malloc
#define av_malloc(s)
Definition: tableprint_vlc.h:30
WAVDemuxContext::w64
int w64
Definition: wavdec.c:53
ff_get_extradata
int ff_get_extradata(void *logctx, AVCodecParameters *par, AVIOContext *pb, int size)
Allocate extradata with additional AV_INPUT_BUFFER_PADDING_SIZE at end which is always set to 0 and f...
Definition: demux_utils.c:335
AVPROBE_SCORE_MAX
#define AVPROBE_SCORE_MAX
maximum score
Definition: avformat.h:463
return
these buffered frames must be flushed immediately if a new input produces new the filter must not call request_frame to get more It must just process the frame or queue it The task of requesting more frames is left to the filter s request_frame method or the application If a filter has several the filter must be ready for frames arriving randomly on any input any filter with several inputs will most likely require some kind of queuing mechanism It is perfectly acceptable to have a limited queue and to drop frames when the inputs are too unbalanced request_frame For filters that do not use the this method is called when a frame is wanted on an output For a it should directly call filter_frame on the corresponding output For a if there are queued frames already one of these frames should be pushed If the filter should request a frame on one of its repeatedly until at least one frame has been pushed Return or at least make progress towards producing a it should return
Definition: filter_design.txt:264
avpriv_set_pts_info
void avpriv_set_pts_info(AVStream *st, int pts_wrap_bits, unsigned int pts_num, unsigned int pts_den)
Set the time base and wrapping info for a given stream.
Definition: avformat.c:853
ff_w64_guid_summarylist
const uint8_t ff_w64_guid_summarylist[16]
Definition: w64.c:47
ff_wav_demuxer
const FFInputFormat ff_wav_demuxer
ffstream
static av_always_inline FFStream * ffstream(AVStream *st)
Definition: internal.h:417
read_seek
static int read_seek(AVFormatContext *ctx, int stream_index, int64_t timestamp, int flags)
Definition: libcdio.c:151
avio_tell
static av_always_inline int64_t avio_tell(AVIOContext *s)
ftell() equivalent for AVIOContext.
Definition: avio.h:494
AVFMT_GENERIC_INDEX
#define AVFMT_GENERIC_INDEX
Use generic index building code.
Definition: avformat.h:480
demux_options
static const AVOption demux_options[]
Definition: wavdec.c:72
AV_CODEC_ID_MP3
@ AV_CODEC_ID_MP3
preferred ID for decoding MPEG audio layer 1, 2 or 3
Definition: codec_id.h:441
AVStream::duration
int64_t duration
Decoding: duration of the stream, in stream time base.
Definition: avformat.h:802
avio_rl16
unsigned int avio_rl16(AVIOContext *s)
Definition: aviobuf.c:713
ff_id3v2_parse_chapters
int ff_id3v2_parse_chapters(AVFormatContext *s, ID3v2ExtraMeta *cur)
Create chapters for all CHAP tags found in the ID3v2 header.
Definition: id3v2.c:1192
AV_DICT_DONT_STRDUP_VAL
#define AV_DICT_DONT_STRDUP_VAL
Take ownership of a value that's been allocated with av_malloc() or another memory allocation functio...
Definition: dict.h:79
av_get_bits_per_sample
int av_get_bits_per_sample(enum AVCodecID codec_id)
Return codec bits per sample.
Definition: utils.c:547
avassert.h
avio_rb32
unsigned int avio_rb32(AVIOContext *s)
Definition: aviobuf.c:760
pkt
AVPacket * pkt
Definition: movenc.c:59
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:180
ID3v2ExtraMeta
Definition: id3v2.h:84
read_packet
static int read_packet(void *opaque, uint8_t *buf, int buf_size)
Definition: avio_read_callback.c:41
avio_get_str16le
int avio_get_str16le(AVIOContext *pb, int maxlen, char *buf, int buflen)
Read a UTF-16 string from pb and convert it to UTF-8.
FF_ARG_GUID
#define FF_ARG_GUID(g)
Definition: riff.h:109
intreadwrite.h
s
#define s(width, name)
Definition: cbs_vp9.c:198
AV_CODEC_ID_XMA1
@ AV_CODEC_ID_XMA1
Definition: codec_id.h:519
AVInputFormat::name
const char * name
A comma separated list of short names for the format.
Definition: avformat.h:553
AVProbeData::buf
unsigned char * buf
Buffer must have AVPROBE_PADDING_SIZE of extra allocated bytes filled with zero.
Definition: avformat.h:453
AVMEDIA_TYPE_AUDIO
@ AVMEDIA_TYPE_AUDIO
Definition: avutil.h:202
AVCodecParameters::width
int width
Video only.
Definition: codec_par.h:134
AV_CODEC_ID_MP2
@ AV_CODEC_ID_MP2
Definition: codec_id.h:440
AV_CHANNEL_ORDER_UNSPEC
@ AV_CHANNEL_ORDER_UNSPEC
Only the channel count is specified, without any further information about the channel order.
Definition: channel_layout.h:112
av_assert0
#define av_assert0(cond)
assert() equivalent, that is always enabled.
Definition: avassert.h:40
AV_LOG_DEBUG
#define AV_LOG_DEBUG
Stuff which is only useful for libav* developers.
Definition: log.h:201
AV_CODEC_ID_PCM_F24LE
@ AV_CODEC_ID_PCM_F24LE
Definition: codec_id.h:362
channels
channels
Definition: aptx.h:31
AV_RL16
uint64_t_TMPL AV_WL64 unsigned int_TMPL AV_WL32 unsigned int_TMPL AV_WL24 unsigned int_TMPL AV_RL16
Definition: bytestream.h:94
av_rescale_q
int64_t av_rescale_q(int64_t a, AVRational bq, AVRational cq)
Rescale a 64-bit integer by 2 rational numbers.
Definition: mathematics.c:142
ff_read_riff_info
int ff_read_riff_info(AVFormatContext *s, int64_t size)
Definition: riffdec.c:242
key
const char * key
Definition: hwcontext_opencl.c:189
if
if(ret)
Definition: filter_design.txt:179
FFStream::need_parsing
enum AVStreamParseType need_parsing
Definition: internal.h:386
AVFormatContext
Format I/O context.
Definition: avformat.h:1255
AVStream::codecpar
AVCodecParameters * codecpar
Codec parameters associated with this stream.
Definition: avformat.h:766
LIBAVUTIL_VERSION_INT
#define LIBAVUTIL_VERSION_INT
Definition: version.h:85
read_header
static int read_header(FFV1Context *f)
Definition: ffv1dec.c:550
AVClass
Describe the class of an AVClass context structure.
Definition: log.h:66
fabs
static __device__ float fabs(float a)
Definition: cuda_runtime.h:182
AVStream::time_base
AVRational time_base
This is the fundamental unit of time (in seconds) in terms of which frame timestamps are represented.
Definition: avformat.h:782
NULL
#define NULL
Definition: coverity.c:32
ff_pcm_default_packet_size
int ff_pcm_default_packet_size(AVCodecParameters *par)
Definition: pcm.c:29
AVRational
Rational number (pair of numerator and denominator).
Definition: rational.h:58
av_default_item_name
const char * av_default_item_name(void *ptr)
Return the context name.
Definition: log.c:237
ff_id3v2_parse_apic
int ff_id3v2_parse_apic(AVFormatContext *s, ID3v2ExtraMeta *extra_meta)
Create a stream for each APIC (attached picture) extracted from the ID3v2 header.
Definition: id3v2.c:1161
avio_rb64
uint64_t avio_rb64(AVIOContext *s)
Definition: aviobuf.c:907
AVProbeData
This structure contains the data a format has to probe a file.
Definition: avformat.h:451
AVCodecParameters::ch_layout
AVChannelLayout ch_layout
Audio only.
Definition: codec_par.h:180
AVPROBE_SCORE_EXTENSION
#define AVPROBE_SCORE_EXTENSION
score for file extension
Definition: avformat.h:461
AVCodecParameters::sample_rate
int sample_rate
Audio only.
Definition: codec_par.h:184
AVCodecID
AVCodecID
Identify the syntax and semantics of the bitstream.
Definition: codec_id.h:49
ff_w64_guid_fmt
const uint8_t ff_w64_guid_fmt[16]
Definition: w64.c:33
AVCodecParameters::extradata_size
int extradata_size
Size of the extradata content in bytes.
Definition: codec_par.h:73
WAVDemuxContext::smv_last_stream
int smv_last_stream
Definition: wavdec.c:59
av_get_exact_bits_per_sample
int av_get_exact_bits_per_sample(enum AVCodecID codec_id)
Return codec bits per sample.
Definition: utils.c:454
avio_rl32
unsigned int avio_rl32(AVIOContext *s)
Definition: aviobuf.c:729
AVIOContext
Bytestream IO Context.
Definition: avio.h:160
AV_CODEC_ID_PCM_S24LE
@ AV_CODEC_ID_PCM_S24LE
Definition: codec_id.h:340
NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:106
DEC
#define DEC
Definition: wavdec.c:71
AVIOContext::seekable
int seekable
A combination of AVIO_SEEKABLE_ flags or 0 when the stream is not seekable.
Definition: avio.h:261
FFStream
Definition: internal.h:193
ff_spdif_probe
int ff_spdif_probe(const uint8_t *p_buf, int buf_size, enum AVCodecID *codec)
Definition: spdifdec.c:122
WAVDemuxContext::smv_eof
int smv_eof
Definition: wavdec.c:60
AV_CODEC_ID_DTS
@ AV_CODEC_ID_DTS
Definition: codec_id.h:444
avio_get_str
int avio_get_str(AVIOContext *pb, int maxlen, char *buf, int buflen)
Read a string from pb into buf.
Definition: aviobuf.c:865
size
int size
Definition: twinvq_data.h:10344
AV_CODEC_ID_SMVJPEG
@ AV_CODEC_ID_SMVJPEG
Definition: codec_id.h:264
avio.h
ID3v2_DEFAULT_MAGIC
#define ID3v2_DEFAULT_MAGIC
Default magic bytes for ID3v2 header: "ID3".
Definition: id3v2.h:35
AV_NOPTS_VALUE
#define AV_NOPTS_VALUE
Undefined timestamp value.
Definition: avutil.h:248
ff_riff_info_conv
const AVMetadataConv ff_riff_info_conv[]
Definition: riff.c:621
FFInputFormat::p
AVInputFormat p
The public AVInputFormat.
Definition: demux.h:41
avio_r8
int avio_r8(AVIOContext *s)
Definition: aviobuf.c:602
ffio_ensure_seekback
int ffio_ensure_seekback(AVIOContext *s, int64_t buf_size)
Ensures that the requested seekback buffer size will be available.
Definition: aviobuf.c:1022
offset
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf offset
Definition: writing_filters.txt:86
version
version
Definition: libkvazaar.c:321
FFStream::probe_packets
int probe_packets
Number of packets to buffer for codec probing.
Definition: internal.h:383
ff_spdif_read_packet
int ff_spdif_read_packet(AVFormatContext *s, AVPacket *pkt)
Definition: spdifdec.c:189
filesize
static int64_t filesize(AVIOContext *pb)
Definition: ffmpeg_mux.c:51
set_max_size
static void set_max_size(AVStream *st, WAVDemuxContext *wav)
Definition: wavdec.c:81
WAVDemuxContext::rifx
int rifx
Definition: wavdec.c:67
log.h
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:255
AVPacket::pts
int64_t pts
Presentation timestamp in AVStream->time_base units; the time at which the decompressed packet will b...
Definition: packet.h:515
avio_rl24
unsigned int avio_rl24(AVIOContext *s)
Definition: aviobuf.c:721
avio_internal.h
WAVDemuxContext::audio_eof
int audio_eof
Definition: wavdec.c:61
ff_w64_guid_wave
const uint8_t ff_w64_guid_wave[16]
Definition: w64.c:28
AVCodecParameters::height
int height
Definition: codec_par.h:135
AVCodecParameters::block_align
int block_align
Audio only.
Definition: codec_par.h:191
WAVDemuxContext::smv_block_size
int smv_block_size
Definition: wavdec.c:56
value
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf default value
Definition: writing_filters.txt:86
FFMIN
#define FFMIN(a, b)
Definition: macros.h:49
tb
#define tb
Definition: regdef.h:68
demux.h
AV_CODEC_ID_PCM_F16LE
@ AV_CODEC_ID_PCM_F16LE
Definition: codec_id.h:361
ff_w64_guid_fact
const uint8_t ff_w64_guid_fact[16]
Definition: w64.c:38
len
int len
Definition: vorbis_enc_data.h:426
av_get_packet
int av_get_packet(AVIOContext *s, AVPacket *pkt, int size)
Allocate and read the payload of a packet and initialize its fields with default values.
Definition: utils.c:103
av_uninit
#define av_uninit(x)
Definition: attributes.h:154
tag
uint32_t tag
Definition: movenc.c:1786
AVStream::id
int id
Format-specific stream ID.
Definition: avformat.h:755
ret
ret
Definition: filter_design.txt:187
AVStream
Stream structure.
Definition: avformat.h:743
WAVDemuxContext::spdif
int spdif
Definition: wavdec.c:64
avio_seek
int64_t avio_seek(AVIOContext *s, int64_t offset, int whence)
fseek() equivalent for AVIOContext.
Definition: aviobuf.c:230
AVClass::class_name
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass...
Definition: log.h:71
ff_pcm_read_seek
int ff_pcm_read_seek(AVFormatContext *s, int stream_index, int64_t timestamp, int flags)
Definition: pcm.c:73
metadata.h
pos
unsigned int pos
Definition: spdifenc.c:413
avformat.h
dict.h
AV_INPUT_BUFFER_PADDING_SIZE
#define AV_INPUT_BUFFER_PADDING_SIZE
Definition: defs.h:40
id
enum AVCodecID id
Definition: dts2pts.c:364
left
Tag MUST be and< 10hcoeff half pel interpolation filter coefficients, hcoeff[0] are the 2 middle coefficients[1] are the next outer ones and so on, resulting in a filter like:...eff[2], hcoeff[1], hcoeff[0], hcoeff[0], hcoeff[1], hcoeff[2] ... the sign of the coefficients is not explicitly stored but alternates after each coeff and coeff[0] is positive, so ...,+,-,+,-,+,+,-,+,-,+,... hcoeff[0] is not explicitly stored but found by subtracting the sum of all stored coefficients with signs from 32 hcoeff[0]=32 - hcoeff[1] - hcoeff[2] - ... a good choice for hcoeff and htaps is htaps=6 hcoeff={40,-10, 2} an alternative which requires more computations at both encoder and decoder side and may or may not be better is htaps=8 hcoeff={42,-14, 6,-2}ref_frames minimum of the number of available reference frames and max_ref_frames for example the first frame after a key frame always has ref_frames=1spatial_decomposition_type wavelet type 0 is a 9/7 symmetric compact integer wavelet 1 is a 5/3 symmetric compact integer wavelet others are reserved stored as delta from last, last is reset to 0 if always_reset||keyframeqlog quality(logarithmic quantizer scale) stored as delta from last, last is reset to 0 if always_reset||keyframemv_scale stored as delta from last, last is reset to 0 if always_reset||keyframe FIXME check that everything works fine if this changes between framesqbias dequantization bias stored as delta from last, last is reset to 0 if always_reset||keyframeblock_max_depth maximum depth of the block tree stored as delta from last, last is reset to 0 if always_reset||keyframequant_table quantization tableHighlevel bitstream structure:==============================--------------------------------------------|Header|--------------------------------------------|------------------------------------|||Block0||||split?||||yes no||||......... intra?||||:Block01 :yes no||||:Block02 :....... 
..........||||:Block03 ::y DC ::ref index:||||:Block04 ::cb DC ::motion x :||||......... :cr DC ::motion y :||||....... ..........|||------------------------------------||------------------------------------|||Block1|||...|--------------------------------------------|------------ ------------ ------------|||Y subbands||Cb subbands||Cr subbands||||--- ---||--- ---||--- ---|||||LL0||HL0||||LL0||HL0||||LL0||HL0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||LH0||HH0||||LH0||HH0||||LH0||HH0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HL1||LH1||||HL1||LH1||||HL1||LH1|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HH1||HL2||||HH1||HL2||||HH1||HL2|||||...||...||...|||------------ ------------ ------------|--------------------------------------------Decoding process:=================------------|||Subbands|------------||||------------|Intra DC||||LL0 subband prediction ------------|\ Dequantization ------------------- \||Reference frames|\ IDWT|------- -------|Motion \|||Frame 0||Frame 1||Compensation . OBMC v -------|------- -------|--------------. \------> Frame n output Frame Frame<----------------------------------/|...|------------------- Range Coder:============Binary Range Coder:------------------- The implemented range coder is an adapted version based upon "Range encoding: an algorithm for removing redundancy from a digitised message." by G. N. N. Martin. The symbols encoded by the Snow range coder are bits(0|1). The associated probabilities are not fix but change depending on the symbol mix seen so far. 
bit seen|new state ---------+----------------------------------------------- 0|256 - state_transition_table[256 - old_state];1|state_transition_table[old_state];state_transition_table={ 0, 0, 0, 0, 0, 0, 0, 0, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 190, 191, 192, 194, 194, 195, 196, 197, 198, 199, 200, 201, 202, 202, 204, 205, 206, 207, 208, 209, 209, 210, 211, 212, 213, 215, 215, 216, 217, 218, 219, 220, 220, 222, 223, 224, 225, 226, 227, 227, 229, 229, 230, 231, 232, 234, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 248, 0, 0, 0, 0, 0, 0, 0};FIXME Range Coding of integers:------------------------- FIXME Neighboring Blocks:===================left and top are set to the respective blocks unless they are outside of the image in which case they are set to the Null block top-left is set to the top left block unless it is outside of the image in which case it is set to the left block if this block has no larger parent block or it is at the left side of its parent block and the top right block is not outside of the image then the top right block is used for top-right else the top-left block is used Null block y, cb, cr are 128 level, ref, mx and my are 0 Motion Vector 
Prediction:=========================1. the motion vectors of all the neighboring blocks are scaled to compensate for the difference of reference frames scaled_mv=(mv *(256 *(current_reference+1)/(mv.reference+1))+128)> the median of the scaled left
Definition: snow.txt:386
av_sat_add64
#define av_sat_add64
Definition: common.h:140
set_spdif
static void set_spdif(AVFormatContext *s, WAVDemuxContext *wav)
Definition: wavdec.c:89
AVStream::index
int index
stream index in AVFormatContext
Definition: avformat.h:749
WAVDemuxContext::smv_given_first
int smv_given_first
Definition: wavdec.c:65
AV_CODEC_ID_G729
@ AV_CODEC_ID_G729
Definition: codec_id.h:493
w64.h
WAVDemuxContext::ignore_length
int ignore_length
Definition: wavdec.c:62
AVIO_SEEKABLE_NORMAL
#define AVIO_SEEKABLE_NORMAL
Seeking works like for a local file.
Definition: avio.h:41
AV_OPT_TYPE_INT
@ AV_OPT_TYPE_INT
Definition: opt.h:235
av_channel_layout_uninit
void av_channel_layout_uninit(AVChannelLayout *channel_layout)
Free any allocated data in the channel layout and reset the channel count to 0.
Definition: channel_layout.c:432
avio_read
int avio_read(AVIOContext *s, unsigned char *buf, int size)
Read size bytes from AVIOContext into buf.
Definition: aviobuf.c:611
temp
else temp
Definition: vf_mcdeint.c:263
AVSTREAM_PARSE_FULL_RAW
@ AVSTREAM_PARSE_FULL_RAW
full parsing and repack with timestamp and position generation by parser for raw this assumes that ea...
Definition: avformat.h:597
OFFSET
#define OFFSET(x)
Definition: wavdec.c:70
samples
Filter the word “frame” indicates either a video frame or a group of audio samples
Definition: filter_design.txt:8
AVPacket::stream_index
int stream_index
Definition: packet.h:524
avio_skip
int64_t avio_skip(AVIOContext *s, int64_t offset)
Skip given number of bytes forward.
Definition: aviobuf.c:317
AVMEDIA_TYPE_VIDEO
@ AVMEDIA_TYPE_VIDEO
Definition: avutil.h:201
read_probe
static int read_probe(const AVProbeData *p)
Definition: cdg.c:30
ff_w64_guid_data
const uint8_t ff_w64_guid_data[16]
Definition: w64.c:42
AV_CODEC_ID_PCM_S32LE
@ AV_CODEC_ID_PCM_S32LE
Definition: codec_id.h:336
AVCodecParameters::bits_per_coded_sample
int bits_per_coded_sample
The number of bits per sample in the coded words.
Definition: codec_par.h:110
find_guid
static const GUIDParseTable * find_guid(ff_asf_guid guid)
Definition: asfdec_o.c:1545
AV_CODEC_ID_XMA2
@ AV_CODEC_ID_XMA2
Definition: codec_id.h:520
FFStream::request_probe
int request_probe
stream probing state -1 -> probing finished 0 -> no probing requested rest -> perform probing with re...
Definition: internal.h:263
ff_w64_guid_riff
const uint8_t ff_w64_guid_riff[16]
Definition: w64.c:23
av_free
#define av_free(p)
Definition: tableprint_vlc.h:33
FFALIGN
#define FFALIGN(x, a)
Definition: macros.h:78
AVCodecParameters::codec_id
enum AVCodecID codec_id
Specific type of the encoded data (the codec used).
Definition: codec_par.h:55
AVPacket
This structure stores compressed data.
Definition: packet.h:499
AV_OPT_TYPE_BOOL
@ AV_OPT_TYPE_BOOL
Definition: opt.h:251
av_dict_set
int av_dict_set(AVDictionary **pm, const char *key, const char *value, int flags)
Set the given entry in *pm, overwriting an existing entry.
Definition: dict.c:88
riff.h
ff_id3v2_free_extra_meta
void ff_id3v2_free_extra_meta(ID3v2ExtraMeta **extra_meta)
Free memory allocated parsing special (non-text) metadata.
Definition: id3v2.c:1145
FFStream::cur_dts
int64_t cur_dts
Definition: internal.h:410
AVPacket::pos
int64_t pos
byte position in stream, -1 if unknown
Definition: packet.h:542
FFInputFormat
Definition: demux.h:37
avio_rl64
uint64_t avio_rl64(AVIOContext *s)
Definition: aviobuf.c:737
int32_t
int32_t
Definition: audioconvert.c:56
flags
#define flags(name, subs,...)
Definition: cbs_av1.c:474
AVCodecParameters::bit_rate
int64_t bit_rate
The average bitrate of the encoded data (in bits per second).
Definition: codec_par.h:97
ff_id3v2_parse_priv
int ff_id3v2_parse_priv(AVFormatContext *s, ID3v2ExtraMeta *extra_meta)
Add metadata for all PRIV tags in the ID3v2 header.
Definition: id3v2.c:1257
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:27
AVERROR_INVALIDDATA
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:61
MKTAG
#define MKTAG(a, b, c, d)
Definition: macros.h:55
ffio_read_size
int ffio_read_size(AVIOContext *s, unsigned char *buf, int size)
Read size bytes from AVIOContext into buf.
Definition: aviobuf.c:661
FF_SANE_NB_CHANNELS
#define FF_SANE_NB_CHANNELS
Definition: internal.h:37
snprintf
#define snprintf
Definition: snprintf.h:34
WAVDemuxContext::vst
AVStream * vst
Definition: wavdec.c:54
ff_w64_demuxer
const FFInputFormat ff_w64_demuxer
spdif.h
FF_PRI_GUID
#define FF_PRI_GUID
Definition: riff.h:105
ff_wav_codec_tags_list
const AVCodecTag *const ff_wav_codec_tags_list[]
ff_metadata_conv_ctx
void ff_metadata_conv_ctx(AVFormatContext *ctx, const AVMetadataConv *d_conv, const AVMetadataConv *s_conv)
Definition: metadata.c:59
av_fourcc2str
#define av_fourcc2str(fourcc)
Definition: avutil.h:345
ff_alloc_extradata
int ff_alloc_extradata(AVCodecParameters *par, int size)
Allocate extradata with additional AV_INPUT_BUFFER_PADDING_SIZE at end which is always set to 0.
Definition: utils.c:239
avio_feof
int avio_feof(AVIOContext *s)
Similar to feof() but also returns nonzero on read errors.
Definition: aviobuf.c:345