| /* |
| * Copyright (c) 2012 Justin Ruggles |
| * |
| * This file is part of FFmpeg. |
| * |
| * FFmpeg is free software; you can redistribute it and/or |
| * modify it under the terms of the GNU Lesser General Public |
| * License as published by the Free Software Foundation; either |
| * version 2.1 of the License, or (at your option) any later version. |
| * |
| * FFmpeg is distributed in the hope that it will be useful, |
| * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| * Lesser General Public License for more details. |
| * |
| * You should have received a copy of the GNU Lesser General Public |
| * License along with FFmpeg; if not, write to the Free Software |
| * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
| */ |
| |
| /** |
| * @file |
| * Vorbis audio parser |
| * |
| * Determines the duration for each packet. |
| */ |
| |
| #include "libavutil/log.h" |
| |
| #include "get_bits.h" |
| #include "parser.h" |
| #include "xiph.h" |
| #include "vorbis_parser_internal.h" |
| |
| static const AVClass vorbis_parser_class = { |
| .class_name = "Vorbis parser", |
| .item_name = av_default_item_name, |
| .version = LIBAVUTIL_VERSION_INT, |
| }; |
| |
| static int parse_id_header(AVVorbisParseContext *s, |
| const uint8_t *buf, int buf_size) |
| { |
| /* Id header should be 30 bytes */ |
| if (buf_size < 30) { |
| av_log(s, AV_LOG_ERROR, "Id header is too short\n"); |
| return AVERROR_INVALIDDATA; |
| } |
| |
| /* make sure this is the Id header */ |
| if (buf[0] != 1) { |
| av_log(s, AV_LOG_ERROR, "Wrong packet type in Id header\n"); |
| return AVERROR_INVALIDDATA; |
| } |
| |
| /* check for header signature */ |
| if (memcmp(&buf[1], "vorbis", 6)) { |
| av_log(s, AV_LOG_ERROR, "Invalid packet signature in Id header\n"); |
| return AVERROR_INVALIDDATA; |
| } |
| |
| if (!(buf[29] & 0x1)) { |
| av_log(s, AV_LOG_ERROR, "Invalid framing bit in Id header\n"); |
| return AVERROR_INVALIDDATA; |
| } |
| |
| s->blocksize[0] = 1 << (buf[28] & 0xF); |
| s->blocksize[1] = 1 << (buf[28] >> 4); |
| |
| return 0; |
| } |
| |
| static int parse_setup_header(AVVorbisParseContext *s, |
| const uint8_t *buf, int buf_size) |
| { |
| GetBitContext gb, gb0; |
| uint8_t *rev_buf; |
| int i, ret = 0; |
| int got_framing_bit, mode_count, got_mode_header, last_mode_count = 0; |
| |
| /* avoid overread */ |
| if (buf_size < 7) { |
| av_log(s, AV_LOG_ERROR, "Setup header is too short\n"); |
| return AVERROR_INVALIDDATA; |
| } |
| |
| /* make sure this is the Setup header */ |
| if (buf[0] != 5) { |
| av_log(s, AV_LOG_ERROR, "Wrong packet type in Setup header\n"); |
| return AVERROR_INVALIDDATA; |
| } |
| |
| /* check for header signature */ |
| if (memcmp(&buf[1], "vorbis", 6)) { |
| av_log(s, AV_LOG_ERROR, "Invalid packet signature in Setup header\n"); |
| return AVERROR_INVALIDDATA; |
| } |
| |
| /* reverse bytes so we can easily read backwards with get_bits() */ |
| if (!(rev_buf = av_malloc(buf_size))) { |
| av_log(s, AV_LOG_ERROR, "Out of memory\n"); |
| return AVERROR(ENOMEM); |
| } |
| for (i = 0; i < buf_size; i++) |
| rev_buf[i] = buf[buf_size - 1 - i]; |
| init_get_bits(&gb, rev_buf, buf_size * 8); |
| |
| got_framing_bit = 0; |
| while (get_bits_left(&gb) > 97) { |
| if (get_bits1(&gb)) { |
| got_framing_bit = get_bits_count(&gb); |
| break; |
| } |
| } |
| if (!got_framing_bit) { |
| av_log(s, AV_LOG_ERROR, "Invalid Setup header\n"); |
| ret = AVERROR_INVALIDDATA; |
| goto bad_header; |
| } |
| |
| /* Now we search backwards to find possible valid mode counts. This is not |
| * fool-proof because we could have false positive matches and read too |
| * far, but there isn't really any way to be sure without parsing through |
| * all the many variable-sized fields before the modes. This approach seems |
| * to work well in testing, and it is similar to how it is handled in |
| * liboggz. */ |
| mode_count = 0; |
| got_mode_header = 0; |
| while (get_bits_left(&gb) >= 97) { |
| if (get_bits(&gb, 8) > 63 || get_bits(&gb, 16) || get_bits(&gb, 16)) |
| break; |
| skip_bits(&gb, 1); |
| mode_count++; |
| if (mode_count > 64) |
| break; |
| gb0 = gb; |
| if (get_bits(&gb0, 6) + 1 == mode_count) { |
| got_mode_header = 1; |
| last_mode_count = mode_count; |
| } |
| } |
| if (!got_mode_header) { |
| av_log(s, AV_LOG_ERROR, "Invalid Setup header\n"); |
| ret = AVERROR_INVALIDDATA; |
| goto bad_header; |
| } |
| /* All samples I've seen use <= 2 modes, so ask for a sample if we find |
| * more than that, as it is most likely a false positive. If we get any |
| * we may need to approach this the long way and parse the whole Setup |
| * header, but I hope very much that it never comes to that. */ |
| if (last_mode_count > 2) { |
| avpriv_request_sample(s, |
| "%d modes (either a false positive or a " |
| "sample from an unknown encoder)", |
| last_mode_count); |
| } |
| /* We're limiting the mode count to 63 so that we know that the previous |
| * block flag will be in the first packet byte. */ |
| if (last_mode_count > 63) { |
| av_log(s, AV_LOG_ERROR, "Unsupported mode count: %d\n", |
| last_mode_count); |
| ret = AVERROR_INVALIDDATA; |
| goto bad_header; |
| } |
| s->mode_count = mode_count = last_mode_count; |
| /* Determine the number of bits required to code the mode and turn that |
| * into a bitmask to directly access the mode from the first frame byte. */ |
| s->mode_mask = ((1 << (av_log2(mode_count - 1) + 1)) - 1) << 1; |
| /* The previous window flag is the next bit after the mode */ |
| s->prev_mask = (s->mode_mask | 0x1) + 1; |
| |
| init_get_bits(&gb, rev_buf, buf_size * 8); |
| skip_bits_long(&gb, got_framing_bit); |
| for (i = mode_count - 1; i >= 0; i--) { |
| skip_bits_long(&gb, 40); |
| s->mode_blocksize[i] = get_bits1(&gb); |
| } |
| |
| bad_header: |
| av_free(rev_buf); |
| return ret; |
| } |
| |
| static int vorbis_parse_init(AVVorbisParseContext *s, |
| const uint8_t *extradata, int extradata_size) |
| { |
| const uint8_t *header_start[3]; |
| int header_len[3]; |
| int ret; |
| |
| s->class = &vorbis_parser_class; |
| s->extradata_parsed = 1; |
| |
| if ((ret = avpriv_split_xiph_headers(extradata, |
| extradata_size, 30, |
| header_start, header_len)) < 0) { |
| av_log(s, AV_LOG_ERROR, "Extradata corrupt.\n"); |
| return ret; |
| } |
| |
| if ((ret = parse_id_header(s, header_start[0], header_len[0])) < 0) |
| return ret; |
| |
| if ((ret = parse_setup_header(s, header_start[2], header_len[2])) < 0) |
| return ret; |
| |
| s->valid_extradata = 1; |
| s->previous_blocksize = s->blocksize[s->mode_blocksize[0]]; |
| |
| return 0; |
| } |
| |
| int av_vorbis_parse_frame_flags(AVVorbisParseContext *s, const uint8_t *buf, |
| int buf_size, int *flags) |
| { |
| int duration = 0; |
| |
| if (s->valid_extradata && buf_size > 0) { |
| int mode, current_blocksize; |
| int previous_blocksize = s->previous_blocksize; |
| |
| if (buf[0] & 1) { |
| /* If the user doesn't care about special packets, it's a bad one. */ |
| if (!flags) |
| goto bad_packet; |
| |
| /* Set the flag for which kind of special packet it is. */ |
| if (buf[0] == 1) |
| *flags |= VORBIS_FLAG_HEADER; |
| else if (buf[0] == 3) |
| *flags |= VORBIS_FLAG_COMMENT; |
| else if (buf[0] == 5) |
| *flags |= VORBIS_FLAG_SETUP; |
| else |
| goto bad_packet; |
| |
| /* Special packets have no duration. */ |
| return 0; |
| |
| bad_packet: |
| av_log(s, AV_LOG_ERROR, "Invalid packet\n"); |
| return AVERROR_INVALIDDATA; |
| } |
| if (s->mode_count == 1) |
| mode = 0; |
| else |
| mode = (buf[0] & s->mode_mask) >> 1; |
| if (mode >= s->mode_count) { |
| av_log(s, AV_LOG_ERROR, "Invalid mode in packet\n"); |
| return AVERROR_INVALIDDATA; |
| } |
| if(s->mode_blocksize[mode]){ |
| int flag = !!(buf[0] & s->prev_mask); |
| previous_blocksize = s->blocksize[flag]; |
| } |
| current_blocksize = s->blocksize[s->mode_blocksize[mode]]; |
| duration = (previous_blocksize + current_blocksize) >> 2; |
| s->previous_blocksize = current_blocksize; |
| } |
| |
| return duration; |
| } |
| |
| int av_vorbis_parse_frame(AVVorbisParseContext *s, const uint8_t *buf, |
| int buf_size) |
| { |
| return av_vorbis_parse_frame_flags(s, buf, buf_size, NULL); |
| } |
| |
| void av_vorbis_parse_reset(AVVorbisParseContext *s) |
| { |
| if (s->valid_extradata) |
| s->previous_blocksize = s->blocksize[0]; |
| } |
| |
| void av_vorbis_parse_free(AVVorbisParseContext **s) |
| { |
| av_freep(s); |
| } |
| |
| AVVorbisParseContext *av_vorbis_parse_init(const uint8_t *extradata, |
| int extradata_size) |
| { |
| AVVorbisParseContext *s = av_mallocz(sizeof(*s)); |
| int ret; |
| |
| if (!s) |
| return NULL; |
| |
| ret = vorbis_parse_init(s, extradata, extradata_size); |
| if (ret < 0) { |
| av_vorbis_parse_free(&s); |
| return NULL; |
| } |
| |
| return s; |
| } |
| |
| #if CONFIG_VORBIS_PARSER |
| |
| typedef struct VorbisParseContext { |
| AVVorbisParseContext *vp; |
| } VorbisParseContext; |
| |
| static int vorbis_parse(AVCodecParserContext *s1, AVCodecContext *avctx, |
| const uint8_t **poutbuf, int *poutbuf_size, |
| const uint8_t *buf, int buf_size) |
| { |
| VorbisParseContext *s = s1->priv_data; |
| int duration; |
| |
| if (!s->vp && avctx->extradata && avctx->extradata_size) { |
| s->vp = av_vorbis_parse_init(avctx->extradata, avctx->extradata_size); |
| } |
| if (!s->vp) |
| goto end; |
| |
| if ((duration = av_vorbis_parse_frame(s->vp, buf, buf_size)) >= 0) |
| s1->duration = duration; |
| |
| end: |
| /* always return the full packet. this parser isn't doing any splitting or |
| combining, only packet analysis */ |
| *poutbuf = buf; |
| *poutbuf_size = buf_size; |
| return buf_size; |
| } |
| |
| static void vorbis_parser_close(AVCodecParserContext *ctx) |
| { |
| VorbisParseContext *s = ctx->priv_data; |
| av_vorbis_parse_free(&s->vp); |
| } |
| |
| AVCodecParser ff_vorbis_parser = { |
| .codec_ids = { AV_CODEC_ID_VORBIS }, |
| .priv_data_size = sizeof(VorbisParseContext), |
| .parser_parse = vorbis_parse, |
| .parser_close = vorbis_parser_close, |
| }; |
| #endif /* CONFIG_VORBIS_PARSER */ |