libavformat/westwood.c
2fdf638b
 /*
  * Westwood Studios Multimedia Formats Demuxer (VQA, AUD)
  * Copyright (c) 2003 The ffmpeg Project
  *
b78e7197
  * This file is part of FFmpeg.
  *
  * FFmpeg is free software; you can redistribute it and/or
2fdf638b
  * modify it under the terms of the GNU Lesser General Public
  * License as published by the Free Software Foundation; either
b78e7197
  * version 2.1 of the License, or (at your option) any later version.
2fdf638b
  *
b78e7197
  * FFmpeg is distributed in the hope that it will be useful,
2fdf638b
  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  * Lesser General Public License for more details.
  *
  * You should have received a copy of the GNU Lesser General Public
b78e7197
  * License along with FFmpeg; if not, write to the Free Software
5509bffa
  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
2fdf638b
  */
 
 /**
ba87f080
  * @file
2fdf638b
  * Westwood Studios VQA & AUD file demuxers
  * by Mike Melanson (melanson@pcisys.net)
  * for more information on the Westwood file formats, visit:
  *   http://www.pcisys.net/~melanson/codecs/
  *   http://www.geocities.com/SiliconValley/8682/aud3.txt
  *
  * Implementation note: There is no definite file signature for AUD files.
  * The demuxer uses a probabilistic strategy for content detection. This
  * entails performing sanity checks on certain header values in order to
  * qualify a file. Refer to wsaud_probe() for the precise parameters.
  */
 
6a5d31ac
 #include "libavutil/intreadwrite.h"
2fdf638b
 #include "avformat.h"
 
 #define AUD_HEADER_SIZE 12
 #define AUD_CHUNK_PREAMBLE_SIZE 8
 #define AUD_CHUNK_SIGNATURE 0x0000DEAF
 
3a278992
 #define FORM_TAG MKBETAG('F', 'O', 'R', 'M')
 #define WVQA_TAG MKBETAG('W', 'V', 'Q', 'A')
 #define VQHD_TAG MKBETAG('V', 'Q', 'H', 'D')
 #define FINF_TAG MKBETAG('F', 'I', 'N', 'F')
 #define SND0_TAG MKBETAG('S', 'N', 'D', '0')
61710f7b
 #define SND1_TAG MKBETAG('S', 'N', 'D', '1')
3a278992
 #define SND2_TAG MKBETAG('S', 'N', 'D', '2')
 #define VQFR_TAG MKBETAG('V', 'Q', 'F', 'R')
2fdf638b
 
20f269dc
 /* don't know what these tags are for, but acknowledge their existence */
3a278992
 #define CINF_TAG MKBETAG('C', 'I', 'N', 'F')
 #define CINH_TAG MKBETAG('C', 'I', 'N', 'H')
 #define CIND_TAG MKBETAG('C', 'I', 'N', 'D')
 #define PINF_TAG MKBETAG('P', 'I', 'N', 'F')
 #define PINH_TAG MKBETAG('P', 'I', 'N', 'H')
 #define PIND_TAG MKBETAG('P', 'I', 'N', 'D')
61710f7b
 #define CMDS_TAG MKBETAG('C', 'M', 'D', 'S')
20f269dc
 
2fdf638b
 #define VQA_HEADER_SIZE 0x2A
 #define VQA_FRAMERATE 15
 #define VQA_PREAMBLE_SIZE 8
 
 typedef struct WsAudDemuxContext {
     int audio_samplerate;
     int audio_channels;
     int audio_bits;
fb65d2ca
     enum CodecID audio_type;
2fdf638b
     int audio_stream_index;
     int64_t audio_frame_counter;
 } WsAudDemuxContext;
 
 /* Demuxer state for a Westwood VQA file. */
 typedef struct WsVqaDemuxContext {
     /* copied from the audio stream's sample_rate in wsvqa_read_header() */
     int audio_samplerate;
     /* copied from the audio stream's channel count in wsvqa_read_header();
      * used as a divisor when counting samples in wsvqa_read_packet() */
     int audio_channels;
     /* NOTE(review): not written anywhere in the visible VQA code */
     int audio_bits;
 
     /* stream index assigned to SND1/SND2 packets */
     int audio_stream_index;
     /* stream index assigned to VQFR packets */
     int video_stream_index;
 
     /* running count of audio samples (per channel) seen so far */
     int64_t audio_frame_counter;
 } WsVqaDemuxContext;
 
 /**
  * Guess whether the probe buffer holds a Westwood AUD file.
  *
  * AUD files carry no signature, so the decision is made by sanity-checking
  * header fields and the signature of the first audio chunk:
  *   - 8000 <= sample rate (16 bits, little endian) <= 48000
  *   - the top 6 bits of the flags byte are zero
  *   - the compression type byte is 99 (WS IMA); type 1 is not supported
  *     and is therefore rejected here
  *   - the first chunk preamble carries AUD_CHUNK_SIGNATURE
  *
  * @param p probe data; at least AUD_HEADER_SIZE + AUD_CHUNK_PREAMBLE_SIZE
  *          bytes are required
  * @return AVPROBE_SCORE_MAX / 2 when every check passes (the heuristic is
  *         not strong enough for full certainty), 0 otherwise
  */
 static int wsaud_probe(AVProbeData *p)
 {
     const unsigned char *hdr = p->buf;
     int sample_rate;
 
     /* header plus the first chunk preamble must be available */
     if (p->buf_size < AUD_HEADER_SIZE + AUD_CHUNK_PREAMBLE_SIZE)
         return 0;
 
     /* plausible sample rate */
     sample_rate = AV_RL16(&hdr[0]);
     if (sample_rate < 8000 || sample_rate > 48000)
         return 0;
 
     /* only the 2 LSBs of the flags byte are known to be used; treat the
      * remaining bits as reserved until that proves too strict */
     if ((hdr[10] & 0xFC) != 0)
         return 0;
 
     /* compression type: WS IMA only */
     if (hdr[11] != 99)
         return 0;
 
     /* signature field of the first audio chunk preamble */
     if (AV_RL32(&hdr[16]) != AUD_CHUNK_SIGNATURE)
         return 0;
 
     return AVPROBE_SCORE_MAX / 2;
 }
 
 /**
  * Read the 12-byte AUD header and create the audio stream.
  *
  * Header fields used: bytes 0-1 sample rate (little endian), byte 10 flags
  * (bit 0 = stereo, bit 1 = 16 bit), byte 11 compression type.
  *
  * @param s  demuxer context; s->priv_data is a WsAudDemuxContext
  * @param ap unused
  * @return 0 on success, AVERROR(EIO) on a short read, AVERROR_INVALIDDATA
  *         for a zero sample rate or an unsupported compression type,
  *         AVERROR(ENOMEM) if the stream cannot be allocated
  */
 static int wsaud_read_header(AVFormatContext *s,
                              AVFormatParameters *ap)
 {
     WsAudDemuxContext *wsaud = s->priv_data;
     AVIOContext *pb = s->pb;
     AVStream *st;
     unsigned char header[AUD_HEADER_SIZE];
 
     if (avio_read(pb, header, AUD_HEADER_SIZE) != AUD_HEADER_SIZE)
         return AVERROR(EIO);
 
     wsaud->audio_samplerate = AV_RL16(&header[0]);
     /* the sample rate becomes the time base denominator below; a zero
      * value would yield an invalid 1/0 time base */
     if (!wsaud->audio_samplerate)
         return AVERROR_INVALIDDATA;
 
     /* only WS IMA (type 99) is supported */
     if (header[11] != 99)
         return AVERROR_INVALIDDATA;
     wsaud->audio_type = CODEC_ID_ADPCM_IMA_WS;
 
     /* flag 0 indicates stereo */
     wsaud->audio_channels = (header[10] & 0x1) + 1;
     /* flag 1 indicates 16 bit audio */
     wsaud->audio_bits = (((header[10] & 0x2) >> 1) + 1) * 8;
 
     /* initialize the audio decoder stream */
     st = av_new_stream(s, 0);
     if (!st)
         return AVERROR(ENOMEM);
     av_set_pts_info(st, 33, 1, wsaud->audio_samplerate);
     st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
     st->codec->codec_id = wsaud->audio_type;
     st->codec->codec_tag = 0;  /* no tag */
     st->codec->channels = wsaud->audio_channels;
     st->codec->sample_rate = wsaud->audio_samplerate;
     st->codec->bits_per_coded_sample = wsaud->audio_bits;
     st->codec->bit_rate = st->codec->channels * st->codec->sample_rate *
         st->codec->bits_per_coded_sample / 4;
     st->codec->block_align = st->codec->channels * st->codec->bits_per_coded_sample;
 
     wsaud->audio_stream_index = st->index;
     wsaud->audio_frame_counter = 0;
 
     return 0;
 }
 
 /**
  * Read one AUD chunk and return it as an audio packet.
  *
  * Each chunk starts with an 8-byte preamble: bytes 0-1 hold the payload
  * size (little endian) and bytes 4-7 must equal AUD_CHUNK_SIGNATURE.
  *
  * @param s   demuxer context; s->priv_data is a WsAudDemuxContext
  * @param pkt packet to fill
  * @return the payload size on success, AVERROR(EIO) on a short read,
  *         AVERROR_INVALIDDATA on a bad chunk signature, or the negative
  *         error code reported by av_get_packet()
  */
 static int wsaud_read_packet(AVFormatContext *s,
                              AVPacket *pkt)
 {
     WsAudDemuxContext *wsaud = s->priv_data;
     AVIOContext *pb = s->pb;
     unsigned char preamble[AUD_CHUNK_PREAMBLE_SIZE];
     unsigned int chunk_size;
     int ret = 0;
 
     if (avio_read(pb, preamble, AUD_CHUNK_PREAMBLE_SIZE) !=
         AUD_CHUNK_PREAMBLE_SIZE)
         return AVERROR(EIO);
 
     /* validate the chunk */
     if (AV_RL32(&preamble[4]) != AUD_CHUNK_SIGNATURE)
         return AVERROR_INVALIDDATA;
 
     chunk_size = AV_RL16(&preamble[0]);
     ret = av_get_packet(pb, pkt, chunk_size);
     if (ret < 0)
         return ret;
     if (ret != chunk_size) {
         /* a truncated chunk still allocated a packet; release it before
          * reporting the error */
         av_free_packet(pkt);
         return AVERROR(EIO);
     }
     pkt->stream_index = wsaud->audio_stream_index;
     /* the stream time base is 1/sample_rate (set in wsaud_read_header),
      * so the running sample count already is the timestamp */
     pkt->pts = wsaud->audio_frame_counter;
 
     /* 2 samples/byte, 1 or 2 samples per frame depending on stereo */
     wsaud->audio_frame_counter += (chunk_size * 2) / wsaud->audio_channels;
 
     return ret;
 }
 
 /**
  * Detect a Westwood VQA file by its IFF-style signature.
  *
  * @param p probe data; at least 12 bytes are required
  * @return AVPROBE_SCORE_MAX when the buffer starts with "FORM" and carries
  *         "WVQA" at offset 8, 0 otherwise
  */
 static int wsvqa_probe(AVProbeData *p)
 {
     /* both tags must be present: FORM at offset 0, WVQA at offset 8 */
     if (p->buf_size >= 12 &&
         AV_RB32(&p->buf[0]) == FORM_TAG &&
         AV_RB32(&p->buf[8]) == WVQA_TAG)
         return AVPROBE_SCORE_MAX;
 
     return 0;
 }
 
 /**
  * Parse the VQA header, create the video (and optionally audio) stream and
  * advance the input past the FINF chunk.
  *
  * The 0x2A-byte VQA header starting at file offset 20 is stored as the
  * video stream's extradata. Fields read from it (all little endian):
  * offset 0 version, offset 6 width, offset 8 height, offset 24 audio
  * sample rate, offset 26 audio channel count.
  *
  * @param s  demuxer context; s->priv_data is a WsVqaDemuxContext
  * @param ap unused
  * @return 0 on success, AVERROR(ENOMEM) on allocation failure,
  *         AVERROR(EIO) on a short read
  */
 static int wsvqa_read_header(AVFormatContext *s,
                              AVFormatParameters *ap)
 {
     WsVqaDemuxContext *wsvqa = s->priv_data;
     AVIOContext *pb = s->pb;
     AVStream *st;
     unsigned char *header;
     unsigned char scratch[VQA_PREAMBLE_SIZE];
     unsigned int chunk_tag;
     unsigned int chunk_size;
 
     /* initialize the video decoder stream */
     st = av_new_stream(s, 0);
     if (!st)
         return AVERROR(ENOMEM);
     av_set_pts_info(st, 33, 1, VQA_FRAMERATE);
     wsvqa->video_stream_index = st->index;
     st->codec->codec_type = AVMEDIA_TYPE_VIDEO;
     st->codec->codec_id = CODEC_ID_WS_VQA;
     st->codec->codec_tag = 0;  /* no fourcc */
 
     /* skip to the start of the VQA header */
     avio_seek(pb, 20, SEEK_SET);
 
     /* the VQA header needs to go to the decoder */
     st->codec->extradata = av_mallocz(VQA_HEADER_SIZE + FF_INPUT_BUFFER_PADDING_SIZE);
     if (!st->codec->extradata)
         return AVERROR(ENOMEM);
     st->codec->extradata_size = VQA_HEADER_SIZE;
     header = (unsigned char *)st->codec->extradata;
     if (avio_read(pb, st->codec->extradata, VQA_HEADER_SIZE) !=
         VQA_HEADER_SIZE) {
         /* clear the pointer and size too, so later cleanup of the stream
          * does not see a dangling extradata buffer */
         av_freep(&st->codec->extradata);
         st->codec->extradata_size = 0;
         return AVERROR(EIO);
     }
     st->codec->width = AV_RL16(&header[6]);
     st->codec->height = AV_RL16(&header[8]);
 
     /* initialize the audio decoder stream for VQA v1 or nonzero samplerate */
     if (AV_RL16(&header[24]) || (AV_RL16(&header[0]) == 1 && AV_RL16(&header[2]) == 1)) {
         st = av_new_stream(s, 0);
         if (!st)
             return AVERROR(ENOMEM);
         av_set_pts_info(st, 33, 1, VQA_FRAMERATE);
         st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
         /* version 1 files use the SND1 codec, later ones WS IMA ADPCM */
         if (AV_RL16(&header[0]) == 1)
             st->codec->codec_id = CODEC_ID_WESTWOOD_SND1;
         else
             st->codec->codec_id = CODEC_ID_ADPCM_IMA_WS;
         st->codec->codec_tag = 0;  /* no tag */
         /* fall back to 22050 Hz mono when the header leaves these unset */
         st->codec->sample_rate = AV_RL16(&header[24]);
         if (!st->codec->sample_rate)
             st->codec->sample_rate = 22050;
         st->codec->channels = header[26];
         if (!st->codec->channels)
             st->codec->channels = 1;
         st->codec->bits_per_coded_sample = 16;
         st->codec->bit_rate = st->codec->channels * st->codec->sample_rate *
             st->codec->bits_per_coded_sample / 4;
         st->codec->block_align = st->codec->channels * st->codec->bits_per_coded_sample;
 
         wsvqa->audio_stream_index = st->index;
         wsvqa->audio_samplerate = st->codec->sample_rate;
         wsvqa->audio_channels = st->codec->channels;
         wsvqa->audio_frame_counter = 0;
     }
 
     /* there are 0 or more chunks before the FINF chunk; iterate until
      * FINF has been skipped and the file will be ready to be demuxed */
     do {
         if (avio_read(pb, scratch, VQA_PREAMBLE_SIZE) != VQA_PREAMBLE_SIZE)
             return AVERROR(EIO);
         chunk_tag = AV_RB32(&scratch[0]);
         chunk_size = AV_RB32(&scratch[4]);
 
         /* catch any unknown header tags, for curiosity */
         switch (chunk_tag) {
         case CINF_TAG:
         case CINH_TAG:
         case CIND_TAG:
         case PINF_TAG:
         case PINH_TAG:
         case PIND_TAG:
         case FINF_TAG:
         case CMDS_TAG:
             break;
 
         default:
             av_log (s, AV_LOG_ERROR, " note: unknown chunk seen (%c%c%c%c)\n",
                 scratch[0], scratch[1],
                 scratch[2], scratch[3]);
             break;
         }
 
         avio_skip(pb, chunk_size);
     } while (chunk_tag != FINF_TAG);
 
     return 0;
 }
 
 /**
  * Return the next audio (SND1/SND2) or video (VQFR) chunk as a packet.
  *
  * Every chunk starts with an 8-byte preamble: a big-endian tag followed by
  * a big-endian payload size. Chunks with an odd size are followed by one
  * padding byte. Chunks of any other type are skipped.
  *
  * @param s   demuxer context; s->priv_data is a WsVqaDemuxContext
  * @param pkt packet to fill
  * @return the payload size on success, AVERROR(EIO) on a short payload
  *         read, the error from av_new_packet() on allocation failure, or
  *         -1 when no further chunk preamble can be read
  */
 static int wsvqa_read_packet(AVFormatContext *s,
                              AVPacket *pkt)
 {
     WsVqaDemuxContext *wsvqa = s->priv_data;
     AVIOContext *pb = s->pb;
     int ret = -1;
     unsigned char preamble[VQA_PREAMBLE_SIZE];
     unsigned int chunk_type;
     unsigned int chunk_size;
     int skip_byte;
 
     while (avio_read(pb, preamble, VQA_PREAMBLE_SIZE) == VQA_PREAMBLE_SIZE) {
         chunk_type = AV_RB32(&preamble[0]);
         chunk_size = AV_RB32(&preamble[4]);
         skip_byte = chunk_size & 0x01;
 
         /* audio_channels is only set (to >= 1) when wsvqa_read_header()
          * created an audio stream; without one there is nowhere to send
          * audio and the sample accounting below would divide by zero */
         if ((chunk_type == SND1_TAG || chunk_type == SND2_TAG) &&
             !wsvqa->audio_channels) {
             avio_skip(pb, (int64_t)chunk_size + skip_byte);
             continue;
         }
 
         if ((chunk_type == SND1_TAG) || (chunk_type == SND2_TAG) || (chunk_type == VQFR_TAG)) {
 
             ret = av_new_packet(pkt, chunk_size);
             if (ret < 0)
                 return ret;
             ret = avio_read(pb, pkt->data, chunk_size);
             if (ret != chunk_size) {
                 av_free_packet(pkt);
                 return AVERROR(EIO);
             }
 
             if (chunk_type == SND2_TAG) {
                 pkt->stream_index = wsvqa->audio_stream_index;
                 /* 2 samples/byte, 1 or 2 samples per frame depending on stereo */
                 wsvqa->audio_frame_counter += (chunk_size * 2) / wsvqa->audio_channels;
             } else if(chunk_type == SND1_TAG) {
                 pkt->stream_index = wsvqa->audio_stream_index;
                 /* unpacked size is stored in header */
                 wsvqa->audio_frame_counter += AV_RL16(pkt->data) / wsvqa->audio_channels;
             } else {
                 pkt->stream_index = wsvqa->video_stream_index;
             }
             /* stay on 16-bit alignment */
             if (skip_byte)
                 avio_skip(pb, 1);
 
             return ret;
         } else {
             switch(chunk_type){
             case CMDS_TAG:
             case SND0_TAG:
                 break;
             default:
                 av_log(s, AV_LOG_INFO, "Skipping unknown chunk 0x%08X\n", chunk_type);
             }
             /* widen before adding so a size of 0xFFFFFFFF cannot wrap */
             avio_skip(pb, (int64_t)chunk_size + skip_byte);
         }
     }
 
     return ret;
 }
 
b250f9c6
 #if CONFIG_WSAUD_DEMUXER
 /* Demuxer registration for Westwood Studios AUD files. */
 AVInputFormat ff_wsaud_demuxer = {
     .name           = "wsaud",
     .long_name      = NULL_IF_CONFIG_SMALL("Westwood Studios audio format"),
     .priv_data_size = sizeof(WsAudDemuxContext),
     .read_probe     = wsaud_probe,
     .read_header    = wsaud_read_header,
     .read_packet    = wsaud_read_packet,
 };
 #endif
b250f9c6
 #if CONFIG_WSVQA_DEMUXER
 /* Demuxer registration for Westwood Studios VQA files. */
 AVInputFormat ff_wsvqa_demuxer = {
     .name           = "wsvqa",
     .long_name      = NULL_IF_CONFIG_SMALL("Westwood Studios VQA format"),
     .priv_data_size = sizeof(WsVqaDemuxContext),
     .read_probe     = wsvqa_probe,
     .read_header    = wsvqa_read_header,
     .read_packet    = wsvqa_read_packet,
 };
 #endif