libavformat/cafenc.c
2c4ad1a3
 /*
  * Core Audio Format muxer
  * Copyright (c) 2011 Carl Eugen Hoyos
  *
  * This file is part of FFmpeg.
  *
  * FFmpeg is free software; you can redistribute it and/or
  * modify it under the terms of the GNU Lesser General Public
  * License as published by the Free Software Foundation; either
  * version 2.1 of the License, or (at your option) any later version.
  *
  * FFmpeg is distributed in the hope that it will be useful,
  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  * Lesser General Public License for more details.
  *
  * You should have received a copy of the GNU Lesser General Public
  * License along with FFmpeg; if not, write to the Free Software
  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  */
 
 #include "avformat.h"
 #include "caf.h"
 #include "isom.h"
 #include "avio_internal.h"
a6ef7b3a
 #include "libavutil/intfloat.h"
7fe6f6e2
 #include "libavutil/dict.h"
2c4ad1a3
 
 /**
  * Private state of the CAF muxer, stored in AVFormatContext.priv_data.
  */
 typedef struct {
     int64_t data;          ///< file position of the "data" chunk's mChunkSize field, patched by the trailer
9b60b076
     uint8_t *pkt_sizes;    ///< variable-length encoded packet sizes collected for the "pakt" chunk
     int size_buffer_size;  ///< allocated size of pkt_sizes as maintained by av_fast_realloc()
     int size_entries_used; ///< number of bytes of pkt_sizes currently in use
     int packets;           ///< packets recorded in pkt_sizes (only counted when block_align is 0)
2c4ad1a3
 } CAFContext;
 
bb2f13c1
 static uint32_t codec_flags(enum AVCodecID codec_id) {
2c4ad1a3
     switch (codec_id) {
7a72695c
     case AV_CODEC_ID_PCM_F32BE:
     case AV_CODEC_ID_PCM_F64BE:
2c4ad1a3
         return 1; //< kCAFLinearPCMFormatFlagIsFloat
7a72695c
     case AV_CODEC_ID_PCM_S16LE:
     case AV_CODEC_ID_PCM_S24LE:
     case AV_CODEC_ID_PCM_S32LE:
2c4ad1a3
         return 2; //< kCAFLinearPCMFormatFlagIsLittleEndian
7a72695c
     case AV_CODEC_ID_PCM_F32LE:
     case AV_CODEC_ID_PCM_F64LE:
2c4ad1a3
         return 3; //< kCAFLinearPCMFormatFlagIsFloat | kCAFLinearPCMFormatFlagIsLittleEndian
     default:
         return 0;
     }
 }
 
1acb5ca0
 static uint32_t samples_per_packet(enum AVCodecID codec_id, int channels, int block_align) {
2c4ad1a3
     switch (codec_id) {
7a72695c
     case AV_CODEC_ID_PCM_S8:
     case AV_CODEC_ID_PCM_S16LE:
     case AV_CODEC_ID_PCM_S16BE:
     case AV_CODEC_ID_PCM_S24LE:
     case AV_CODEC_ID_PCM_S24BE:
     case AV_CODEC_ID_PCM_S32LE:
     case AV_CODEC_ID_PCM_S32BE:
     case AV_CODEC_ID_PCM_F32LE:
     case AV_CODEC_ID_PCM_F32BE:
     case AV_CODEC_ID_PCM_F64LE:
     case AV_CODEC_ID_PCM_F64BE:
     case AV_CODEC_ID_PCM_ALAW:
     case AV_CODEC_ID_PCM_MULAW:
2c4ad1a3
         return 1;
7a72695c
     case AV_CODEC_ID_MACE3:
     case AV_CODEC_ID_MACE6:
2c4ad1a3
         return 6;
7a72695c
     case AV_CODEC_ID_ADPCM_IMA_QT:
2c4ad1a3
         return 64;
7a72695c
     case AV_CODEC_ID_AMR_NB:
     case AV_CODEC_ID_GSM:
a5d4e94a
     case AV_CODEC_ID_ILBC:
7a72695c
     case AV_CODEC_ID_QCELP:
2c4ad1a3
         return 160;
7a72695c
     case AV_CODEC_ID_GSM_MS:
43e96d04
         return 320;
7a72695c
     case AV_CODEC_ID_MP1:
2c4ad1a3
         return 384;
7a72695c
     case AV_CODEC_ID_MP2:
     case AV_CODEC_ID_MP3:
2c4ad1a3
         return 1152;
7a72695c
     case AV_CODEC_ID_AC3:
2c4ad1a3
         return 1536;
7a72695c
     case AV_CODEC_ID_QDM2:
7f1b3c2c
         return 2048 * channels;
     case AV_CODEC_ID_ALAC:
2c4ad1a3
         return 4096;
7a72695c
     case AV_CODEC_ID_ADPCM_IMA_WAV:
1acb5ca0
         return (block_align - 4 * channels) * 8 / (4 * channels) + 1;
7a72695c
     case AV_CODEC_ID_ADPCM_MS:
1acb5ca0
         return (block_align - 7 * channels) * 2 / channels + 2;
2c4ad1a3
     default:
         return 0;
     }
 }
 
 static int caf_write_header(AVFormatContext *s)
 {
     AVIOContext *pb = s->pb;
     AVCodecContext *enc = s->streams[0]->codec;
     CAFContext *caf = s->priv_data;
7fe6f6e2
     AVDictionaryEntry *t = NULL;
2c4ad1a3
     unsigned int codec_tag = ff_codec_get_tag(ff_codec_caf_tags, enc->codec_id);
7fe6f6e2
     int64_t chunk_size = 0;
2d56f0d0
     int frame_size = enc->frame_size;
2c4ad1a3
 
fb5518cf
     if (s->nb_streams != 1) {
         av_log(s, AV_LOG_ERROR, "CAF files have exactly one stream\n");
         return AVERROR(EINVAL);
     }
 
2c4ad1a3
     switch (enc->codec_id) {
7a72695c
     case AV_CODEC_ID_AAC:
c6e0332f
         av_log(s, AV_LOG_ERROR, "muxing codec currently unsupported\n");
         return AVERROR_PATCHWELCOME;
     }
 
     switch (enc->codec_id) {
7a72695c
     case AV_CODEC_ID_PCM_S8:
     case AV_CODEC_ID_PCM_S16LE:
     case AV_CODEC_ID_PCM_S16BE:
     case AV_CODEC_ID_PCM_S24LE:
     case AV_CODEC_ID_PCM_S24BE:
     case AV_CODEC_ID_PCM_S32LE:
     case AV_CODEC_ID_PCM_S32BE:
     case AV_CODEC_ID_PCM_F32LE:
     case AV_CODEC_ID_PCM_F32BE:
     case AV_CODEC_ID_PCM_F64LE:
     case AV_CODEC_ID_PCM_F64BE:
88084eec
         codec_tag = MKTAG('l','p','c','m');
2c4ad1a3
     }
 
     if (!codec_tag) {
         av_log(s, AV_LOG_ERROR, "unsupported codec\n");
         return AVERROR_INVALIDDATA;
     }
 
9b60b076
     if (!enc->block_align && !pb->seekable) {
         av_log(s, AV_LOG_ERROR, "Muxing variable packet size not supported on non seekable output\n");
         return AVERROR_INVALIDDATA;
2c4ad1a3
     }
 
2d56f0d0
     if (enc->codec_id != AV_CODEC_ID_MP3 || frame_size != 576)
1acb5ca0
         frame_size = samples_per_packet(enc->codec_id, enc->channels, enc->block_align);
2d56f0d0
 
2c4ad1a3
     ffio_wfourcc(pb, "caff"); //< mFileType
     avio_wb16(pb, 1);         //< mFileVersion
     avio_wb16(pb, 0);         //< mFileFlags
 
     ffio_wfourcc(pb, "desc");                         //< Audio Description chunk
     avio_wb64(pb, 32);                                //< mChunkSize
a6ef7b3a
     avio_wb64(pb, av_double2int(enc->sample_rate));   //< mSampleRate
88084eec
     avio_wl32(pb, codec_tag);                         //< mFormatID
2c4ad1a3
     avio_wb32(pb, codec_flags(enc->codec_id));        //< mFormatFlags
     avio_wb32(pb, enc->block_align);                  //< mBytesPerPacket
2d56f0d0
     avio_wb32(pb, frame_size);                        //< mFramesPerPacket
2c4ad1a3
     avio_wb32(pb, enc->channels);                     //< mChannelsPerFrame
b35477a2
     avio_wb32(pb, av_get_bits_per_sample(enc->codec_id)); //< mBitsPerChannel
2c4ad1a3
 
6d721f71
     if (enc->channel_layout) {
         ffio_wfourcc(pb, "chan");
         avio_wb64(pb, 12);
         ff_mov_write_chan(pb, enc->channel_layout);
     }
2c4ad1a3
 
7a72695c
     if (enc->codec_id == AV_CODEC_ID_ALAC) {
05a26730
         ffio_wfourcc(pb, "kuki");
         avio_wb64(pb, 12 + enc->extradata_size);
         avio_write(pb, "\0\0\0\14frmaalac", 12);
         avio_write(pb, enc->extradata, enc->extradata_size);
7a72695c
     } else if (enc->codec_id == AV_CODEC_ID_AMR_NB) {
05a26730
         ffio_wfourcc(pb, "kuki");
         avio_wb64(pb, 29);
         avio_write(pb, "\0\0\0\14frmasamr", 12);
         avio_wb32(pb, 0x11); /* size */
         avio_write(pb, "samrFFMP", 8);
         avio_w8(pb, 0); /* decoder version */
 
         avio_wb16(pb, 0x81FF); /* Mode set (all modes for AMR_NB) */
         avio_w8(pb, 0x00); /* Mode change period (no restriction) */
         avio_w8(pb, 0x01); /* Frames per sample */
7a72695c
     } else if (enc->codec_id == AV_CODEC_ID_QDM2) {
05a26730
         ffio_wfourcc(pb, "kuki");
         avio_wb64(pb, enc->extradata_size);
         avio_write(pb, enc->extradata, enc->extradata_size);
     }
 
7fe6f6e2
     if (av_dict_count(s->metadata)) {
         ffio_wfourcc(pb, "info"); //< Information chunk
         while ((t = av_dict_get(s->metadata, "", t, AV_DICT_IGNORE_SUFFIX))) {
             chunk_size += strlen(t->key) + strlen(t->value) + 2;
         }
         avio_wb64(pb, chunk_size + 4);
         avio_wb32(pb, av_dict_count(s->metadata));
         t = NULL;
         while ((t = av_dict_get(s->metadata, "", t, AV_DICT_IGNORE_SUFFIX))) {
             avio_put_str(pb, t->key);
             avio_put_str(pb, t->value);
         }
     }
 
2c4ad1a3
     ffio_wfourcc(pb, "data"); //< Audio Data chunk
     caf->data = avio_tell(pb);
     avio_wb64(pb, -1);        //< mChunkSize
     avio_wb32(pb, 0);         //< mEditCount
 
     avio_flush(pb);
     return 0;
 }
 
 /**
  * Append one packet to the "data" chunk and, when the stream has no fixed
  * block_align, record its size for the "pakt" chunk written by the trailer.
  *
  * Each size is stored as a variable-length integer: 7 bits per byte, most
  * significant group first, with the high bit set on every byte but the last.
  *
  * Space for the size entry is reserved before the packet data is written, so
  * a failed call leaves both the file and the size table untouched. On
  * allocation failure the already collected table is kept, so the trailer
  * never sees a NULL table together with a non-zero entry count.
  *
  * @param s   muxer context
  * @param pkt packet to write
  * @return 0 on success, AVERROR(ENOMEM) if the size table cannot grow
  */
 static int caf_write_packet(AVFormatContext *s, AVPacket *pkt)
 {
     CAFContext *caf = s->priv_data;
 
     if (!s->streams[0]->codec->block_align) {
         uint8_t *pkt_sizes;
         int i;
         /* one entry needs at most 5 bytes; the unsigned addition avoids
          * signed overflow, a wrapped result shows up as a negative value */
         int alloc_size = caf->size_entries_used + 5U;
 
         if (alloc_size < 0)
             return AVERROR(ENOMEM);
 
         pkt_sizes = av_fast_realloc(caf->pkt_sizes,
                                     &caf->size_buffer_size,
                                     alloc_size);
         if (!pkt_sizes)
             return AVERROR(ENOMEM); /* caf->pkt_sizes is still valid and freed by the trailer */
         caf->pkt_sizes = pkt_sizes;
 
         /* leading groups are emitted only once a non-zero one has been reached */
         for (i = 4; i > 0; i--) {
             unsigned top = pkt->size >> i * 7;
             if (top)
                 caf->pkt_sizes[caf->size_entries_used++] = 128 | top;
         }
         caf->pkt_sizes[caf->size_entries_used++] = pkt->size & 127;
         caf->packets++;
     }
 
     avio_write(s->pb, pkt->data, pkt->size);
     return 0;
 }
 
 /**
  * Finish the file: on seekable output, patch the size of the "data" chunk
  * and, for streams without a fixed block_align, append the "pakt" chunk
  * built from the packet sizes collected while muxing. The size table is
  * released in all cases.
  *
  * @param s muxer context
  * @return always 0
  */
 static int caf_write_trailer(AVFormatContext *s)
 {
     CAFContext *caf = s->priv_data;
     AVIOContext *pb = s->pb;
     AVCodecContext *enc = s->streams[0]->codec;
 
     if (pb->seekable) {
         int64_t file_size = avio_tell(pb);
 
         /* caf->data points at the 8-byte size field of the data chunk */
         avio_seek(pb, caf->data, SEEK_SET);
         avio_wb64(pb, file_size - caf->data - 8);
         avio_seek(pb, file_size, SEEK_SET);
         if (!enc->block_align) {
             ffio_wfourcc(pb, "pakt");
             avio_wb64(pb, caf->size_entries_used + 24);
             avio_wb64(pb, caf->packets); ///< mNumberPackets
             /* widen before multiplying: the product of two 32-bit values
              * would otherwise wrap before being stored in the 64-bit field */
             avio_wb64(pb, (int64_t)caf->packets *
                           samples_per_packet(enc->codec_id, enc->channels, enc->block_align)); ///< mNumberValidFrames
             avio_wb32(pb, 0); ///< mPrimingFrames
             avio_wb32(pb, 0); ///< mRemainderFrames
             avio_write(pb, caf->pkt_sizes, caf->size_entries_used);
             caf->size_buffer_size = 0;
         }
         avio_flush(pb);
     }
     av_freep(&caf->pkt_sizes);
     return 0;
 }
 
 /**
  * Muxer registration entry for the CAF format: default audio codec is
  * big-endian signed 16-bit PCM, video is not supported, and the three
  * callbacks above implement header, packet and trailer writing.
  */
 AVOutputFormat ff_caf_muxer = {
ba10207b
     .name           = "caf",
73f9d2e8
     .long_name      = NULL_IF_CONFIG_SMALL("Apple CAF (Core Audio Format)"),
ba10207b
     .mime_type      = "audio/x-caf",
     .extensions     = "caf",
     .priv_data_size = sizeof(CAFContext), /* per-file CAFContext state */
7a72695c
     .audio_codec    = AV_CODEC_ID_PCM_S16BE,
     .video_codec    = AV_CODEC_ID_NONE,
ba10207b
     .write_header   = caf_write_header,
     .write_packet   = caf_write_packet,
     .write_trailer  = caf_write_trailer,
73f9d2e8
     .codec_tag      = (const AVCodecTag* const []){ff_codec_caf_tags, 0}, /* zero-terminated list of tag tables */
2c4ad1a3
 };