59686073 |
/*
* WMA compatible encoder
* Copyright (c) 2007 Michael Niedermayer
*
* This file is part of FFmpeg.
*
* FFmpeg is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
*
* FFmpeg is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with FFmpeg; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*/
|
6fee1b90 |
#include "libavutil/attributes.h" |
d2a4e4b9 |
|
59686073 |
#include "avcodec.h" |
27bacfeb |
#include "internal.h" |
59686073 |
#include "wma.h" |
0d92e5a6 |
#include "libavutil/avassert.h" |
59686073 |
|
6fee1b90 |
static av_cold int encode_init(AVCodecContext *avctx)
{ |
911b9faf |
WMACodecContext *s = avctx->priv_data; |
2ed40608 |
int i, flags1, flags2, block_align; |
59686073 |
uint8_t *extradata;
|
a9c9a240 |
s->avctx = avctx;
|
d2a4e4b9 |
if (avctx->channels > MAX_CHANNELS) {
av_log(avctx, AV_LOG_ERROR, |
75a9859a |
"too many channels: got %i, need %i or fewer\n", |
0cd13834 |
avctx->channels, MAX_CHANNELS);
return AVERROR(EINVAL);
}
|
1ec075cf |
if (avctx->sample_rate > 48000) { |
53819605 |
av_log(avctx, AV_LOG_ERROR, "sample rate is too high: %d > 48kHz\n", |
1ec075cf |
avctx->sample_rate);
return AVERROR(EINVAL);
}
|
d2a4e4b9 |
if (avctx->bit_rate < 24 * 1000) {
av_log(avctx, AV_LOG_ERROR,
"bitrate too low: got %i, need 24000 or higher\n", |
0cd13834 |
avctx->bit_rate);
return AVERROR(EINVAL);
} |
2ed76c08 |
|
59686073 |
/* extract flag infos */
flags1 = 0;
flags2 = 1; |
36ef5369 |
if (avctx->codec->id == AV_CODEC_ID_WMAV1) { |
d2a4e4b9 |
extradata = av_malloc(4);
avctx->extradata_size = 4; |
2c124cb6 |
AV_WL16(extradata, flags1); |
d2a4e4b9 |
AV_WL16(extradata + 2, flags2); |
36ef5369 |
} else if (avctx->codec->id == AV_CODEC_ID_WMAV2) { |
d2a4e4b9 |
extradata = av_mallocz(10);
avctx->extradata_size = 10; |
2c124cb6 |
AV_WL32(extradata, flags1); |
d2a4e4b9 |
AV_WL16(extradata + 4, flags2);
} else { |
9eb6e5cc |
av_assert0(0); |
d2a4e4b9 |
}
avctx->extradata = extradata;
s->use_exp_vlc = flags2 & 0x0001;
s->use_bit_reservoir = flags2 & 0x0002; |
59686073 |
s->use_variable_block_len = flags2 & 0x0004; |
51ddf35c |
if (avctx->channels == 2)
s->ms_stereo = 1; |
59686073 |
ff_wma_init(avctx, flags2);
/* init MDCT */ |
d2a4e4b9 |
for (i = 0; i < s->nb_block_sizes; i++) |
7d485f16 |
ff_mdct_init(&s->mdct_ctx[i], s->frame_len_bits - i + 1, 0, 1.0); |
59686073 |
|
d2a4e4b9 |
block_align = avctx->bit_rate * (int64_t) s->frame_len / |
c2b8dea1 |
(avctx->sample_rate * 8); |
2ed40608 |
block_align = FFMIN(block_align, MAX_CODED_SUPERFRAME_SIZE);
avctx->block_align = block_align; |
2df0c32e |
avctx->frame_size = avctx->initial_padding = s->frame_len; |
27bacfeb |
|
59686073 |
return 0;
}
|
d2a4e4b9 |
static void apply_window_and_mdct(AVCodecContext *avctx, const AVFrame *frame) |
31b2262d |
{ |
911b9faf |
WMACodecContext *s = avctx->priv_data; |
d2a4e4b9 |
float **audio = (float **) frame->extended_data; |
31b2262d |
int len = frame->nb_samples; |
d2a4e4b9 |
int window_index = s->frame_len_bits - s->block_len_bits;
FFTContext *mdct = &s->mdct_ctx[window_index]; |
31b2262d |
int ch; |
d2a4e4b9 |
const float *win = s->windows[window_index];
int window_len = 1 << s->block_len_bits;
float n = 2.0 * 32768.0 / window_len; |
31b2262d |
for (ch = 0; ch < avctx->channels; ch++) {
memcpy(s->output, s->frame_out[ch], window_len * sizeof(*s->output)); |
2fbb9e64 |
s->fdsp->vector_fmul_scalar(s->frame_out[ch], audio[ch], n, len);
s->fdsp->vector_fmul_reverse(&s->output[window_len], s->frame_out[ch], |
d2a4e4b9 |
win, len); |
2fbb9e64 |
s->fdsp->vector_fmul(s->frame_out[ch], s->frame_out[ch], win, len); |
31b2262d |
mdct->mdct_calc(mdct, s->coefs[ch], s->output); |
59686073 |
}
}
|
d2a4e4b9 |
// FIXME use for decoding too
static void init_exp(WMACodecContext *s, int ch, const int *exp_param)
{ |
59686073 |
int n;
const uint16_t *ptr;
float v, *q, max_scale, *q_end;
|
d2a4e4b9 |
ptr = s->exponent_bands[s->frame_len_bits - s->block_len_bits];
q = s->exponents[ch];
q_end = q + s->block_len; |
59686073 |
max_scale = 0;
while (q < q_end) {
/* XXX: use a table */ |
d2a4e4b9 |
v = pow(10, *exp_param++ *(1.0 / 16.0));
max_scale = FFMAX(max_scale, v);
n = *ptr++; |
59686073 |
do {
*q++ = v;
} while (--n);
}
s->max_exponent[ch] = max_scale;
}
|
d2a4e4b9 |
static void encode_exp_vlc(WMACodecContext *s, int ch, const int *exp_param)
{ |
59686073 |
int last_exp;
const uint16_t *ptr;
float *q, *q_end;
|
d2a4e4b9 |
ptr = s->exponent_bands[s->frame_len_bits - s->block_len_bits];
q = s->exponents[ch]; |
59686073 |
q_end = q + s->block_len;
if (s->version == 1) { |
d2a4e4b9 |
last_exp = *exp_param++; |
75a9859a |
av_assert0(last_exp - 10 >= 0 && last_exp - 10 < 32); |
59686073 |
put_bits(&s->pb, 5, last_exp - 10); |
d2a4e4b9 |
q += *ptr++;
} else |
59686073 |
last_exp = 36;
while (q < q_end) { |
d2a4e4b9 |
int exp = *exp_param++; |
59686073 |
int code = exp - last_exp + 60; |
9eb6e5cc |
av_assert1(code >= 0 && code < 120); |
d2a4e4b9 |
put_bits(&s->pb, ff_aac_scalefactor_bits[code],
ff_aac_scalefactor_code[code]); |
59686073 |
/* XXX: use a table */ |
d2a4e4b9 |
q += *ptr++;
last_exp = exp; |
59686073 |
}
}
|
d2a4e4b9 |
static int encode_block(WMACodecContext *s, float (*src_coefs)[BLOCK_MAX_SIZE],
int total_gain)
{ |
59686073 |
int v, bsize, ch, coef_nb_bits, parse_exponents;
float mdct_norm;
int nb_coefs[MAX_CHANNELS]; |
d2a4e4b9 |
static const int fixed_exp[25] = {
20, 20, 20, 20, 20,
20, 20, 20, 20, 20,
20, 20, 20, 20, 20,
20, 20, 20, 20, 20,
20, 20, 20, 20, 20
};
// FIXME remove duplication relative to decoder |
59686073 |
if (s->use_variable_block_len) { |
75a9859a |
av_assert0(0); // FIXME not implemented |
d2a4e4b9 |
} else { |
59686073 |
/* fixed block len */
s->next_block_len_bits = s->frame_len_bits;
s->prev_block_len_bits = s->frame_len_bits; |
d2a4e4b9 |
s->block_len_bits = s->frame_len_bits; |
59686073 |
}
s->block_len = 1 << s->block_len_bits; |
5936d982 |
// av_assert0((s->block_pos + s->block_len) <= s->frame_len); |
59686073 |
bsize = s->frame_len_bits - s->block_len_bits;
|
d2a4e4b9 |
// FIXME factor |
59686073 |
v = s->coefs_end[bsize] - s->coefs_start; |
2ed40608 |
for (ch = 0; ch < s->avctx->channels; ch++) |
59686073 |
nb_coefs[ch] = v;
{
int n4 = s->block_len / 2; |
d2a4e4b9 |
mdct_norm = 1.0 / (float) n4;
if (s->version == 1) |
59686073 |
mdct_norm *= sqrt(n4);
}
|
d2a4e4b9 |
if (s->avctx->channels == 2) |
51ddf35c |
put_bits(&s->pb, 1, !!s->ms_stereo); |
59686073 |
|
2ed40608 |
for (ch = 0; ch < s->avctx->channels; ch++) { |
d2a4e4b9 |
// FIXME only set channel_coded when needed, instead of always
s->channel_coded[ch] = 1;
if (s->channel_coded[ch]) |
59686073 |
init_exp(s, ch, fixed_exp);
}
|
2ed40608 |
for (ch = 0; ch < s->avctx->channels; ch++) { |
59686073 |
if (s->channel_coded[ch]) { |
9970c61b |
WMACoef *coefs1; |
59686073 |
float *coefs, *exponents, mult;
int i, n;
|
d2a4e4b9 |
coefs1 = s->coefs1[ch]; |
59686073 |
exponents = s->exponents[ch]; |
d2a4e4b9 |
mult = pow(10, total_gain * 0.05) / s->max_exponent[ch];
mult *= mdct_norm;
coefs = src_coefs[ch]; |
59686073 |
if (s->use_noise_coding && 0) { |
75a9859a |
av_assert0(0); // FIXME not implemented |
59686073 |
} else {
coefs += s->coefs_start; |
d2a4e4b9 |
n = nb_coefs[ch];
for (i = 0; i < n; i++) {
double t = *coefs++ / (exponents[i] * mult);
if (t < -32768 || t > 32767) |
59686073 |
return -1;
coefs1[i] = lrint(t);
}
}
}
}
v = 0; |
2ed40608 |
for (ch = 0; ch < s->avctx->channels; ch++) { |
21ac1d47 |
int a = s->channel_coded[ch]; |
59686073 |
put_bits(&s->pb, 1, a);
v |= a;
}
if (!v)
return 1;
|
d2a4e4b9 |
for (v = total_gain - 1; v >= 127; v -= 127) |
59686073 |
put_bits(&s->pb, 7, 127);
put_bits(&s->pb, 7, v);
|
d2a4e4b9 |
coef_nb_bits = ff_wma_total_gain_to_bits(total_gain); |
59686073 |
if (s->use_noise_coding) { |
2ed40608 |
for (ch = 0; ch < s->avctx->channels; ch++) { |
59686073 |
if (s->channel_coded[ch]) {
int i, n;
n = s->exponent_high_sizes[bsize]; |
d2a4e4b9 |
for (i = 0; i < n; i++) {
put_bits(&s->pb, 1, s->high_band_coded[ch][i] = 0); |
59686073 |
if (0)
nb_coefs[ch] -= s->exponent_high_bands[bsize][i];
}
}
}
}
parse_exponents = 1; |
d2a4e4b9 |
if (s->block_len_bits != s->frame_len_bits) |
59686073 |
put_bits(&s->pb, 1, parse_exponents);
if (parse_exponents) { |
2ed40608 |
for (ch = 0; ch < s->avctx->channels; ch++) { |
59686073 |
if (s->channel_coded[ch]) {
if (s->use_exp_vlc) {
encode_exp_vlc(s, ch, fixed_exp);
} else { |
75a9859a |
av_assert0(0); // FIXME not implemented |
59686073 |
// encode_exp_lsp(s, ch);
}
}
} |
d2a4e4b9 |
} else |
75a9859a |
av_assert0(0); // FIXME not implemented |
59686073 |
|
2ed40608 |
for (ch = 0; ch < s->avctx->channels; ch++) { |
59686073 |
if (s->channel_coded[ch]) {
int run, tindex; |
9970c61b |
WMACoef *ptr, *eptr; |
59686073 |
tindex = (ch == 1 && s->ms_stereo); |
d2a4e4b9 |
ptr = &s->coefs1[ch][0];
eptr = ptr + nb_coefs[ch];
run = 0;
for (; ptr < eptr; ptr++) {
if (*ptr) {
int level = *ptr;
int abs_level = FFABS(level);
int code = 0;
if (abs_level <= s->coef_vlcs[tindex]->max_level)
if (run < s->coef_vlcs[tindex]->levels[abs_level - 1])
code = run + s->int_table[tindex][abs_level - 1]; |
59686073 |
|
9eb6e5cc |
av_assert2(code < s->coef_vlcs[tindex]->n); |
d2a4e4b9 |
put_bits(&s->pb, s->coef_vlcs[tindex]->huffbits[code],
s->coef_vlcs[tindex]->huffcodes[code]); |
59686073 |
|
d2a4e4b9 |
if (code == 0) {
if (1 << coef_nb_bits <= abs_level) |
59686073 |
return -1;
put_bits(&s->pb, coef_nb_bits, abs_level);
put_bits(&s->pb, s->frame_len_bits, run);
} |
d2a4e4b9 |
// FIXME the sign is flipped somewhere
put_bits(&s->pb, 1, level < 0);
run = 0;
} else |
59686073 |
run++;
} |
d2a4e4b9 |
if (run)
put_bits(&s->pb, s->coef_vlcs[tindex]->huffbits[1],
s->coef_vlcs[tindex]->huffcodes[1]); |
59686073 |
} |
d2a4e4b9 |
if (s->version == 1 && s->avctx->channels >= 2) |
9f51c682 |
avpriv_align_put_bits(&s->pb); |
59686073 |
}
return 0;
}
|
d2a4e4b9 |
static int encode_frame(WMACodecContext *s, float (*src_coefs)[BLOCK_MAX_SIZE],
uint8_t *buf, int buf_size, int total_gain)
{ |
59686073 |
init_put_bits(&s->pb, buf, buf_size);
|
d2a4e4b9 |
if (s->use_bit_reservoir) |
75a9859a |
av_assert0(0); // FIXME not implemented |
d2a4e4b9 |
else if (encode_block(s, src_coefs, total_gain) < 0)
return INT_MAX; |
59686073 |
|
9f51c682 |
avpriv_align_put_bits(&s->pb); |
59686073 |
|
2ed40608 |
return put_bits_count(&s->pb) / 8 - s->avctx->block_align; |
59686073 |
}
|
27bacfeb |
static int encode_superframe(AVCodecContext *avctx, AVPacket *avpkt,
const AVFrame *frame, int *got_packet_ptr)
{ |
911b9faf |
WMACodecContext *s = avctx->priv_data; |
5968a076 |
int i, total_gain, ret, error; |
59686073 |
|
d2a4e4b9 |
s->block_len_bits = s->frame_len_bits; // required by non variable block len
s->block_len = 1 << s->block_len_bits; |
59686073 |
|
31b2262d |
apply_window_and_mdct(avctx, frame); |
59686073 |
if (s->ms_stereo) {
float a, b;
int i;
|
d2a4e4b9 |
for (i = 0; i < s->block_len; i++) {
a = s->coefs[0][i] * 0.5;
b = s->coefs[1][i] * 0.5; |
59686073 |
s->coefs[0][i] = a + b;
s->coefs[1][i] = a - b;
}
}
|
bcaf64b6 |
if ((ret = ff_alloc_packet2(avctx, avpkt, 2 * MAX_CODED_SUPERFRAME_SIZE)) < 0) |
27bacfeb |
return ret; |
dfc4fded |
|
d2a4e4b9 |
total_gain = 128;
for (i = 64; i; i >>= 1) { |
5968a076 |
error = encode_frame(s, s->coefs, avpkt->data, avpkt->size, |
27bacfeb |
total_gain - i); |
75a9859a |
if (error <= 0) |
d2a4e4b9 |
total_gain -= i; |
59686073 |
}
|
5968a076 |
while(total_gain <= 128 && error > 0)
error = encode_frame(s, s->coefs, avpkt->data, avpkt->size, total_gain++); |
dccaad3b |
if (error > 0) {
av_log(avctx, AV_LOG_ERROR, "Invalid input data or requested bitrate too low, cannot encode\n");
avpkt->size = 0;
return AVERROR(EINVAL);
} |
0a7bf340 |
av_assert0((put_bits_count(&s->pb) & 7) == 0); |
8551c6be |
i= avctx->block_align - (put_bits_count(&s->pb)+7)/8; |
0a7bf340 |
av_assert0(i>=0); |
c99bd294 |
while(i--) |
59686073 |
put_bits(&s->pb, 8, 'N');
flush_put_bits(&s->pb); |
8551c6be |
av_assert0(put_bits_ptr(&s->pb) - s->pb.buf == avctx->block_align); |
27bacfeb |
if (frame->pts != AV_NOPTS_VALUE) |
2df0c32e |
avpkt->pts = frame->pts - ff_samples_to_time_base(avctx, avctx->initial_padding); |
27bacfeb |
|
d2a4e4b9 |
avpkt->size = avctx->block_align; |
27bacfeb |
*got_packet_ptr = 1;
return 0; |
59686073 |
}
|
137e8081 |
#if CONFIG_WMAV1_ENCODER |
86714887 |
AVCodec ff_wmav1_encoder = {
.name = "wmav1", |
b2bed932 |
.long_name = NULL_IF_CONFIG_SMALL("Windows Media Audio 1"), |
86714887 |
.type = AVMEDIA_TYPE_AUDIO, |
36ef5369 |
.id = AV_CODEC_ID_WMAV1, |
86714887 |
.priv_data_size = sizeof(WMACodecContext),
.init = encode_init, |
27bacfeb |
.encode2 = encode_superframe, |
86714887 |
.close = ff_wma_end, |
d2a4e4b9 |
.sample_fmts = (const enum AVSampleFormat[]) { AV_SAMPLE_FMT_FLTP,
AV_SAMPLE_FMT_NONE }, |
59686073 |
}; |
137e8081 |
#endif
#if CONFIG_WMAV2_ENCODER |
86714887 |
AVCodec ff_wmav2_encoder = {
.name = "wmav2", |
b2bed932 |
.long_name = NULL_IF_CONFIG_SMALL("Windows Media Audio 2"), |
86714887 |
.type = AVMEDIA_TYPE_AUDIO, |
36ef5369 |
.id = AV_CODEC_ID_WMAV2, |
86714887 |
.priv_data_size = sizeof(WMACodecContext),
.init = encode_init, |
27bacfeb |
.encode2 = encode_superframe, |
86714887 |
.close = ff_wma_end, |
d2a4e4b9 |
.sample_fmts = (const enum AVSampleFormat[]) { AV_SAMPLE_FMT_FLTP,
AV_SAMPLE_FMT_NONE }, |
59686073 |
}; |
137e8081 |
#endif |