[FFmpeg-cvslog] r23646 - in trunk/libavcodec: mpegaudio.h mpegaudiodec.c
Vitor Sessak
vitor1001
Sat Jun 19 15:33:50 CEST 2010
On 06/19/2010 01:13 PM, M?ns Rullg?rd wrote:
> vitor<subversion at mplayerhq.hu> writes:
>
>> Author: vitor
>> Date: Sat Jun 19 11:56:05 2010
>> New Revision: 23646
>>
>> Log:
>> Factorize the mpegaudio windowing code in a function and call it by a
>> function pointer. Should allow for ASM optimizations.
>>
>> Modified:
>> trunk/libavcodec/mpegaudio.h
>> trunk/libavcodec/mpegaudiodec.c
>>
>> Modified: trunk/libavcodec/mpegaudiodec.c
>> ==============================================================================
>> --- trunk/libavcodec/mpegaudiodec.c Sat Jun 19 01:17:20 2010 (r23645)
>> +++ trunk/libavcodec/mpegaudiodec.c Sat Jun 19 11:56:05 2010 (r23646)
>> @@ -69,6 +69,8 @@
>>
>> static void compute_antialias_integer(MPADecodeContext *s, GranuleDef *g);
>> static void compute_antialias_float(MPADecodeContext *s, GranuleDef *g);
>> +static void apply_window_mp3_c(MPA_INT *synth_buf, MPA_INT *window,
>> + int *dither_state, OUT_INT *samples, int incr);
>>
>> /* vlc structure for decoding layer 3 huffman tables */
>> static VLC huff_vlc[16];
>> @@ -305,6 +307,7 @@ static av_cold int decode_init(AVCodecCo
>> int i, j, k;
>>
>> s->avctx = avctx;
>> + s->apply_window_mp3 = apply_window_mp3_c;
>>
>> avctx->sample_fmt= OUT_FMT;
>> s->error_recognition= avctx->error_recognition;
>> @@ -836,41 +839,20 @@ void av_cold RENAME(ff_mpa_synth_init)(M
>> }
>> }
>>
>> -/* 32 sub band synthesis filter. Input: 32 sub band samples, Output:
>> - 32 samples. */
>> -/* XXX: optimize by avoiding ring buffer usage */
>> -void RENAME(ff_mpa_synth_filter)(MPA_INT *synth_buf_ptr, int *synth_buf_offset,
>> - MPA_INT *window, int *dither_state,
>> - OUT_INT *samples, int incr,
>> - INTFLOAT sb_samples[SBLIMIT])
>> +static void apply_window_mp3_c(MPA_INT *synth_buf, MPA_INT *window,
>> + int *dither_state, OUT_INT *samples, int incr)
>> {
>> - register MPA_INT *synth_buf;
>> register const MPA_INT *w, *w2, *p;
>> - int j, offset;
>> + int j;
>> OUT_INT *samples2;
>> #if CONFIG_FLOAT
>> float sum, sum2;
>> #elif FRAC_BITS<= 15
>> - int32_t tmp[32];
>> int sum, sum2;
>> #else
>> int64_t sum, sum2;
>> #endif
>>
>> - offset = *synth_buf_offset;
>> - synth_buf = synth_buf_ptr + offset;
>> -
>> -#if FRAC_BITS<= 15&& !CONFIG_FLOAT
>> - dct32(tmp, sb_samples);
>> - for(j=0;j<32;j++) {
>> - /* NOTE: can cause a loss in precision if very high amplitude
>> - sound */
>> - synth_buf[j] = av_clip_int16(tmp[j]);
>> - }
>> -#else
>> - dct32(synth_buf, sb_samples);
>> -#endif
>> -
>> /* copy to avoid wrap */
>> memcpy(synth_buf + 512, synth_buf, 32 * sizeof(*synth_buf));
>>
>> @@ -909,10 +891,63 @@ void RENAME(ff_mpa_synth_filter)(MPA_INT
>> SUM8(MLSS, sum, w + 32, p);
>> *samples = round_sample(&sum);
>> *dither_state= sum;
>> +}
>> +
>> +
>> +/* 32 sub band synthesis filter. Input: 32 sub band samples, Output:
>> + 32 samples. */
>> +/* XXX: optimize by avoiding ring buffer usage */
>> +#if CONFIG_FLOAT
>> +void ff_mpa_synth_filter_float(MPADecodeContext *s, float *synth_buf_ptr,
>> + int *synth_buf_offset,
>> + float *window, int *dither_state,
>> + float *samples, int incr,
>> + float sb_samples[SBLIMIT])
>> +{
>> + float *synth_buf;
>> + int offset;
>> +
>> + offset = *synth_buf_offset;
>> + synth_buf = synth_buf_ptr + offset;
>> +
>> + dct32(synth_buf, sb_samples);
>> + s->apply_window_mp3(synth_buf, window, dither_state, samples, incr);
>> +
>> + offset = (offset - 32)& 511;
>> + *synth_buf_offset = offset;
>> +}
>> +#else
>> +void ff_mpa_synth_filter(MPA_INT *synth_buf_ptr, int *synth_buf_offset,
>> + MPA_INT *window, int *dither_state,
>> + OUT_INT *samples, int incr,
>> + INTFLOAT sb_samples[SBLIMIT])
>> +{
>> + register MPA_INT *synth_buf;
>> + int offset;
>> +#if FRAC_BITS<= 15
>> + int32_t tmp[32];
>> +#endif
>> +
>> + offset = *synth_buf_offset;
>> + synth_buf = synth_buf_ptr + offset;
>> +
>> +#if FRAC_BITS<= 15&& !CONFIG_FLOAT
>
> !CONFIG_FLOAT is always true here.
Of course. I noticed that but I thought it would be better not to touch
the original function in the first patch. If we settle for the code as
is, I will remove it.
>> + dct32(tmp, sb_samples);
>> + for(j=0;j<32;j++) {
>> + /* NOTE: can cause a loss in precision if very high amplitude
>> + sound */
>> + synth_buf[j] = av_clip_int16(tmp[j]);
>> + }
>> +#else
>> + dct32(synth_buf, sb_samples);
>> +#endif
>> +
>> + apply_window_mp3_c(synth_buf, window, dither_state, samples, incr);
>
> Why doesn't this use a function pointer too?
Because this is a public function used by other codecs (mpc and qdm2).
It would need either to make them store and initialize a
MPADecodeContext just for this function or to create some MPADSPContext
just for this function, which is also silly. Of course, everything
changes if you are planning to write a NEON optimized version of this
function...
>> offset = (offset - 32)& 511;
>> *synth_buf_offset = offset;
>> }
>> +#endif
>>
>> #define C3 FIXHR(0.86602540378443864676/2)
>>
>> @@ -2227,7 +2262,11 @@ static int mp_decode_frame(MPADecodeCont
>> for(ch=0;ch<s->nb_channels;ch++) {
>> samples_ptr = samples + ch;
>> for(i=0;i<nb_frames;i++) {
>> - RENAME(ff_mpa_synth_filter)(s->synth_buf[ch],&(s->synth_buf_offset[ch]),
>> + RENAME(ff_mpa_synth_filter)(
>> +#if CONFIG_FLOAT
>> + s,
>> +#endif
>
> Do I really need to tell you that this is hideously ugly?
No, that's why I was expecting some suggestion ;)
-Vitor
More information about the ffmpeg-cvslog
mailing list