summaryrefslogtreecommitdiffstats
path: root/libmpcodecs/ad_imaadpcm.c
diff options
context:
space:
mode:
authormelanson <melanson@b3059339-0415-0410-9bf9-f77b7e298cf2>2002-03-30 22:27:45 +0000
committermelanson <melanson@b3059339-0415-0410-9bf9-f77b7e298cf2>2002-03-30 22:27:45 +0000
commita9803b9f75c07b97c597cca6223e29887a75b759 (patch)
tree2f0f9d2b085ce8402512fcf422d989715bcd8df8 /libmpcodecs/ad_imaadpcm.c
parent73309be6c854414cecdcfbb8110926ed45b4af52 (diff)
downloadmpv-a9803b9f75c07b97c597cca6223e29887a75b759.tar.bz2
mpv-a9803b9f75c07b97c597cca6223e29887a75b759.tar.xz
reworked ADPCM decoders; changes include:
* fixed MS IMA ADPCM * dissolved adpcm.c/.h into appropriate ad_* decoders * DK4 audio is handled directly by IMA ADPCM decoder (this obsoletes ad_dk4adpcm.c) git-svn-id: svn://svn.mplayerhq.hu/mplayer/trunk@5409 b3059339-0415-0410-9bf9-f77b7e298cf2
Diffstat (limited to 'libmpcodecs/ad_imaadpcm.c')
-rw-r--r--libmpcodecs/ad_imaadpcm.c351
1 files changed, 333 insertions, 18 deletions
diff --git a/libmpcodecs/ad_imaadpcm.c b/libmpcodecs/ad_imaadpcm.c
index eca064d6c5..7f9e076eb0 100644
--- a/libmpcodecs/ad_imaadpcm.c
+++ b/libmpcodecs/ad_imaadpcm.c
@@ -1,11 +1,71 @@
+/*
+ IMA ADPCM Decoder for MPlayer
+ by Mike Melanson
+
+ This file is in charge of decoding all of the various IMA ADPCM data
+ formats that various entities have created. Details about the data
+ formats can be found here:
+ http://www.pcisys.net/~melanson/codecs/
+
+ So far, this file handles these formats:
+ 'ima4': IMA ADPCM found in QT files
+ 0x11: IMA ADPCM found in MS AVI/ASF/WAV files
+ 0x61: DK4 ADPCM found in certain AVI files on Sega Saturn CD-ROMs;
+ note that this is a 'rogue' format number in that it was
+ never officially registered with Microsoft
+*/
+
#include <stdio.h>
#include <stdlib.h>
#include <unistd.h>
#include "config.h"
+#include "bswap.h"
#include "ad_internal.h"
-#include "../adpcm.h"
+#define MS_IMA_ADPCM_PREAMBLE_SIZE 4
+
+#define QT_IMA_ADPCM_PREAMBLE_SIZE 2
+#define QT_IMA_ADPCM_BLOCK_SIZE 0x22
+#define QT_IMA_ADPCM_SAMPLES_PER_BLOCK 64
+
+#define BE_16(x) (be2me_16(*(unsigned short *)(x)))
+#define BE_32(x) (be2me_32(*(unsigned int *)(x)))
+#define LE_16(x) (le2me_16(*(unsigned short *)(x)))
+#define LE_32(x) (le2me_32(*(unsigned int *)(x)))
+
+// pertinent tables for IMA ADPCM
+static int adpcm_step[89] =
+{
+ 7, 8, 9, 10, 11, 12, 13, 14, 16, 17,
+ 19, 21, 23, 25, 28, 31, 34, 37, 41, 45,
+ 50, 55, 60, 66, 73, 80, 88, 97, 107, 118,
+ 130, 143, 157, 173, 190, 209, 230, 253, 279, 307,
+ 337, 371, 408, 449, 494, 544, 598, 658, 724, 796,
+ 876, 963, 1060, 1166, 1282, 1411, 1552, 1707, 1878, 2066,
+ 2272, 2499, 2749, 3024, 3327, 3660, 4026, 4428, 4871, 5358,
+ 5894, 6484, 7132, 7845, 8630, 9493, 10442, 11487, 12635, 13899,
+ 15289, 16818, 18500, 20350, 22385, 24623, 27086, 29794, 32767
+};
+
+static int adpcm_index[16] =
+{
+ -1, -1, -1, -1, 2, 4, 6, 8,
+ -1, -1, -1, -1, 2, 4, 6, 8
+};
+
+// useful macros
+// clamp a number between 0 and 88
+#define CLAMP_0_TO_88(x) if (x < 0) x = 0; else if (x > 88) x = 88;
+// clamp a number within a signed 16-bit range
+#define CLAMP_S16(x) if (x < -32768) x = -32768; \
+ else if (x > 32767) x = 32767;
+// clamp a number above 16
+#define CLAMP_ABOVE_16(x) if (x < 16) x = 16;
+// sign extend a 16-bit value
+#define SE_16BIT(x) if (x & 0x8000) x -= 0x10000;
+// sign extend a 4-bit value
+#define SE_4BIT(x) if (x & 0x8) x -= 0x10;
static ad_info_t info =
{
@@ -14,32 +74,52 @@ static ad_info_t info =
AFM_IMAADPCM,
"Nick Kurshev",
"Mike Melanson",
- "ima4 (MOV files)"
+ ""
};
LIBAD_EXTERN(imaadpcm)
+static int preinit(sh_audio_t *sh_audio)
+{
+ // not exactly sure what this field is for
+ sh_audio->audio_out_minsize = 8192;
+
+ // if format is "ima4", assume the audio is coming from a QT file which
+ // indicates constant block size, whereas an AVI/ASF/WAV file will fill
+ // in this field with 0x11
+ if ((sh_audio->format == 0x11) || (sh_audio->format == 0x61))
+ {
+ sh_audio->ds->ss_div = (sh_audio->wf->nBlockAlign -
+ (MS_IMA_ADPCM_PREAMBLE_SIZE * sh_audio->wf->nChannels)) * 2;
+ sh_audio->ds->ss_mul = sh_audio->wf->nBlockAlign;
+ }
+ else
+ {
+ sh_audio->ds->ss_div = QT_IMA_ADPCM_SAMPLES_PER_BLOCK;
+ sh_audio->ds->ss_mul = QT_IMA_ADPCM_BLOCK_SIZE * sh_audio->wf->nChannels;
+ }
+ return 1;
+}
+
static int init(sh_audio_t *sh_audio)
{
/* IMA-ADPCM 4:1 audio codec:*/
sh_audio->channels=sh_audio->wf->nChannels;
sh_audio->samplerate=sh_audio->wf->nSamplesPerSec;
/* decodes 34 byte -> 64 short*/
- sh_audio->i_bps=IMA_ADPCM_BLOCK_SIZE*(sh_audio->channels*sh_audio->samplerate)/
- IMA_ADPCM_SAMPLES_PER_BLOCK; /* 1:4 */
- return 1;
-}
+ sh_audio->i_bps =
+ (sh_audio->ds->ss_mul * sh_audio->samplerate) / sh_audio->ds->ss_div;
+
+ if ((sh_audio->a_in_buffer =
+ (unsigned char *)malloc(sh_audio->ds->ss_mul)) == NULL)
+ return 0;
-static int preinit(sh_audio_t *sh_audio)
-{
- sh_audio->audio_out_minsize=4096;
- sh_audio->ds->ss_div=IMA_ADPCM_SAMPLES_PER_BLOCK;
- sh_audio->ds->ss_mul=IMA_ADPCM_BLOCK_SIZE * sh_audio->wf->nChannels;
return 1;
}
-static void uninit(sh_audio_t *sh)
+static void uninit(sh_audio_t *sh_audio)
{
+ free(sh_audio->a_in_buffer);
}
static int control(sh_audio_t *sh,int cmd,void* arg, ...)
@@ -48,12 +128,247 @@ static int control(sh_audio_t *sh,int cmd,void* arg, ...)
return CONTROL_UNKNOWN;
}
+static void decode_nibbles(unsigned short *output,
+ int output_size, int channels,
+ int predictor_l, int index_l,
+ int predictor_r, int index_r)
+{
+ int step[2];
+ int predictor[2];
+ int index[2];
+ int diff;
+ int i;
+ int sign;
+ int delta;
+ int channel_number = 0;
+
+ step[0] = adpcm_step[index_l];
+ step[1] = adpcm_step[index_r];
+ predictor[0] = predictor_l;
+ predictor[1] = predictor_r;
+ index[0] = index_l;
+ index[1] = index_r;
+
+ for (i = 0; i < output_size; i++)
+ {
+ delta = output[i];
+
+ index[channel_number] += adpcm_index[delta];
+ CLAMP_0_TO_88(index[channel_number]);
+
+ sign = delta & 8;
+ delta = delta & 7;
+
+ diff = step[channel_number] >> 3;
+ if (delta & 4) diff += step[channel_number];
+ if (delta & 2) diff += step[channel_number] >> 1;
+ if (delta & 1) diff += step[channel_number] >> 2;
+
+ if (sign)
+ predictor[channel_number] -= diff;
+ else
+ predictor[channel_number] += diff;
+
+ CLAMP_S16(predictor[channel_number]);
+ output[i] = predictor[channel_number];
+ step[channel_number] = adpcm_step[index[channel_number]];
+
+ // toggle channel
+ channel_number ^= channels - 1;
+
+ }
+}
+
+static int qt_ima_adpcm_decode_block(unsigned short *output,
+ unsigned char *input, int channels)
+{
+ int initial_predictor_l = 0;
+ int initial_predictor_r = 0;
+ int initial_index_l = 0;
+ int initial_index_r = 0;
+ int i;
+
+ initial_predictor_l = BE_16(&input[0]);
+ initial_index_l = initial_predictor_l;
+
+ // mask, sign-extend, and clamp the predictor portion
+ initial_predictor_l &= 0xFF80;
+ SE_16BIT(initial_predictor_l);
+ CLAMP_S16(initial_predictor_l);
+
+ // mask and clamp the index portion
+ initial_index_l &= 0x7F;
+ CLAMP_0_TO_88(initial_index_l);
+
+ // handle stereo
+ if (channels > 1)
+ {
+ initial_predictor_r = BE_16(&input[QT_IMA_ADPCM_BLOCK_SIZE]);
+ initial_index_r = initial_predictor_r;
+
+ // mask, sign-extend, and clamp the predictor portion
+ initial_predictor_r &= 0xFF80;
+ SE_16BIT(initial_predictor_r);
+ CLAMP_S16(initial_predictor_r);
+
+ // mask and clamp the index portion
+ initial_index_r &= 0x7F;
+ CLAMP_0_TO_88(initial_index_r);
+ }
+
+ // break apart all of the nibbles in the block
+ if (channels == 1)
+ for (i = 0; i < QT_IMA_ADPCM_SAMPLES_PER_BLOCK / 2; i++)
+ {
+ output[i * 2 + 0] = input[2 + i] & 0x0F;
+ output[i * 2 + 1] = input[2 + i] >> 4;
+ }
+ else
+ for (i = 0; i < QT_IMA_ADPCM_SAMPLES_PER_BLOCK / 2 * 2; i++)
+ {
+ output[i * 4 + 0] = input[2 + i] & 0x0F;
+ output[i * 4 + 1] = input[2 + QT_IMA_ADPCM_BLOCK_SIZE + i] & 0x0F;
+ output[i * 4 + 2] = input[2 + i] >> 4;
+ output[i * 4 + 3] = input[2 + QT_IMA_ADPCM_BLOCK_SIZE + i] >> 4;
+ }
+
+ decode_nibbles(output,
+ QT_IMA_ADPCM_SAMPLES_PER_BLOCK * channels, channels,
+ initial_predictor_l, initial_index_l,
+ initial_predictor_r, initial_index_r);
+
+ return QT_IMA_ADPCM_SAMPLES_PER_BLOCK * channels;
+}
+
+static int ms_ima_adpcm_decode_block(unsigned short *output,
+ unsigned char *input, int channels, int block_size)
+{
+ int predictor_l = 0;
+ int predictor_r = 0;
+ int index_l = 0;
+ int index_r = 0;
+ int i;
+ int channel_counter;
+ int channel_index;
+ int channel_index_l;
+ int channel_index_r;
+
+ predictor_l = LE_16(&input[0]);
+ SE_16BIT(predictor_l);
+ index_l = input[2];
+ if (channels == 2)
+ {
+ predictor_r = LE_16(&input[4]);
+ SE_16BIT(predictor_r);
+ index_r = input[6];
+ }
+
+ if (channels == 1)
+ for (i = 0;
+ i < (block_size - MS_IMA_ADPCM_PREAMBLE_SIZE * channels) / 2; i++)
+ {
+ output[i * 2 + 0] = input[MS_IMA_ADPCM_PREAMBLE_SIZE + i] & 0x0F;
+ output[i * 2 + 1] = input[MS_IMA_ADPCM_PREAMBLE_SIZE + i] >> 4;
+ }
+ else
+ {
+ // encoded as 8 nibbles (4 bytes) per channel; switch channel every
+ // 4th byte
+ channel_counter = 0;
+ channel_index_l = 0;
+ channel_index_r = 1;
+ channel_index = channel_index_l;
+ for (i = 0;
+ i < (block_size - MS_IMA_ADPCM_PREAMBLE_SIZE * channels); i++)
+ {
+ output[channel_index + 0] =
+ input[MS_IMA_ADPCM_PREAMBLE_SIZE * 2 + i] & 0x0F;
+ output[channel_index + 2] =
+ input[MS_IMA_ADPCM_PREAMBLE_SIZE * 2 + i] >> 4;
+ channel_index += 4;
+ channel_counter++;
+ if (channel_counter == 4)
+ {
+ channel_index_l = channel_index;
+ channel_index = channel_index_r;
+ }
+ else if (channel_counter == 8)
+ {
+ channel_index_r = channel_index;
+ channel_index = channel_index_l;
+ channel_counter = 0;
+ }
+ }
+ }
+
+ decode_nibbles(output,
+ (block_size - MS_IMA_ADPCM_PREAMBLE_SIZE * channels) * 2,
+ channels,
+ predictor_l, index_l,
+ predictor_r, index_r);
+
+ return (block_size - MS_IMA_ADPCM_PREAMBLE_SIZE * channels) * 2;
+}
+
+static int dk4_ima_adpcm_decode_block(unsigned short *output,
+ unsigned char *input, int channels, int block_size)
+{
+ int i;
+ int output_ptr;
+ int predictor_l = 0;
+ int predictor_r = 0;
+ int index_l = 0;
+ int index_r = 0;
+
+ // the first predictor value goes straight to the output
+ predictor_l = output[0] = LE_16(&input[0]);
+ SE_16BIT(predictor_l);
+ index_l = input[2];
+ if (channels == 2)
+ {
+ predictor_r = output[1] = LE_16(&input[4]);
+ SE_16BIT(predictor_r);
+ index_r = input[6];
+ }
+
+ output_ptr = channels;
+ for (i = MS_IMA_ADPCM_PREAMBLE_SIZE * channels; i < block_size; i++)
+ {
+ output[output_ptr++] = input[i] >> 4;
+ output[output_ptr++] = input[i] & 0x0F;
+ }
+
+ decode_nibbles(&output[channels],
+ (block_size - MS_IMA_ADPCM_PREAMBLE_SIZE * channels) * 2 - channels,
+ channels,
+ predictor_l, index_l,
+ predictor_r, index_r);
+
+ return (block_size - MS_IMA_ADPCM_PREAMBLE_SIZE * channels) * 2 - channels;
+}
+
static int decode_audio(sh_audio_t *sh_audio,unsigned char *buf,int minlen,int maxlen)
{
- unsigned char ibuf[IMA_ADPCM_BLOCK_SIZE * 2]; /* bytes / stereo frame */
- if (demux_read_data(sh_audio->ds, ibuf,
- IMA_ADPCM_BLOCK_SIZE * sh_audio->wf->nChannels) !=
- IMA_ADPCM_BLOCK_SIZE * sh_audio->wf->nChannels)
- return -1;
- return 2*ima_adpcm_decode_block((unsigned short*)buf,ibuf, sh_audio->wf->nChannels);
+ if (demux_read_data(sh_audio->ds, sh_audio->a_in_buffer,
+ sh_audio->ds->ss_mul) !=
+ sh_audio->ds->ss_mul)
+ return -1;
+
+ if (sh_audio->format == 0x11)
+ {
+ return 2 * ms_ima_adpcm_decode_block(
+ (unsigned short*)buf, sh_audio->a_in_buffer, sh_audio->wf->nChannels,
+ sh_audio->ds->ss_mul);
+ }
+ else if (sh_audio->format == 0x61)
+ {
+ return 2 * dk4_ima_adpcm_decode_block(
+ (unsigned short*)buf, sh_audio->a_in_buffer, sh_audio->wf->nChannels,
+ sh_audio->ds->ss_mul);
+ }
+ else
+ {
+ return 2 * qt_ima_adpcm_decode_block(
+ (unsigned short*)buf, sh_audio->a_in_buffer, sh_audio->wf->nChannels);
+ }
}