#include "coding.h" /* LucasArts' iMUSE decoder, mainly for VIMA (like IMA but with variable frame and code sizes). * Reverse engineered from various .exe * * Info: * - https://github.com/scummvm/scummvm/blob/master/engines/scumm/imuse_digi/dimuse_codecs.cpp (V1) * - https://wiki.multimedia.cx/index.php/VIMA (V2) * - https://github.com/residualvm/residualvm/tree/master/engines/grim/imuse * https://github.com/residualvm/residualvm/tree/master/engines/grim/movie/codecs (V2) */ static const int16_t step_table[] = { /* same as IMA */ 7, 8, 9, 10, 11, 12, 13, 14, 16, 17, 19, 21, 23, 25, 28, 31, 34, 37, 41, 45, 50, 55, 60, 66, 73, 80, 88, 97, 107, 118, 130, 143, 157, 173, 190, 209, 230, 253, 279, 307, 337, 371, 408, 449, 494, 544, 598, 658, 724, 796, 876, 963, 1060, 1166, 1282, 1411, 1552, 1707, 1878, 2066, 2272, 2499, 2749, 3024, 3327, 3660, 4026, 4428, 4871, 5358, 5894, 6484, 7132, 7845, 8630, 9493, 10442,11487,12635,13899, 15289,16818,18500,20350,22385,24623,27086,29794, 32767, }; /* pre-calculated in V1: for (i = 0; i < 89; i++) { int counter = (4 * step_table[i] / 7) >> 1; int size = 1; while (counter > 0) { size++; counter >>= 1; } code_size_table[i] = clamp(size, 3, 8) - 1 } */ static const uint8_t code_size_table_v1[89] = { 2, 2, 2, 2, 2, 2, 2, 3, 3, 3, 3, 3, 3, 3, 4, 4, 4, 4, 4, 4, 4, 4, 5, 5, 5, 5, 5, 5, 5, 6, 6, 6, 6, 6, 6, 6, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, }; static const uint8_t code_size_table_v2[89] = { 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 5, 5, 5, 5, 5, 5, 5, 5, 5, 5, 5, 5, 5, 5, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, }; static const int8_t index_table2b[4] = { -1, 4, -1, 4, }; static const int8_t index_table3b_v1[8] = { -1,-1, 2, 8, -1,-1, 2, 8, }; static const int8_t index_table3b_v2[8] = { -1,-1, 2, 6, -1,-1, 2, 6, }; static const int8_t index_table4b[16] = { -1,-1,-1,-1, 1, 2, 4, 6, -1,-1,-1,-1, 1, 2, 4, 6, }; static const int8_t index_table5b_v1[32] = { -1,-1,-1,-1,-1,-1,-1,-1, 1, 2, 4, 6, 8,12,16,32, -1,-1,-1,-1,-1,-1,-1,-1, 1, 2, 4, 6, 8,12,16,32, }; static const int8_t index_table5b_v2[32] = { -1,-1,-1,-1,-1,-1,-1,-1, 1, 1, 1, 2, 2, 4, 5, 6, -1,-1,-1,-1,-1,-1,-1,-1, 1, 1, 1, 2, 2, 4, 5, 6, }; static const int8_t index_table6b_v1[64] = { -1,-1,-1,-1,-1,-1,-1,-1, -1,-1,-1,-1,-1,-1,-1,-1, 1, 2, 4, 6, 8,10,12,14, 16,18,20,22,24,26,28,32, -1,-1,-1,-1,-1,-1,-1,-1, -1,-1,-1,-1,-1,-1,-1,-1, 1, 2, 4, 6, 8,10,12,14, 16,18,20,22,24,26,28,32, }; static const int8_t index_table6b_v2[64] = { -1,-1,-1,-1,-1,-1,-1,-1, -1,-1,-1,-1,-1,-1,-1,-1, 1, 1, 1, 1, 1, 2, 2, 2, 2, 4, 4, 4, 5, 5, 6, 6, -1,-1,-1,-1,-1,-1,-1,-1, -1,-1,-1,-1,-1,-1,-1,-1, 1, 1, 1, 1, 1, 2, 2, 2, 2, 4, 4, 4, 5, 5, 6, 6, }; static const int8_t index_table7b_v1[128] = { -1,-1,-1,-1,-1,-1,-1,-1, -1,-1,-1,-1,-1,-1,-1,-1, -1,-1,-1,-1,-1,-1,-1,-1, -1,-1,-1,-1,-1,-1,-1,-1, 1, 2, 3, 4, 5, 6, 7, 8, 9,10,11,12,13,14,15,16, 17,18,19,20,21,22,23,24, 25,26,27,28,29,30,31,32, -1,-1,-1,-1,-1,-1,-1,-1, -1,-1,-1,-1,-1,-1,-1,-1, -1,-1,-1,-1,-1,-1,-1,-1, -1,-1,-1,-1,-1,-1,-1,-1, 1, 2, 3, 4, 5, 6, 7, 8, 9,10,11,12,13,14,15,16, 17,18,19,20,21,22,23,24, 25,26,27,28,29,30,31,32, }; static const int8_t index_table7b_v2[128] = { -1,-1,-1,-1,-1,-1,-1,-1, -1,-1,-1,-1,-1,-1,-1,-1, -1,-1,-1,-1,-1,-1,-1,-1, -1,-1,-1,-1,-1,-1,-1,-1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 2, 2, 2, 2, 2, 2, 2, 4, 4, 4, 4, 4, 4, 5, 5, 5, 5, 6, 6, 6, 6, -1,-1,-1,-1,-1,-1,-1,-1, -1,-1,-1,-1,-1,-1,-1,-1, -1,-1,-1,-1,-1,-1,-1,-1, -1,-1,-1,-1,-1,-1,-1,-1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 2, 2, 2, 2, 2, 2, 2, 4, 4, 4, 4, 4, 4, 5, 5, 5, 5, 6, 6, 6, 6, }; static const int8_t* index_tables_v1[8] = { NULL, NULL, index_table2b, index_table3b_v1, index_table4b, index_table5b_v1, index_table6b_v1, index_table7b_v1, }; /* seems V2 doesn't actually use <4b, nor mirrored parts, even though they are defined */ static const int8_t* index_tables_v2[8] = { NULL, NULL, index_table2b, index_table3b_v2, index_table4b, index_table5b_v2, index_table6b_v2, index_table7b_v2, }; #define MAX_CHANNELS 2 #define MAX_BLOCK_SIZE 0x2000 #define MAX_BLOCK_COUNT 0x10000 /* arbitrary max */ /* ************************** */ typedef struct { /*const*/ int16_t* samples; int filled; int channels; //todo may be more useful with filled/full? use 2 mark methods? } sbuf_t; /* copy, move and mark consumed samples */ static void sbuf_consume(sample_t** p_outbuf, int32_t* p_samples_to_do, sbuf_t* sbuf) { int samples_consume; samples_consume = *p_samples_to_do; if (samples_consume > sbuf->filled) samples_consume = sbuf->filled; /* memcpy is safe when filled/samples_copy is 0 (but must pass non-NULL bufs) */ memcpy(*p_outbuf, sbuf->samples, samples_consume * sbuf->channels * sizeof(int16_t)); sbuf->samples += samples_consume * sbuf->channels; sbuf->filled -= samples_consume; *p_outbuf += samples_consume * sbuf->channels; *p_samples_to_do -= samples_consume; } static int clamp_s32(int val, int min, int max) { if (val > max) return max; else if (val < min) return min; return val; } /* ************************** */ typedef enum { COMP, MCMP } imuse_type_t; struct imuse_codec_data { /* config */ imuse_type_t type; int channels; size_t block_count; struct block_entry_t { uint32_t offset; /* from file start */ uint32_t size; uint32_t flags; uint32_t data; } *block_table; uint16_t adpcm_table[64 * 89]; /* state */ sbuf_t sbuf; int current_block; int16_t samples[MAX_BLOCK_SIZE / sizeof(int16_t) * MAX_CHANNELS]; }; imuse_codec_data* init_imuse(STREAMFILE* sf, int channels) { int i, j; off_t offset, data_offset; imuse_codec_data* data = NULL; if (channels > MAX_CHANNELS) goto fail; data = calloc(1, sizeof(struct imuse_codec_data)); if (!data) goto fail; data->channels = channels; /* read index table */ if (read_u32be(0x00,sf) == 0x434F4D50) { /* "COMP" */ data->block_count = read_u32be(0x04,sf); if (data->block_count > MAX_BLOCK_COUNT) goto fail; /* 08: base codec? */ /* 0c: some size? */ data->block_table = calloc(data->block_count, sizeof(struct block_entry_t)); if (!data->block_table) goto fail; offset = 0x10; for (i = 0; i < data->block_count; i++) { struct block_entry_t* entry = &data->block_table[i]; entry->offset = read_u32be(offset + 0x00, sf); entry->size = read_u32be(offset + 0x04, sf); entry->flags = read_u32be(offset + 0x08, sf); /* 0x0c: null */ entry->data = MAX_BLOCK_SIZE; /* blocks decode into fixed size, that may include header */ if (entry->size > MAX_BLOCK_SIZE) { VGM_LOG("IMUSE: block size too big\n"); goto fail; } if (entry->flags != 0x0D && entry->flags != 0x0F) { /* VIMA */ VGM_LOG("IMUSE: unknown codec\n"); goto fail; /* others are bunch of mini-codecs (ex. The Dig) */ } offset += 0x10; } /* detect type */ { uint32_t id = read_u32be(data->block_table[0].offset + 0x02, sf); if (id == 0x694D5553) { /* "iMUS" header [The Curse of Monkey Island (PC)] */ data->type = COMP; } else { goto fail; /* no header [The Dig (PC)] */ } } } else if (read_u32be(0x00,sf) == 0x4D434D50) { /* "MCMP" */ data->block_count = read_u16be(0x04,sf); if (data->block_count > MAX_BLOCK_COUNT) goto fail; data->block_table = calloc(data->block_count, sizeof(struct block_entry_t)); if (!data->block_table) goto fail; /* pre-calculate for simpler logic */ data_offset = 0x06 + data->block_count * 0x09; data_offset += 0x02 + read_u16be(data_offset + 0x00, sf); /* mini text header */ offset = 0x06; for (i = 0; i < data->block_count; i++) { struct block_entry_t* entry = &data->block_table[i]; entry->flags = read_u8 (offset + 0x00, sf); entry->data = read_u32be(offset + 0x01, sf); entry->size = read_u32be(offset + 0x05, sf); entry->offset = data_offset; /* blocks of data and audio are separate */ if (entry->data > MAX_BLOCK_SIZE || entry->size > MAX_BLOCK_SIZE) { VGM_LOG("IMUSE: block size too big\n"); goto fail; } if (entry->flags != 0x00 && entry->flags != 0x01) { /* data or VIMA */ VGM_LOG("IMUSE: unknown codec\n"); goto fail; } offset += 0x09; data_offset += entry->size; } data->type = MCMP; /* with header [Grim Fandango (multi)] */ /* there are iMUS or RIFF headers but affect parser */ } else { goto fail; } /* iMUSE pre-calculates main decode ops as a table, looks similar to standard IMA expand */ for (i = 0; i < 64; i++) { for (j = 0; j < 89; j++) { int counter = 32; int value = 0; int step = step_table[j]; while (counter > 0) { if (counter & i) value += step; step >>= 1; counter >>= 1; } data->adpcm_table[i + j * 64] = value; /* non sequential: all 64 [0]s, [1]s ... [88]s */ } } reset_imuse(data); return data; fail: free_imuse(data); return NULL; } /* **************************************** */ static void decode_vima1(STREAMFILE* sf, sbuf_t* sbuf, uint8_t* buf, size_t data_left, int block_num, uint16_t* adpcm_table) { int ch, i, j, s; int bitpos; int adpcm_history[MAX_CHANNELS] = {0}; int adpcm_step_index[MAX_CHANNELS] = {0}; int chs = sbuf->channels; /* read header (outside decode in original code) */ { int pos = 0; size_t copy_size; /* decodes BLOCK_SIZE bytes (not samples), including copy_size if exists, but not first 16b * or ADPCM headers. ADPCM setup must be set to 0 if headers weren't read. */ copy_size = get_u16be(buf + pos); pos += 0x02; if (block_num == 0 && copy_size > 0) { /* iMUS header (always in first block) */ pos += copy_size; data_left -= copy_size; } else if (copy_size > 0) { /* presumably PCM data (not seen) */ for (i = 0, j = pos; i < copy_size / sizeof(sample_t); i++, j += 2) { sbuf->samples[i] = get_s16le(buf + j); } sbuf->filled += copy_size / chs / sizeof(sample_t); pos += copy_size; data_left -= copy_size; VGM_LOG("IMUS: found PCM block %i\n", block_num); } else { /* ADPCM header (never in first block) */ for (i = 0; i < chs; i++) { adpcm_step_index[i] = get_u8 (buf + pos + 0x00); //adpcm_step[i] = get_s32be(buf + pos + 0x01); /* same as step_table[step_index] */ adpcm_history[i] = get_s32be(buf + pos + 0x05); pos += 0x09; adpcm_step_index[i] = clamp_s32(adpcm_step_index[i], 0, 88); /* not originally */ } } bitpos = pos * 8; } /* decode ADPCM data after header * (stereo layout: all samples from L, then all for R) */ for (ch = 0; ch < chs; ch++) { int sample, step_index; int samples_to_do; int samples_left = data_left / sizeof(int16_t); int first_sample = sbuf->filled * chs + ch; if (chs == 1) { samples_to_do = samples_left; } else { /* L has +1 code for aligment in first block, must be read to reach R (code seems empty). * Not sure if COMI uses decoded bytes or decoded samples (returns samples_left / channels) * though but the latter makes more sense. */ if (ch == 0) samples_to_do = (samples_left + 1) / chs; else samples_to_do = (samples_left + 0) / chs; } //;VGM_ASSERT((samples_left + 1) / 2 != (samples_left + 0) / 2, "IMUSE: sample diffs\n"); step_index = adpcm_step_index[ch]; sample = adpcm_history[ch]; for (i = 0, s = first_sample; i < samples_to_do; i++, s += chs) { int code_size, code, sign_mask, data_mask, delta; if (bitpos >= MAX_BLOCK_SIZE * 8) { VGM_LOG("IMUSE: wrong bit offset\n"); break; } code_size = code_size_table_v1[step_index]; /* get bit thing from COMI (reads closest 16b then masks + shifts as needed), BE layout */ code = get_u16be(buf + (bitpos >> 3)); //ok code = (code << (bitpos & 7)) & 0xFFFF; code = code >> (16 - code_size); bitpos += code_size; sign_mask = (1 << (code_size - 1)); data_mask = sign_mask - 1; /* done with a LUT in COMI */ delta = adpcm_table[(step_index * 64) + (((code & data_mask) << (7 - code_size)))]; delta += step_table[step_index] >> (code_size - 1); if (code & sign_mask) delta = -delta; sample += delta; sample = clamp16(sample); sbuf->samples[s] = sample; step_index += index_tables_v1[code_size][code]; step_index = clamp_s32(step_index, 0, 88); } } sbuf->filled += data_left / sizeof(int16_t) / chs; } static int decode_block1(STREAMFILE* sf, imuse_codec_data* data, uint8_t* block, size_t data_left) { int block_num = data->current_block; switch(data->block_table[block_num].flags) { case 0x0D: case 0x0F: decode_vima1(sf, &data->sbuf, block, data_left, block_num, data->adpcm_table); break; default: return 0; } return 1; } static void decode_data2(STREAMFILE* sf, sbuf_t* sbuf, uint8_t* buf, size_t data_left, int block_num) { int i, j; int channels = sbuf->channels; if (block_num == 0) { /* iMUS header (always in first block, not shared with audio data unlike V1) */ sbuf->filled = 0; } else { /* presumably PCM data (not seen) */ for (i = 0, j = 0; i < data_left / sizeof(sample_t); i++, j += 2) { sbuf->samples[i] = get_s16le(buf + j); } sbuf->filled += data_left / channels / sizeof(sample_t); VGM_LOG("IMUS: found PCM block %i\n", block_num); } } static void decode_vima2(STREAMFILE* sf, sbuf_t* sbuf, uint8_t* buf, size_t data_left, uint16_t* adpcm_table) { int ch, i, s; int bitpos; int adpcm_history[MAX_CHANNELS] = {0}; int adpcm_step_index[MAX_CHANNELS] = {0}; int chs = sbuf->channels; uint16_t word; int pos = 0; /* read ADPCM header */ { for (i = 0; i < chs; i++) { adpcm_step_index[i] = get_u8 (buf + pos + 0x00); adpcm_history[i] = get_s16be(buf + pos + 0x01); pos += 0x03; /* checked as < 0 and only for first index, means "stereo" */ if (adpcm_step_index[i] & 0x80) { adpcm_step_index[i] = (~adpcm_step_index[i]) & 0xFF; if (chs != 2) return; } /* not originally done but in case of garbage data */ adpcm_step_index[i] = clamp_s32(adpcm_step_index[i], 0, 88); } } bitpos = 0; word = get_u16be(buf + pos); /* originally with a rolling buf, use index to validate overflow */ pos += 0x02; /* decode ADPCM data after header * (stereo layout: all samples from L, then all for R) */ for (ch = 0; ch < chs; ch++) { int sample, step_index; int samples_to_do; int samples_left = data_left / sizeof(int16_t); int first_sample = sbuf->filled * chs + ch; samples_to_do = samples_left / chs; step_index = adpcm_step_index[ch]; sample = adpcm_history[ch]; for (i = 0, s = first_sample; i < samples_to_do; i++, s += chs) { int code_size, code, sign_mask, data_mask, delta; if (pos >= MAX_BLOCK_SIZE) { VGM_LOG("IMUSE: wrong pos offset\n"); break; } code_size = code_size_table_v2[step_index]; sign_mask = (1 << (code_size - 1)); data_mask = (sign_mask - 1); /* get bit thing, masks current code and moves 'upwards' word after reading 8 bits */ bitpos += code_size; code = (word >> (16 - bitpos)) & (sign_mask | data_mask); if (bitpos > 7) { word = (word << 8) | buf[pos++]; bitpos -= 8; } /* clean sign stuff for next tests */ if (code & sign_mask) code ^= sign_mask; else sign_mask = 0; /* all bits set mean 'keyframe' = read next sample */ if (code == data_mask) { sample = (int16_t)(word << bitpos); word = (word << 8) | buf[pos++]; sample |= (word >> (8 - bitpos)) & 0xFF; word = (word << 8) | buf[pos++]; } else { delta = adpcm_table[(step_index * 64) + ((code << (7 - code_size)))]; if (code) delta += step_table[step_index] >> (code_size - 1); if (sign_mask) delta = -delta; sample += delta; sample = clamp16(sample); } sbuf->samples[s] = sample; step_index += index_tables_v2[code_size][code]; step_index = clamp_s32(step_index, 0, 88); } } sbuf->filled += data_left / sizeof(int16_t) / chs; } static int decode_block2(STREAMFILE* sf, imuse_codec_data* data, uint8_t* block, size_t data_left) { int block_num = data->current_block; switch(data->block_table[block_num].flags) { case 0x00: decode_data2(sf, &data->sbuf, block, data_left, block_num); break; case 0x01: decode_vima2(sf, &data->sbuf, block, data_left, data->adpcm_table); break; default: return 0; } return 1; } /* decodes a whole block into sample buffer, all at once due to L/R layout and VBR data */ static int decode_block(STREAMFILE* sf, imuse_codec_data* data) { int ok; uint8_t block[MAX_BLOCK_SIZE]; size_t data_left; data->sbuf.samples = data->samples; data->sbuf.channels = data->channels; if (data->current_block >= data->block_count) { return 0; } /* read block */ { off_t offset = data->block_table[data->current_block].offset; size_t size = data->block_table[data->current_block].size; read_streamfile(block, offset, size, sf); data_left = data->block_table[data->current_block].data; } switch(data->type) { case COMP: ok = decode_block1(sf, data, block, data_left); break; case MCMP: ok = decode_block2(sf, data, block, data_left); break; default: return 0; } /* block fully read */ data->current_block++; return ok; } void decode_imuse(VGMSTREAM* vgmstream, sample_t* outbuf, int32_t samples_to_do) { imuse_codec_data* data = vgmstream->codec_data; STREAMFILE* sf = vgmstream->ch[0].streamfile; int ok; while (samples_to_do > 0) { sbuf_t* sbuf = &data->sbuf; if (sbuf->filled == 0) { ok = decode_block(sf, data); if (!ok) goto fail; } sbuf_consume(&outbuf, &samples_to_do, sbuf); } return; fail: //todo fill silence return; } void free_imuse(imuse_codec_data* data) { if (!data) return; free(data->block_table); free(data); } void seek_imuse(imuse_codec_data* data, int32_t num_sample) { if (!data) return; //todo find closest block, set skip count reset_imuse(data); } void reset_imuse(imuse_codec_data* data) { if (!data) return; data->current_block = 0; data->sbuf.filled = 0; }