mirror of
https://github.com/vgmstream/vgmstream.git
synced 2025-01-19 08:07:23 +01:00
855 lines
33 KiB
C
855 lines
33 KiB
C
#include "mpeg_decoder.h"
|
|
|
|
#ifdef VGM_USE_MPEG
|
|
|
|
/**
|
|
* Utils to parse EALayer3, an MP3 variant. EALayer3 frames have custom headers (removing unneded bits)
|
|
* with regular MPEG data and optional PCM blocks. We transform EA-frames to MPEG-frames on the fly
|
|
* and manually fill the sample PCM sample buffer.
|
|
*
|
|
* Layer III MPEG1 uses two granules (data chunks) per frame, while MPEG2/2.5 ("LSF mode") only one.
|
|
* EA-frames contain one granule, so to reconstruct one MPEG-frame we need two EA-frames (MPEG1) or
|
|
* one (MPEG2). This is only for our decoder, real EALayer3 would decode EA-frames directly.
|
|
* EALayer3 v1 and v2 differ in part of the header, but are mostly the same.
|
|
*
|
|
* Reverse engineering by Zench: https://bitbucket.org/Zenchreal/ealayer3 (ealayer3.exe decoder)
|
|
* Reference: https://www.mp3-tech.org/programmer/docs/mp3_theory.pdf
|
|
* https://github.com/FFmpeg/FFmpeg/blob/master/libavcodec/mpegaudiodec_template.c#L1306
|
|
*/
|
|
|
|
/* **************************************************************************** */
|
|
/* DEFS */
|
|
/* **************************************************************************** */
|
|
|
|
#define EALAYER3_MAX_EA_FRAME_SIZE 0x1000*2 /* enough for one EA-frame without PCM block */
|
|
#define EALAYER3_MAX_GRANULES 2
|
|
#define EALAYER3_MAX_CHANNELS 2
|
|
|
|
/* helper to pass around */
|
|
typedef struct {
|
|
STREAMFILE *sf;
|
|
off_t offset;
|
|
vgm_bitstream is;
|
|
uint8_t buf[EALAYER3_MAX_EA_FRAME_SIZE];
|
|
int leftover_bits;
|
|
} ealayer3_buffer_t;
|
|
|
|
/* parsed info from a single EALayer3 frame */
|
|
typedef struct {
|
|
/* EALayer3 v1 header */
|
|
uint32_t v1_pcm_flag;
|
|
uint32_t v1_offset_samples;
|
|
uint32_t v1_pcm_samples;
|
|
uint32_t v1_pcm_unknown;
|
|
|
|
/* EALayer3 v2 header */
|
|
uint32_t v2_extended_flag;
|
|
uint32_t v2_stereo_flag;
|
|
uint32_t v2_reserved;
|
|
uint32_t v2_frame_size; /* full size including headers and pcm block */
|
|
uint32_t v2_offset_mode; /* discard mode */
|
|
uint32_t v2_offset_samples; /* use depends on mode */
|
|
uint32_t v2_pcm_samples;
|
|
uint32_t v2_common_size; /* granule size: common header+data size; can be zero */
|
|
|
|
/* EALayer3 common header + side info */
|
|
uint32_t version_index;
|
|
uint32_t sample_rate_index;
|
|
uint32_t channel_mode;
|
|
uint32_t mode_extension;
|
|
|
|
uint32_t granule_index; /* 0 = first, 1 = second (for MPEG1, that needs pairs) */
|
|
uint32_t scfsi[EALAYER3_MAX_CHANNELS]; /* SCaleFactor Selection Info */
|
|
uint32_t main_data_size[EALAYER3_MAX_CHANNELS]; /* AKA part2_3_length */
|
|
uint32_t others_1[EALAYER3_MAX_CHANNELS]; /* rest of the side info as-is, divided in 2 */
|
|
uint32_t others_2[EALAYER3_MAX_CHANNELS];
|
|
|
|
/* derived from the above */
|
|
uint32_t data_offset_b; /* start of the MPEG data */
|
|
uint32_t pre_size; /* size of the V1/V2 part */
|
|
uint32_t base_size_b; /* size (bits) of the header+side info, up to data_size */
|
|
uint32_t data_size_b; /* size (bits) of the main MPEG data up to pcm block; can be zero */
|
|
uint32_t padding_size_b; /* size (bits) of the padding after base+data */
|
|
uint32_t common_size; /* size of the common part (base+data+padding) */
|
|
uint32_t pcm_size; /* size of the pcm block */
|
|
uint32_t eaframe_size; /* size of all of the above, for convenience */
|
|
|
|
int mpeg1; /* flag, as MPEG2/2.5 ("low sample frequency" mode) has some differences */
|
|
int version;
|
|
int channels;
|
|
int sample_rate;
|
|
|
|
} ealayer3_frame_t;
|
|
|
|
|
|
static int ealayer3_parse_frame(mpeg_codec_data *data, int num_stream, ealayer3_buffer_t *ib, ealayer3_frame_t *eaf);
|
|
static int ealayer3_parse_frame_v1(ealayer3_buffer_t *ib, ealayer3_frame_t *eaf, int channels_per_frame, int is_v1b);
|
|
static int ealayer3_parse_frame_v2(ealayer3_buffer_t *ib, ealayer3_frame_t *eaf);
|
|
static int ealayer3_parse_frame_common(ealayer3_buffer_t *ib, ealayer3_frame_t *eaf);
|
|
static int ealayer3_rebuild_mpeg_frame(vgm_bitstream *is_0, ealayer3_frame_t *eaf_0, vgm_bitstream *is_1, ealayer3_frame_t *eaf_1, vgm_bitstream *os);
|
|
static int ealayer3_write_pcm_block(VGMSTREAMCHANNEL *stream, mpeg_codec_data *data, int num_stream, ealayer3_frame_t *eaf);
|
|
static int ealayer3_skip_data(VGMSTREAMCHANNEL *stream, mpeg_codec_data *data, int num_stream, int at_start);
|
|
static int ealayer3_is_empty_frame_v2p(STREAMFILE *sf, off_t offset);
|
|
|
|
/* **************************************************************************** */
|
|
/* EXTERNAL API */
|
|
/* **************************************************************************** */
|
|
|
|
/* init codec from an EALayer3 frame */
|
|
int mpeg_custom_setup_init_ealayer3(STREAMFILE *streamfile, off_t start_offset, mpeg_codec_data *data, coding_t *coding_type) {
|
|
int ok;
|
|
ealayer3_buffer_t ib = {0};
|
|
ealayer3_frame_t eaf;
|
|
|
|
|
|
//;VGM_LOG("init at %lx\n", start_offset);
|
|
/* get first frame for info */
|
|
{
|
|
ib.sf = streamfile;
|
|
ib.offset = start_offset;
|
|
ib.is.buf = ib.buf;
|
|
|
|
ok = ealayer3_parse_frame(data, -1, &ib, &eaf);
|
|
if (!ok) goto fail;
|
|
}
|
|
;VGM_ASSERT(!eaf.mpeg1, "EAL3: mpeg2 found at 0x%lx\n", start_offset); /* rare [FIFA 08 (PS3) abk] */
|
|
|
|
*coding_type = coding_MPEG_ealayer3;
|
|
data->channels_per_frame = eaf.channels;
|
|
data->samples_per_frame = eaf.mpeg1 ? 1152 : 576;
|
|
|
|
/* handled at frame start */
|
|
//data->skip_samples = 576 + 529;
|
|
//data->samples_to_discard = data->skip_samples;
|
|
|
|
/* encoder delay: EALayer3 handles this while decoding (skips samples as writes PCM blocks) */
|
|
|
|
return 1;
|
|
fail:
|
|
return 0;
|
|
}
|
|
|
|
/* writes data to the buffer and moves offsets, transforming EALayer3 frames */
|
|
int mpeg_custom_parse_frame_ealayer3(VGMSTREAMCHANNEL *stream, mpeg_codec_data *data, int num_stream) {
|
|
mpeg_custom_stream *ms = data->streams[num_stream];
|
|
int ok, granule_found;
|
|
ealayer3_buffer_t ib_0 = {0}, ib_1 = {0};
|
|
ealayer3_frame_t eaf_0, eaf_1;
|
|
|
|
|
|
/* the first frame samples must be discarded (verified vs sx.exe with a file without PCM blocks),
|
|
* but we can't set samples_to_discard since PCM blocks would be discarded
|
|
* SCHl block samples field takes into account this discard (its value already substracts this) */
|
|
if ((data->type == MPEG_EAL31 || data->type == MPEG_EAL31b) && ms->current_size_count == 0) {
|
|
/* seems true for MP2/576 frame samples too, though they are rare so it's hard to test */
|
|
ms->decode_to_discard += 529 + 576; /* standard MP3 decoder delay + 1 granule samples */
|
|
ms->current_size_count++;
|
|
}
|
|
|
|
|
|
/* read first frame/granule, or PCM-only frame (found alone at the end of SCHl streams) */
|
|
{
|
|
//;VGM_LOG("s%i: get granule0 at %lx\n", num_stream,stream->offset);
|
|
if (!ealayer3_skip_data(stream, data, num_stream, 1))
|
|
goto fail;
|
|
|
|
ib_0.sf = stream->streamfile;
|
|
ib_0.offset = stream->offset;
|
|
ib_0.is.buf = ib_0.buf;
|
|
|
|
ok = ealayer3_parse_frame(data, num_stream, &ib_0, &eaf_0);
|
|
if (!ok) goto fail;
|
|
|
|
ok = ealayer3_write_pcm_block(stream, data, num_stream, &eaf_0);
|
|
if (!ok) goto fail;
|
|
|
|
stream->offset += eaf_0.eaframe_size;
|
|
//;VGM_LOG("s%i: get granule0 done at %lx (eaf_size=%x, common_size=%x)\n", num_stream,stream->offset, eaf_0.eaframe_size, eaf_0.common_size);
|
|
|
|
if (!ealayer3_skip_data(stream, data, num_stream, 0))
|
|
goto fail;
|
|
}
|
|
|
|
/* In EAL3 V2P sometimes there is a new SNS/SPS block between granules. Instead of trying to fix it here
|
|
* or in blocked layout (too complex/patchy), SNS/SPS uses a custom streamfile that simply removes all
|
|
* block headers, so this parser only sees raw EALayer3 data. It also discards samples, which confuses
|
|
* blocked layout calculations
|
|
*
|
|
* Similarly (as V2P decodes and writes 1 granule at a time) stream can end in granule0. Since mpg123
|
|
* decodes in pairs we detect and feed it a fake end granule1, to get the last granule0's 576 samples. */
|
|
|
|
granule_found = 0;
|
|
/* get second frame/granule (MPEG1 only) if first granule was found */
|
|
while (eaf_0.common_size && eaf_0.mpeg1 && !granule_found) {
|
|
//;VGM_LOG("s%i: get granule1 at %lx\n", num_stream,stream->offset);
|
|
if (!ealayer3_skip_data(stream, data, num_stream, 1))
|
|
goto fail;
|
|
|
|
/* detect end granule0 (which may be before stream end in multichannel) and create a usable last granule1 */
|
|
if (data->type == MPEG_EAL32P && eaf_0.mpeg1 && ealayer3_is_empty_frame_v2p(stream->streamfile, stream->offset)) {
|
|
//;VGM_LOG("EAL3: fake granule1 needed\n");
|
|
/* memcpy/clone for now as I'm not sure now to create a valid empty granule1, but
|
|
* probably doesn't matter since num_samples should end before reaching granule1 samples (<=576) */
|
|
eaf_1 = eaf_0;
|
|
ib_1 = ib_0;
|
|
eaf_1.granule_index = 1;
|
|
break;
|
|
}
|
|
|
|
ib_1.sf = stream->streamfile;
|
|
ib_1.offset = stream->offset;
|
|
ib_1.is.buf = ib_1.buf;
|
|
|
|
ok = ealayer3_parse_frame(data, num_stream, &ib_1, &eaf_1);
|
|
if (!ok) goto fail;
|
|
|
|
ok = ealayer3_write_pcm_block(stream, data, num_stream, &eaf_1);
|
|
if (!ok) goto fail;
|
|
|
|
stream->offset += eaf_1.eaframe_size;
|
|
//;VGM_LOG("s%i: get granule1 done at %lx (eaf_size=%x, common_size=%x)\n", num_stream,stream->offset, eaf_1.eaframe_size, eaf_1.common_size);
|
|
|
|
if (!ealayer3_skip_data(stream, data, num_stream, 0))
|
|
goto fail;
|
|
|
|
/* in V1a there may be PCM-only frames between granules so read until next one (or parse fails) */
|
|
if (eaf_1.common_size > 0)
|
|
granule_found = 1;
|
|
}
|
|
|
|
/* rebuild EALayer3 frame to MPEG frame */
|
|
{
|
|
vgm_bitstream os = {0};
|
|
|
|
os.buf = ms->buffer;
|
|
os.bufsize = ms->buffer_size;
|
|
|
|
ok = ealayer3_rebuild_mpeg_frame(&ib_0.is, &eaf_0, &ib_1.is, &eaf_1, &os);
|
|
if (!ok) goto fail;
|
|
|
|
ms->bytes_in_buffer = os.b_off / 8; /* wrote full MPEG frame, hopefully */
|
|
}
|
|
|
|
return 1;
|
|
fail:
|
|
return 0;
|
|
}
|
|
|
|
|
|
/* **************************************************************************** */
|
|
/* INTERNAL HELPERS */
|
|
/* **************************************************************************** */
|
|
|
|
/* Read at most N bits from streamfile. This makes more smaller reads (not good) but
|
|
* allows exact frame size reading (good), as reading over a frame then reading back
|
|
* is expensive in EALayer3 since it uses custom streamfiles. */
|
|
static void fill_buf(ealayer3_buffer_t *ib, int bits) {
|
|
size_t read_size, bytes_size;
|
|
int mod;
|
|
|
|
/* count leftover bits since we can only read 8 bits at a time:
|
|
* - fill 6b: read 1 byte (8b) > leftover 2b
|
|
* - fill 20b: remove leftover 2b (=fill 18b), read 3 bytes (16+8b) > leftover 6b
|
|
* - fill 4b: remove leftover 6b > no need to read > lefover 2b
|
|
* - etc
|
|
*/
|
|
|
|
//;VGM_LOG("fill: %i + (l=%i)\n", bits, bits);
|
|
|
|
if (ib->leftover_bits >= bits) {
|
|
ib->leftover_bits -= bits;
|
|
return;
|
|
}
|
|
|
|
bits -= ib->leftover_bits;
|
|
mod = (bits % 8);
|
|
bytes_size = (bits / 8) + (mod > 0 ? 0x01 : 0);
|
|
|
|
//;VGM_LOG("filled: %lx + %x (b=%i, m=%i)\n", ib->offset, bytes_size, bits, (mod > 0 ? 8 - mod : 0));
|
|
|
|
read_size = read_streamfile(ib->buf + ib->is.bufsize, ib->offset, bytes_size, ib->sf);
|
|
ib->is.bufsize += read_size;
|
|
ib->offset += read_size;
|
|
ib->leftover_bits = (mod > 0 ? 8 - mod : 0);
|
|
}
|
|
|
|
static int ealayer3_parse_frame(mpeg_codec_data *data, int num_stream, ealayer3_buffer_t *ib, ealayer3_frame_t *eaf) {
|
|
int ok;
|
|
|
|
/* We must pass this from state, as not all EA-frames have channel info.
|
|
* (unknown in the first EA-frame but that's ok) */
|
|
int channels_per_frame = 0;
|
|
if (num_stream >= 0) {
|
|
channels_per_frame = data->streams[num_stream]->channels_per_frame;
|
|
}
|
|
|
|
/* make sure as there is re-parsing in loops */
|
|
memset(eaf, 0, sizeof(ealayer3_frame_t));
|
|
|
|
switch(data->type) {
|
|
case MPEG_EAL31: ok = ealayer3_parse_frame_v1(ib, eaf, channels_per_frame, 0); break;
|
|
case MPEG_EAL31b: ok = ealayer3_parse_frame_v1(ib, eaf, channels_per_frame, 1); break;
|
|
case MPEG_EAL32P:
|
|
case MPEG_EAL32S: ok = ealayer3_parse_frame_v2(ib, eaf); break;
|
|
default: goto fail;
|
|
}
|
|
if (!ok) goto fail;
|
|
|
|
return 1;
|
|
fail:
|
|
return 0;
|
|
}
|
|
|
|
|
|
/* read V1"a" (in SCHl) and V1"b" (in SNS) EALayer3 frame */
|
|
static int ealayer3_parse_frame_v1(ealayer3_buffer_t *ib, ealayer3_frame_t *eaf, int channels_per_frame, int is_v1b) {
|
|
int ok;
|
|
vgm_bitstream *is = &ib->is;
|
|
|
|
|
|
/* read EA-frame V1 header */
|
|
fill_buf(ib, 8);
|
|
r_bits(is, 8,&eaf->v1_pcm_flag);
|
|
|
|
eaf->pre_size = 1; /* 8b */
|
|
|
|
if (eaf->v1_pcm_flag != 0x00 && eaf->v1_pcm_flag != 0xEE) {
|
|
VGM_LOG("EAL3 v1: header not 0x00 or 0xEE\n");
|
|
goto fail; /* wrong offset? */
|
|
}
|
|
if (eaf->v1_pcm_flag == 0xEE && !channels_per_frame) {
|
|
VGM_LOG("EAL3 v1: PCM block in first frame\n");
|
|
goto fail; /* must know from a prev frame (can't use eaf->channels for V1a) */
|
|
}
|
|
|
|
/* read EA-frame common header (V1a PCM blocks don't have EA-frames, while V1b do) */
|
|
if (is_v1b || eaf->v1_pcm_flag == 0x00) {
|
|
ok = ealayer3_parse_frame_common(ib, eaf);
|
|
if (!ok) goto fail;
|
|
}
|
|
|
|
/* check PCM block */
|
|
if (eaf->v1_pcm_flag == 0xEE) {
|
|
fill_buf(ib, 32);
|
|
r_bits(is, 16,&eaf->v1_offset_samples); /* PCM block offset in the buffer */
|
|
r_bits(is, 16,&eaf->v1_pcm_samples); /* number of PCM samples, can be 0 */
|
|
|
|
eaf->pre_size += 2+2; /* 16b+16b */
|
|
eaf->pcm_size = (2*eaf->v1_pcm_samples * channels_per_frame);
|
|
|
|
if (is_v1b) { /* extra 32b in v1b */
|
|
fill_buf(ib, 32);
|
|
r_bits(is, 32,&eaf->v1_pcm_unknown);
|
|
|
|
eaf->pre_size += 4; /* 32b */
|
|
|
|
VGM_ASSERT(eaf->v1_pcm_unknown != 0, "EA EAL3 v1: v1_pcm_unknown not 0\n");
|
|
}
|
|
}
|
|
|
|
eaf->eaframe_size = eaf->pre_size + eaf->common_size + eaf->pcm_size;
|
|
|
|
return 1;
|
|
fail:
|
|
return 0;
|
|
}
|
|
|
|
/* read V2"PCM" and V2"Spike" EALayer3 frame (exactly the same but V2P seems to have bigger
|
|
* PCM blocks and maybe smaller frames) */
|
|
static int ealayer3_parse_frame_v2(ealayer3_buffer_t *ib, ealayer3_frame_t *eaf) {
|
|
int ok;
|
|
vgm_bitstream *is = &ib->is;
|
|
|
|
|
|
/* read EA-frame V2 header */
|
|
fill_buf(ib, 16);
|
|
r_bits(is, 1,&eaf->v2_extended_flag);
|
|
r_bits(is, 1,&eaf->v2_stereo_flag);
|
|
r_bits(is, 2,&eaf->v2_reserved);
|
|
r_bits(is, 12,&eaf->v2_frame_size);
|
|
|
|
eaf->pre_size = 2; /* 16b */
|
|
|
|
if (eaf->v2_extended_flag) {
|
|
fill_buf(ib, 32);
|
|
r_bits(is, 2,&eaf->v2_offset_mode);
|
|
r_bits(is, 10,&eaf->v2_offset_samples);
|
|
r_bits(is, 10,&eaf->v2_pcm_samples);
|
|
r_bits(is, 10,&eaf->v2_common_size);
|
|
|
|
eaf->pre_size += 4; /* 32b */
|
|
}
|
|
|
|
/* read EA-frame common header */
|
|
if (!eaf->v2_extended_flag || (eaf->v2_extended_flag && eaf->v2_common_size)) {
|
|
ok = ealayer3_parse_frame_common(ib, eaf);
|
|
if (!ok) goto fail;
|
|
}
|
|
VGM_ASSERT(eaf->v2_extended_flag && eaf->v2_common_size == 0, "EA EAL3: v2 empty frame\n"); /* seen in V2S */
|
|
VGM_ASSERT(eaf->v2_extended_flag && eaf->v2_offset_samples > 0, "EA EAL3: v2_offset_mode=%x with value=0x%x\n", eaf->v2_offset_mode, eaf->v2_offset_samples);
|
|
//VGM_ASSERT(eaf->v2_pcm_samples > 0, "EA EAL3: v2_pcm_samples 0x%x\n", eaf->v2_pcm_samples);
|
|
|
|
eaf->pcm_size = (2*eaf->v2_pcm_samples * eaf->channels);
|
|
|
|
eaf->eaframe_size = eaf->pre_size + eaf->common_size + eaf->pcm_size;
|
|
|
|
if (eaf->v2_frame_size != eaf->eaframe_size) {
|
|
VGM_LOG("EAL3: different v2 frame size vs calculated (0x%x vs 0x%x)\n", eaf->v2_frame_size, eaf->eaframe_size);
|
|
goto fail;
|
|
}
|
|
|
|
|
|
return 1;
|
|
fail:
|
|
return 0;
|
|
}
|
|
|
|
|
|
/* parses an EALayer3 frame (common part) */
|
|
static int ealayer3_parse_frame_common(ealayer3_buffer_t *ib, ealayer3_frame_t *eaf) {
|
|
/* index tables */
|
|
static const int versions[4] = { /* MPEG 2.5 */ 3, /* reserved */ -1, /* MPEG 2 */ 2, /* MPEG 1 */ 1 };
|
|
static const int sample_rates[4][4] = { /* [version_index][sample rate index] */
|
|
{ 11025, 12000, 8000, -1}, /* MPEG2.5 */
|
|
{ -1, -1, -1, -1}, /* reserved */
|
|
{ 22050, 24000, 16000, -1}, /* MPEG2 */
|
|
{ 44100, 48000, 32000, -1}, /* MPEG1 */
|
|
};
|
|
static const int channels[4] = { 2,2,2, 1 }; /* [channel_mode] */
|
|
|
|
vgm_bitstream *is = &ib->is;
|
|
off_t start_b_off = is->b_off;
|
|
int i, fill_bits, others_2_bits;
|
|
|
|
|
|
/* read main header */
|
|
fill_buf(ib, 8);
|
|
r_bits(is, 2,&eaf->version_index);
|
|
r_bits(is, 2,&eaf->sample_rate_index);
|
|
r_bits(is, 2,&eaf->channel_mode);
|
|
r_bits(is, 2,&eaf->mode_extension);
|
|
|
|
|
|
/* check empty frame */
|
|
if (eaf->version_index == 0 &&
|
|
eaf->sample_rate_index == 0 &&
|
|
eaf->channel_mode == 0 &&
|
|
eaf->mode_extension == 0) {
|
|
VGM_LOG("EAL3: empty frame\n");
|
|
goto fail;
|
|
}
|
|
|
|
|
|
/* derived */
|
|
eaf->version = versions[eaf->version_index];
|
|
eaf->channels = channels[eaf->channel_mode];
|
|
eaf->sample_rate = sample_rates[eaf->version_index][eaf->sample_rate_index];
|
|
eaf->mpeg1 = (eaf->version == 1);
|
|
|
|
if (eaf->version == -1 || eaf->sample_rate == -1) {
|
|
VGM_LOG("EAL3: illegal header values\n");
|
|
goto fail;
|
|
}
|
|
|
|
others_2_bits = eaf->mpeg1 ? 47-32 : 51-32;
|
|
|
|
/* read side info */
|
|
fill_buf(ib, 1);
|
|
r_bits(is, 1,&eaf->granule_index);
|
|
|
|
fill_bits = (eaf->mpeg1 && eaf->granule_index == 1) ? 4 * eaf->channels : 0;
|
|
fill_bits = fill_bits + (12 + 32 + others_2_bits) * eaf->channels;
|
|
fill_buf(ib, fill_bits);
|
|
|
|
if (eaf->mpeg1 && eaf->granule_index == 1) {
|
|
for (i = 0; i < eaf->channels; i++) {
|
|
r_bits(is, 4,&eaf->scfsi[i]);
|
|
}
|
|
}
|
|
|
|
for (i = 0; i < eaf->channels; i++) {
|
|
r_bits(is, 12,&eaf->main_data_size[i]);
|
|
/* divided in 47b=32+15 (MPEG1) or 51b=32+19 (MPEG2), arbitrarily */
|
|
r_bits(is, 32,&eaf->others_1[i]);
|
|
r_bits(is, others_2_bits,&eaf->others_2[i]);
|
|
}
|
|
|
|
|
|
/* derived */
|
|
eaf->data_offset_b = is->b_off; /* header size + above size */
|
|
eaf->base_size_b = (is->b_off - start_b_off); /* above size without header */
|
|
for (i = 0; i < eaf->channels; i++) {
|
|
eaf->data_size_b += eaf->main_data_size[i]; /* can be 0, meaning a micro EA-frame */
|
|
}
|
|
if ((eaf->base_size_b + eaf->data_size_b) % 8) /* aligned to closest 8b */
|
|
eaf->padding_size_b = 8 - ((eaf->base_size_b+eaf->data_size_b) % 8);
|
|
|
|
fill_buf(ib, eaf->data_size_b + eaf->padding_size_b); /* read MPEG data (not PCM block) */
|
|
is->b_off += eaf->data_size_b + eaf->padding_size_b;
|
|
|
|
eaf->common_size = (eaf->base_size_b + eaf->data_size_b + eaf->padding_size_b)/8;
|
|
|
|
return 1;
|
|
fail:
|
|
return 0;
|
|
}
|
|
|
|
|
|
/* converts an EALAYER3 frame to a standard MPEG frame from pre-parsed info */
|
|
static int ealayer3_rebuild_mpeg_frame(vgm_bitstream *is_0, ealayer3_frame_t *eaf_0, vgm_bitstream *is_1, ealayer3_frame_t *eaf_1, vgm_bitstream* os) {
|
|
uint32_t c = 0;
|
|
int i, j;
|
|
int expected_bitrate_index, expected_frame_size;
|
|
|
|
|
|
/* ignore PCM-only frames */
|
|
if (!eaf_0->common_size)
|
|
return 1;
|
|
|
|
/* extra checks */
|
|
if (eaf_0->mpeg1 && (!eaf_1
|
|
|| eaf_0->mpeg1 != eaf_1->mpeg1
|
|
|| eaf_0->version != eaf_1->version
|
|
|| eaf_0->granule_index == eaf_1->granule_index
|
|
|| !eaf_0->common_size || !eaf_1->common_size)) {
|
|
VGM_LOG("EAL3: EA-frames for MPEG1 don't match\n");
|
|
goto fail;
|
|
}
|
|
|
|
|
|
/* get bitrate: use "free format" (bigger bitrate) to avoid the need of bit reservoir
|
|
* this feature is in the spec but some decoders may not support it
|
|
* (free format detection is broken in some MP3 in mpg123 < 1.25.8 but works ok) */
|
|
expected_bitrate_index = 0x00;
|
|
if (eaf_0->mpeg1) {
|
|
expected_frame_size = 144l * (320*2) * 1000l / eaf_0->sample_rate;
|
|
} else {
|
|
expected_frame_size = 72l * (160*2) * 1000l / eaf_0->sample_rate;
|
|
}
|
|
#if 0
|
|
/* this uses max official bitrate (320/160) but some frames need more = complex bit reservoir */
|
|
expected_bitrate_index = 0x0E;
|
|
if (eaf_0->mpeg1) { /* 320: 44100=0x414, 48000=0x3C0, 32000=0x5A0 */
|
|
expected_frame_size = 144l * 320 * 1000l / eaf_0->sample_rate;
|
|
} else { /* 160: 22050=0x20A, 24000=0x1E0, 16000=0x2D0, 11025=0x414, 12000=0x3C0, 8000=0x5A0 */
|
|
expected_frame_size = 72l * 160 * 1000l / eaf_0->sample_rate;
|
|
}
|
|
#endif
|
|
|
|
/* write MPEG1/2 frame header */
|
|
w_bits(os, 11, 0x7FF); /* sync */
|
|
w_bits(os, 2, eaf_0->version_index);
|
|
w_bits(os, 2, 0x01); /* layer III index */
|
|
w_bits(os, 1, 1); /* "no CRC" flag */
|
|
w_bits(os, 4, expected_bitrate_index);
|
|
w_bits(os, 2, eaf_0->sample_rate_index);
|
|
w_bits(os, 1, 0); /* padding */
|
|
w_bits(os, 1, 0); /* private */
|
|
w_bits(os, 2, eaf_0->channel_mode);
|
|
w_bits(os, 2, eaf_0->mode_extension);
|
|
w_bits(os, 1, 1); /* copyrighted */
|
|
w_bits(os, 1, 1); /* original */
|
|
w_bits(os, 2, 0); /* emphasis */
|
|
|
|
if (eaf_0->mpeg1) {
|
|
int private_bits = (eaf_0->channels==1 ? 5 : 3);
|
|
|
|
/* write MPEG1 side info */
|
|
w_bits(os, 9, 0); /* main data start (no bit reservoir) */
|
|
w_bits(os, private_bits, 0);
|
|
|
|
for (i = 0; i < eaf_1->channels; i++) {
|
|
w_bits(os, 4, eaf_1->scfsi[i]); /* saved in granule1 only */
|
|
}
|
|
for (i = 0; i < eaf_0->channels; i++) { /* granule0 */
|
|
w_bits(os, 12, eaf_0->main_data_size[i]);
|
|
w_bits(os, 32, eaf_0->others_1[i]);
|
|
w_bits(os, 47-32, eaf_0->others_2[i]);
|
|
}
|
|
for (i = 0; i < eaf_1->channels; i++) { /* granule1 */
|
|
w_bits(os, 12, eaf_1->main_data_size[i]);
|
|
w_bits(os, 32, eaf_1->others_1[i]);
|
|
w_bits(os, 47-32, eaf_1->others_2[i]);
|
|
}
|
|
|
|
/* write MPEG1 main data */
|
|
is_0->b_off = eaf_0->data_offset_b;
|
|
for (i = 0; i < eaf_0->channels; i++) { /* granule0 */
|
|
for (j = 0; j < eaf_0->main_data_size[i]; j++) {
|
|
r_bits(is_0, 1, &c);
|
|
w_bits(os, 1, c);
|
|
}
|
|
}
|
|
|
|
is_1->b_off = eaf_1->data_offset_b;
|
|
for (i = 0; i < eaf_1->channels; i++) { /* granule1 */
|
|
for (j = 0; j < eaf_1->main_data_size[i]; j++) {
|
|
r_bits(is_1, 1, &c);
|
|
w_bits(os, 1, c);
|
|
}
|
|
}
|
|
}
|
|
else {
|
|
int private_bits = (eaf_0->channels==1 ? 1 : 2);
|
|
|
|
/* write MPEG2 side info */
|
|
w_bits(os, 8, 0); /* main data start (no bit reservoir) */
|
|
w_bits(os, private_bits, 0);
|
|
|
|
for (i = 0; i < eaf_0->channels; i++) {
|
|
w_bits(os, 12, eaf_0->main_data_size[i]);
|
|
w_bits(os, 32, eaf_0->others_1[i]);
|
|
w_bits(os, 51-32, eaf_0->others_2[i]);
|
|
}
|
|
|
|
/* write MPEG2 main data */
|
|
is_0->b_off = eaf_0->data_offset_b;
|
|
for (i = 0; i < eaf_0->channels; i++) {
|
|
for (j = 0; j < eaf_0->main_data_size[i]; j++) {
|
|
r_bits(is_0, 1, &c);
|
|
w_bits(os, 1, c);
|
|
}
|
|
}
|
|
}
|
|
|
|
/* align to closest 8b */
|
|
if (os->b_off % 8) {
|
|
int align_bits = 8 - (os->b_off % 8);
|
|
w_bits(os, align_bits, 0);
|
|
}
|
|
|
|
|
|
if (os->b_off/8 > expected_frame_size) {
|
|
/* bit reservoir! shouldn't happen with free bitrate, otherwise it's hard to fix as needs complex buffering/calcs */
|
|
VGM_LOG("EAL3: written 0x%x but expected less than 0x%x\n", (uint32_t)(os->b_off/8), expected_frame_size);
|
|
}
|
|
else {
|
|
/* fill ancillary data (should be ignored, but 0x00 seems to improve mpg123's free bitrate detection) */
|
|
memset(os->buf + os->b_off/8, 0x00, expected_frame_size - os->b_off/8);
|
|
}
|
|
|
|
os->b_off = expected_frame_size*8;
|
|
|
|
|
|
return 1;
|
|
fail:
|
|
return 0;
|
|
}
|
|
|
|
static void ealayer3_copy_pcm_block(uint8_t* outbuf, off_t pcm_offset, int pcm_number, int channels_per_frame, int is_packed, STREAMFILE *sf) {
|
|
int i, ch;
|
|
uint8_t pcm_block[1152 * 2 * 2]; /* assumed max: 1 MPEG frame samples * 16b * max channels */
|
|
size_t pcm_size = pcm_number * 2 * channels_per_frame;
|
|
size_t bytes;
|
|
|
|
if (pcm_number == 0)
|
|
return;
|
|
|
|
if (pcm_number > 1152) {
|
|
VGM_LOG("EAL3: big PCM block of %i samples\n", pcm_number);
|
|
return;
|
|
}
|
|
|
|
bytes = read_streamfile(pcm_block, pcm_offset, pcm_size, sf);
|
|
if (bytes != pcm_size) {
|
|
VGM_LOG("EAL3: incorrect pcm_number %i at %lx\n", pcm_number, pcm_offset);
|
|
return;
|
|
}
|
|
|
|
//;VGM_LOG("copy PCM at %lx + %i\n", pcm_offset, pcm_number);
|
|
|
|
/* read + write PCM block samples (always BE) */
|
|
if (is_packed) {
|
|
/* ch0+ch1 packed together */
|
|
int pos = 0;
|
|
for (i = 0; i < pcm_number * channels_per_frame; i++) {
|
|
int16_t pcm_sample = get_s16be(pcm_block + pos);
|
|
put_16bitLE(outbuf + pos, pcm_sample);
|
|
|
|
pos += sizeof(sample);
|
|
}
|
|
}
|
|
else {
|
|
/* all of ch0 first, then all of ch1 (EAL3 v1b only) */
|
|
int get_pos = 0;
|
|
for (ch = 0; ch < channels_per_frame; ch++) {
|
|
int put_pos = sizeof(sample) * ch;
|
|
for (i = 0; i < pcm_number; i++) {
|
|
int16_t pcm_sample = get_s16be(pcm_block + get_pos);
|
|
put_16bitLE(outbuf + put_pos, pcm_sample);
|
|
|
|
get_pos += sizeof(sample);
|
|
put_pos += sizeof(sample) * channels_per_frame;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
/* write PCM block directly to sample buffer and setup decode discard (EALayer3 seems to use this as a prefetch of sorts).
|
|
* Seems to alter decoded sample buffer to handle encoder delay/padding in a twisted way. */
|
|
static int ealayer3_write_pcm_block(VGMSTREAMCHANNEL *stream, mpeg_codec_data *data, int num_stream, ealayer3_frame_t *eaf) {
|
|
mpeg_custom_stream *ms = data->streams[num_stream];
|
|
int channels_per_frame = ms->channels_per_frame;
|
|
size_t bytes_filled;
|
|
|
|
|
|
bytes_filled = sizeof(sample) * ms->samples_filled * channels_per_frame;
|
|
if (bytes_filled + eaf->pcm_size > ms->output_buffer_size) {
|
|
VGM_LOG("EAL3: can't fill the sample buffer with 0x%x\n", eaf->pcm_size);
|
|
goto fail;
|
|
}
|
|
|
|
if (eaf->v1_pcm_samples && !eaf->pcm_size) {
|
|
VGM_LOG("EAL3: pcm_size without pcm_samples\n");
|
|
goto fail;
|
|
}
|
|
|
|
if (eaf->v1_pcm_samples || eaf->v1_offset_samples) {
|
|
uint8_t* outbuf = ms->output_buffer + bytes_filled;
|
|
off_t pcm_offset = stream->offset + eaf->pre_size + eaf->common_size;
|
|
size_t decode_to_discard;
|
|
|
|
VGM_ASSERT(eaf->v1_offset_samples > 576, "EAL3: big discard %i at 0x%x\n", eaf->v1_offset_samples, (uint32_t)stream->offset);
|
|
VGM_ASSERT(eaf->v1_pcm_samples > 0x100, "EAL3: big samples %i at 0x%x\n", eaf->v1_pcm_samples, (uint32_t)stream->offset);
|
|
VGM_ASSERT(eaf->v1_offset_samples > 0 && eaf->v1_pcm_samples == 0, "EAL3: offset_samples without pcm_samples\n"); /* not seen but could work */
|
|
|
|
//;VGM_LOG("EA EAL3 v1: offset=%lx + %x, offset_samples=%x, pcm_samples=%i, spf=%i\n",
|
|
// stream->offset, eaf->pre_size + eaf->common_size, eaf->v1_offset_samples, eaf->v1_pcm_samples, data->samples_per_frame);
|
|
|
|
/* V1b PCM block is in 'planar' format (ex. NFS:U PS3) */
|
|
ealayer3_copy_pcm_block(outbuf, pcm_offset, eaf->v1_pcm_samples, channels_per_frame, (data->type == MPEG_EAL31), stream->streamfile);
|
|
ms->samples_filled += eaf->v1_pcm_samples;
|
|
|
|
//TODO: we should put samples at offset but most EAL3 use it at first frame, which decodes ok, and rarely
|
|
// in the last frame [ex. Celebrity Sports Showdown], which is ~60-80 samples off (could click on segments?)
|
|
|
|
/* v1_offset_samples in V1a controls how the PCM block goes in the sample buffer. Value seems to start
|
|
* from frame samples end, taking into account that 1st frame discards 576+529 samples.
|
|
* ex. with 47 samples:
|
|
* - offset 47 puts block at sample 0 (at 576*2-47 w/o 576+529 discard),
|
|
* - offset 63 puts block at sample -16 (only 31 samples visible, so 576*2-63 w/o discard),
|
|
* - offset 0 seems to cause sample buffer overrun (at 576*2-0 = outside single frame buffer?)
|
|
* In V1b seems to works similarly but offset looks adjusted after initial discard (so offset 0 for first frame)
|
|
*
|
|
* This behaviour matters most in looping sfx (ex. Burnout Paradise), or tracks that start
|
|
* without silence (ex. NFS:UG2), and NFS:UC PS3 (EAL3v1b) vs PC (EAXAS) gets correct waveform this way */
|
|
decode_to_discard = eaf->v1_pcm_samples;
|
|
ms->decode_to_discard += decode_to_discard;
|
|
}
|
|
|
|
if (eaf->v2_extended_flag) {
|
|
uint8_t* outbuf = ms->output_buffer + bytes_filled;
|
|
off_t pcm_offset = stream->offset + eaf->pre_size + eaf->common_size;
|
|
size_t usable_samples, decode_to_discard;
|
|
|
|
/* V2P usually only copies big PCM, while V2S discards then copies few samples (similar to V1b).
|
|
* Unlike V1b, both modes seem to use 'packed' PCM block */
|
|
ealayer3_copy_pcm_block(outbuf, pcm_offset, eaf->v2_pcm_samples, channels_per_frame, 1, stream->streamfile);
|
|
ms->samples_filled += eaf->v2_pcm_samples;
|
|
|
|
//;VGM_LOG("EA EAL3 v2: off=%lx, mode=%x, value=%i, pcm=%i, c-size=%x, pcm_o=%lx\n",
|
|
// stream->offset, eaf->v2_offset_mode, eaf->v2_offset_samples, eaf->v2_pcm_samples, eaf->v2_common_size, pcm_offset);
|
|
|
|
//todo improve how discarding works since there could exists a subtle-but-unlikely PCM+granule usage
|
|
//todo test other modes (only seen IGNORE)
|
|
|
|
/* get how many samples we can use in this granule + pcm block (thus how many we can't) */
|
|
if (eaf->v2_offset_mode == 0x00) { /* IGNORE (looks correct in V2P loops, ex. NFS:W) */
|
|
/* offset_samples is usually 0 in V2P (no discard), varies in V2S and may be 576 (full discard).
|
|
* If block has pcm_samples then usable_samples will be at least that value (for all known files),
|
|
* and is assumed PCM isn't discarded so only discards the decoded granule. */
|
|
usable_samples = 576 - eaf->v2_offset_samples;
|
|
if (eaf->common_size == 0)
|
|
usable_samples = eaf->v2_pcm_samples;
|
|
|
|
if (usable_samples == eaf->v2_pcm_samples) {
|
|
decode_to_discard = 576;
|
|
}
|
|
else {
|
|
VGM_LOG("EAL3: unknown discard\n");
|
|
decode_to_discard = 0;
|
|
}
|
|
}
|
|
else if (eaf->v2_offset_mode == 0x01) { /* PRESERVE */
|
|
usable_samples = 576;
|
|
if (eaf->common_size == 0)
|
|
usable_samples = eaf->v2_pcm_samples;
|
|
decode_to_discard = 0; /* all preserved */
|
|
}
|
|
else if (eaf->v2_offset_mode == 0x02) { /* MUTE */
|
|
usable_samples = 576;
|
|
if (eaf->common_size == 0)
|
|
usable_samples = eaf->v2_pcm_samples * 2; // why 2?
|
|
decode_to_discard = 0; /* not discarded but muted */
|
|
//mute_samples = eaf->v2_offset_samples; //todo must 0 first N decoded samples
|
|
}
|
|
else {
|
|
VGM_LOG("EAL3: unknown mode\n"); /* not defined */
|
|
usable_samples = 576;
|
|
decode_to_discard = 0;
|
|
}
|
|
|
|
ms->decode_to_discard += decode_to_discard;
|
|
}
|
|
|
|
return 1;
|
|
fail:
|
|
return 0;
|
|
}
|
|
|
|
|
|
//TODO: this causes lots of rebuffering/slowness in multichannel since each stream has to read back
|
|
// (frames are interleaved like s0_g0, s1_g0, s2_g0, s0_g1, s1_g1, s2_g1, ...,
|
|
// stream0 advances buffers to s0_g1, but stream1 needs to read back to s1_g0, often trashing custom IO)
|
|
// would need to store granule0 after reading but not decoding until next?
|
|
|
|
/* Skip EA-frames from other streams for .sns/sps multichannel (interleaved 1 EA-frame per stream).
|
|
* Due to EALayer3 being in blocks and other complexities (we can't go past a block) all
|
|
* streams's offsets should start in the first stream's EA-frame.
|
|
*
|
|
* So to properly read one MPEG-frame from a stream we need to:
|
|
* - skip one EA-frame per previous streams until offset is in current stream's EA-frame
|
|
* (ie. 1st stream skips 0, 2nd stream skips 1, 3rd stream skips 2)
|
|
* - read EA-frame (granule0)
|
|
* - skip one EA-frame per following streams until offset is in first stream's EA-frame
|
|
* (ie. 1st stream skips 2, 2nd stream skips 1, 3rd stream skips 0)
|
|
* - repeat again for granule1
|
|
*
|
|
* EALayer3 v1 in SCHl uses external offsets and 1ch multichannel instead.
|
|
*/
|
|
static int ealayer3_skip_data(VGMSTREAMCHANNEL *stream, mpeg_codec_data *data, int num_stream, int at_start) {
|
|
int ok, i;
|
|
ealayer3_buffer_t ib = {0};
|
|
ealayer3_frame_t eaf;
|
|
int skips = at_start ? num_stream : data->streams_size - 1 - num_stream;
|
|
|
|
/* v1 does multichannel with set offsets */
|
|
if (data->type == MPEG_EAL31)
|
|
return 1;
|
|
|
|
for (i = 0; i < skips; i++) {
|
|
ib.sf = stream->streamfile;
|
|
ib.offset = stream->offset;
|
|
ib.is.buf = ib.buf;
|
|
|
|
ok = ealayer3_parse_frame(data, num_stream, &ib, &eaf);
|
|
if (!ok) goto fail;
|
|
|
|
stream->offset += eaf.eaframe_size;
|
|
//;VGM_LOG("s%i-%i: skipping %x, now at %lx\n", num_stream,i,eaf.eaframe_size,stream->offset);
|
|
}
|
|
//;VGM_LOG("s%i: skipped %i frames, now at %lx\n", num_stream,skips,stream->offset);
|
|
|
|
return 1;
|
|
fail:
|
|
return 0;
|
|
}
|
|
|
|
static int ealayer3_is_empty_frame_v2p(STREAMFILE *sf, off_t offset) {
|
|
/* V2P frame header should contain a valid frame size (lower 12b) */
|
|
uint16_t v2_header = read_u16be(offset, sf);
|
|
return (v2_header % 0xFFF) == 0 || v2_header == 0xFFFF;
|
|
}
|
|
|
|
#endif
|