#include "coding.h" #include "../util.h" #include "../vgmstream.h" #ifdef VGM_USE_MPEG #include #define AHX_EXPECTED_FRAME_SIZE 0x414 #define MPEG_DEFAULT_BUFFER_SIZE 0x1000 /* should be >= AHX_EXPECTED_FRAME_SIZE */ #define MPEG_SYNC_BITS 0xFFE00000 #define MPEG_PADDING_BIT 0x200 static mpeg_codec_data *init_mpeg_codec_data_internal(STREAMFILE *streamfile, off_t start_offset, long given_sample_rate, int given_channels, coding_t *coding_type, int * actual_sample_rate, int * actual_channels, int interleaved, int fixed_frame_size, int fsb_padding); static mpg123_handle * init_mpg123_handle(); static void decode_mpeg_default(VGMSTREAMCHANNEL *stream, mpeg_codec_data * data, sample * outbuf, int32_t samples_to_do, int channels); static void decode_mpeg_interleave(VGMSTREAM * vgmstream, mpeg_codec_data * data, sample * outbuf, int32_t samples_to_do, int channels); static void decode_mpeg_interleave_samples(VGMSTREAMCHANNEL *stream, mpeg_codec_data * data, mpg123_handle *m, int channels, int num_stream, size_t block_size); static void update_frame_sizes(mpeg_codec_data * data, VGMSTREAMCHANNEL *stream); static void update_base_frame_sizes(mpeg_codec_data * data, STREAMFILE *streamFile, off_t start_offset, int fixed_frame_size, int current_frame_size, int fsb_padding); /** * Inits regular MPEG. */ mpeg_codec_data *init_mpeg_codec_data(STREAMFILE *streamfile, off_t start_offset, long given_sample_rate, int given_channels, coding_t *coding_type, int * actual_sample_rate, int * actual_channels) { return init_mpeg_codec_data_internal(streamfile, start_offset, given_sample_rate, given_channels, coding_type, actual_sample_rate, actual_channels, 0, 0, 0); } /** * Init interleaved MPEG. */ mpeg_codec_data *init_mpeg_codec_data_interleaved(STREAMFILE *streamfile, off_t start_offset, coding_t *coding_type, int channels, int fixed_frame_size, int fsb_padding) { return init_mpeg_codec_data_internal(streamfile, start_offset, -1, channels, coding_type, NULL, NULL, 1, fixed_frame_size, fsb_padding); } static mpeg_codec_data *init_mpeg_codec_data_internal(STREAMFILE *streamfile, off_t start_offset, long given_sample_rate, int given_channels, coding_t *coding_type, int * actual_sample_rate, int * actual_channels, int interleaved, int fixed_frame_size, int fsb_padding) { mpeg_codec_data *data = NULL; int current_frame_size = 0; /* init codec */ data = calloc(1,sizeof(mpeg_codec_data)); if (!data) goto fail; data->buffer_size = MPEG_DEFAULT_BUFFER_SIZE; data->buffer = calloc(sizeof(uint8_t), data->buffer_size); if (!data->buffer) goto fail; data->m = init_mpg123_handle(); if (!data->m) goto fail; /* check format */ { mpg123_handle *main_m = data->m; off_t read_offset = 0; int rc; long sample_rate_per_frame; int channels_per_frame, encoding; size_t samples_per_frame; struct mpg123_frameinfo mi; /* read first frame(s) */ do { size_t bytes_done; if (read_streamfile(data->buffer, start_offset+read_offset, data->buffer_size, streamfile) != data->buffer_size) goto fail; read_offset+=1; rc = mpg123_decode(main_m, data->buffer,data->buffer_size, NULL,0, &bytes_done); if (rc != MPG123_OK && rc != MPG123_NEW_FORMAT && rc != MPG123_NEED_MORE) goto fail; //todo handle MPG123_DONE } while (rc != MPG123_NEW_FORMAT); /* check first frame header and validate */ rc = mpg123_getformat(main_m,&sample_rate_per_frame,&channels_per_frame,&encoding); if (rc != MPG123_OK) goto fail; mpg123_info(main_m,&mi); if (encoding != MPG123_ENC_SIGNED_16) goto fail; if (sample_rate_per_frame != mi.rate) goto fail; if ((given_sample_rate != -1 && sample_rate_per_frame != given_sample_rate && !interleaved) || (given_channels != -1 && channels_per_frame != given_channels && !interleaved)) goto fail; if (mi.version == MPG123_1_0 && mi.layer == 1) *coding_type = coding_MPEG1_L1; else if (mi.version == MPG123_1_0 && mi.layer == 2) *coding_type = coding_MPEG1_L2; else if (mi.version == MPG123_1_0 && mi.layer == 3) *coding_type = coding_MPEG1_L3; else if (mi.version == MPG123_2_0 && mi.layer == 1) *coding_type = coding_MPEG2_L1; else if (mi.version == MPG123_2_0 && mi.layer == 2) *coding_type = coding_MPEG2_L2; else if (mi.version == MPG123_2_0 && mi.layer == 3) *coding_type = coding_MPEG2_L3; else if (mi.version == MPG123_2_5 && mi.layer == 1) *coding_type = coding_MPEG25_L1; else if (mi.version == MPG123_2_5 && mi.layer == 2) *coding_type = coding_MPEG25_L2; else if (mi.version == MPG123_2_5 && mi.layer == 3) *coding_type = coding_MPEG25_L3; else goto fail; if (mi.layer == 1) samples_per_frame = 384; else if (mi.layer == 2) samples_per_frame = 1152; else if (mi.layer == 3 && mi.version == MPG123_1_0) //MP3 samples_per_frame = 1152; else if (mi.layer == 3) samples_per_frame = 576; else goto fail; data->sample_rate_per_frame = sample_rate_per_frame; data->channels_per_frame = channels_per_frame; data->samples_per_frame = samples_per_frame; /* unlikely (can fixed with bigger buffer or a feed loop) */ if (mi.framesize > data->buffer_size) goto fail; current_frame_size = mi.framesize; /* reinit, to ignore the reading we've done so far */ mpg123_open_feed(main_m); } /* Init interleaved audio, which needs separate decoders per stream and frame size stuff. * We still leave data->m as a "base" info/format to simplify some stuff (could be improved) */ if (interleaved) { int i; data->interleaved = interleaved; if (given_channels < 1 || given_channels > 32) goto fail; /* arbitrary max */ if (given_channels < data->channels_per_frame) goto fail; update_base_frame_sizes(data, streamfile, start_offset, fixed_frame_size, current_frame_size, fsb_padding); if (!data->base_frame_size) goto fail; data->ms_size = given_channels / data->channels_per_frame; data->ms = calloc(sizeof(mpg123_handle *), data->ms_size); for (i=0; i < data->ms_size; i++) { data->ms[i] = init_mpg123_handle(); if (!data->ms[i]) goto fail; } data->frame_buffer_size = sizeof(sample) * data->samples_per_frame * data->channels_per_frame; data->frame_buffer = calloc(sizeof(uint8_t), data->frame_buffer_size); if (!data->frame_buffer) goto fail; data->interleave_buffer_size = sizeof(sample) * data->samples_per_frame * given_channels; data->interleave_buffer = calloc(sizeof(uint8_t), data->interleave_buffer_size); if (!data->interleave_buffer) goto fail; } return data; fail: free_mpeg(data); return NULL; } /** * Inits MPEG for AHX, which ignores frame headers. */ mpeg_codec_data *init_mpeg_codec_data_ahx(STREAMFILE *streamFile, off_t start_offset, int channel_count) { mpeg_codec_data *data = NULL; /* init codec */ data = calloc(1,sizeof(mpeg_codec_data)); if (!data) goto fail; data->buffer_size = MPEG_DEFAULT_BUFFER_SIZE; data->buffer = calloc(sizeof(uint8_t), data->buffer_size); if (!data->buffer) goto fail; data->m = init_mpg123_handle(); if (!data->m) goto fail; return data; fail: free_mpeg(data); return NULL; } static mpg123_handle * init_mpg123_handle() { mpg123_handle *m = NULL; int rc; /* inits a new mpg123 handle */ m = mpg123_new(NULL,&rc); if (rc == MPG123_NOT_INITIALIZED) { /* inits the library if needed */ if (mpg123_init() != MPG123_OK) goto fail; m = mpg123_new(NULL,&rc); if (rc != MPG123_OK) goto fail; } else if (rc != MPG123_OK) { goto fail; } mpg123_param(m,MPG123_REMOVE_FLAGS,MPG123_GAPLESS,0.0); //todo fix gapless mpg123_param(m,MPG123_RESYNC_LIMIT, -1, 0x10000); /* should be enough */ if (mpg123_open_feed(m) != MPG123_OK) { goto fail; } return m; fail: mpg123_delete(m); return NULL; } /************/ /* DECODERS */ /************/ void decode_mpeg(VGMSTREAM * vgmstream, sample * outbuf, int32_t samples_to_do, int channels) { mpeg_codec_data * data = (mpeg_codec_data *) vgmstream->codec_data; /* MPEGs streams contain one or two channels, so we may only need half VGMSTREAMCHANNELs for offsets */ if (data->interleaved) { decode_mpeg_interleave(vgmstream, data, outbuf, samples_to_do, channels); } else { decode_mpeg_default(&vgmstream->ch[0], data, outbuf, samples_to_do, channels); } } /** * Decode anything mpg123 can. * Feeds raw data and extracts decoded samples as needed. */ static void decode_mpeg_default(VGMSTREAMCHANNEL *stream, mpeg_codec_data * data, sample * outbuf, int32_t samples_to_do, int channels) { int samples_done = 0; mpg123_handle *m = data->m; while (samples_done < samples_to_do) { size_t bytes_done; int rc; /* read more raw data */ if (!data->buffer_full) { data->bytes_in_buffer = read_streamfile(data->buffer,stream->offset,data->buffer_size,stream->streamfile); /* end of stream, fill rest with 0s */ if (!data->bytes_in_buffer) { memset(outbuf + samples_done * channels, 0, (samples_to_do - samples_done) * sizeof(sample)); break; } data->buffer_full = 1; data->buffer_used = 0; stream->offset += data->bytes_in_buffer; } /* feed new raw data to the decoder if needed, copy decoded results to output */ if (!data->buffer_used) { rc = mpg123_decode(m, data->buffer,data->bytes_in_buffer, (unsigned char *)(outbuf+samples_done*channels), (samples_to_do-samples_done)*sizeof(sample)*channels, &bytes_done); data->buffer_used = 1; } else { rc = mpg123_decode(m, NULL,0, (unsigned char *)(outbuf+samples_done*channels), (samples_to_do-samples_done)*sizeof(sample)*channels, &bytes_done); } /* not enough raw data, request more */ if (rc == MPG123_NEED_MORE) { data->buffer_full = 0; } /* update copied samples */ samples_done += bytes_done/sizeof(sample)/channels; } } /** * Decode interleaved (multichannel) MPEG. Works with mono/stereo too. * Channels (1 or 2), samples and frame size per stream should be constant. //todo extra validations * * Reads frame 'streams' (ex. 4ch = 1+1+1+1 = 4 streams or 2+2 = 2 streams), decodes * samples per stream and muxes them into a single internal buffer before copying to outbuf * (to make sure channel samples are orderly copied between decode_mpeg calls). * * Interleave variations: * - blocks of frames: fixed block_size per stream (unknown number of samples) [XVAG] * (ex. b1 = N samples of ch1, b2 = N samples of ch2, b3 = M samples of ch1, etc) * - partial frames: single frames per stream with padding (block_size is frame_size+padding) [FSB] * (ex. f1+f3+f5 = 1152*2 samples of ch1+2, f2+f4 = 1152*2 samples of ch3+4, etc) */ static void decode_mpeg_interleave(VGMSTREAM * vgmstream, mpeg_codec_data * data, sample * outbuf, int32_t samples_to_do, int channels) { int samples_done = 0, bytes_max, bytes_to_copy; while (samples_done < samples_to_do) { if (data->bytes_used_in_interleave_buffer < data->bytes_in_interleave_buffer) { /* copy remaining samples */ bytes_to_copy = data->bytes_in_interleave_buffer - data->bytes_used_in_interleave_buffer; bytes_max = (samples_to_do - samples_done) * sizeof(sample) * channels; if (bytes_to_copy > bytes_max) bytes_to_copy = bytes_max; memcpy((uint8_t*)(outbuf+samples_done*channels), data->interleave_buffer + data->bytes_used_in_interleave_buffer, bytes_to_copy); /* update samples copied */ data->bytes_used_in_interleave_buffer += bytes_to_copy; samples_done += bytes_to_copy / sizeof(sample) / channels; } else { /* fill the internal sample buffer */ int i; data->bytes_in_interleave_buffer = 0; data->bytes_used_in_interleave_buffer = 0; for (i=0; i < data->ms_size; i++) { decode_mpeg_interleave_samples(&vgmstream->ch[i], data, data->ms[i], channels, i, vgmstream->interleave_block_size); } } } } /** * Decodes frames from a stream and muxes the samples into a intermediate buffer. * Skips to the next interleaved block once reaching the stream's block end. */ static void decode_mpeg_interleave_samples(VGMSTREAMCHANNEL *stream, mpeg_codec_data * data, mpg123_handle *m, int channels, int num_stream, size_t block_size) { size_t bytes_done; /* decode samples from 1 full frame */ do { int rc; /* padded frame stuff */ update_frame_sizes(data, stream); /* read more raw data (only 1 frame, to check interleave block end) */ if (!data->buffer_full) { data->bytes_in_buffer = read_streamfile(data->buffer,stream->offset,data->current_frame_size,stream->streamfile); /* end of stream, fill frame buffer with 0s but continue normally with other streams */ if (!data->bytes_in_buffer) { memset(data->frame_buffer, 0, data->frame_buffer_size); bytes_done = data->frame_buffer_size; break; } data->buffer_full = 1; data->buffer_used = 0; stream->offset += data->current_frame_size + data->current_padding; /* skip FSB frame+garbage */ if (block_size && ((stream->offset - stream->channel_start_offset) % block_size==0)) { stream->offset += block_size * (data->ms_size-1); /* skip a block per stream if block done */ } } /* feed new raw data to the decoder if needed, copy decoded results to frame buffer output */ if (!data->buffer_used) { rc = mpg123_decode(m, data->buffer, data->bytes_in_buffer, (unsigned char *)data->frame_buffer, data->frame_buffer_size, &bytes_done); data->buffer_used = 1; } else { rc = mpg123_decode(m, NULL,0, (unsigned char *)data->frame_buffer, data->frame_buffer_size, &bytes_done); } /* samples per frame should be constant... */ if (bytes_done > 0 && bytes_done < data->frame_buffer_size) { VGM_LOG("borked frame: %i bytes done, expected %i, rc=%i\n", bytes_done, data->frame_buffer_size, rc); memset(data->frame_buffer + bytes_done, 0, data->frame_buffer_size - bytes_done); bytes_done = data->frame_buffer_size; } /* not enough raw data, request more */ if (rc == MPG123_NEED_MORE) { data->buffer_full = 0; continue; } break; } while (1); /* copy decoded frame to intermediate sample buffer, muxing channels * (ex stream1: ch1s1 ch1s2, stream2: ch2s1 ch2s2 > ch1s1 ch2s1 ch1s2 ch2s2) */ { size_t samples_done; size_t sz = sizeof(sample); int channels_f = data->channels_per_frame; int fch, i; samples_done = bytes_done / sz / channels_f; for (fch = 0; fch < channels_f; fch++) { /* channels inside the frame */ for (i = 0; i < samples_done; i++) { /* decoded samples */ off_t in_offset = sz*i*channels_f + sz*fch; off_t out_offset = sz*i*channels + sz*(num_stream*channels_f + fch); memcpy(data->interleave_buffer + out_offset, data->frame_buffer + in_offset, sz); } } data->bytes_in_interleave_buffer += bytes_done; } } /** * Very Clunky Stuff for FSBs of varying padding sizes per frame. * Padding sometimes contains next frame header so we can't feed it to mpg123 or it gets confused. * Expected to be called at the beginning of a new frame. */ static void update_frame_sizes(mpeg_codec_data * data, VGMSTREAMCHANNEL *stream) { if (!data->fixed_frame_size) { /* Manually fix frame size. Not ideal but mpg123_info.framesize is weird. */ uint32_t header = (uint32_t)read_32bitBE(stream->offset, stream->streamfile); if (header & MPEG_SYNC_BITS) data->current_frame_size = data->base_frame_size + (header & MPEG_PADDING_BIT ? 1 : 0); else data->current_frame_size = 0; /* todo skip invalid frame? */ if (data->fsb_padding) //todo not always ok data->current_padding = (data->current_frame_size % data->fsb_padding) ? data->fsb_padding - (data->current_frame_size % data->fsb_padding) : 0; } } static void update_base_frame_sizes(mpeg_codec_data * data, STREAMFILE *streamFile, off_t start_offset, int fixed_frame_size, int current_frame_size, int fsb_padding) { if (fixed_frame_size) { data->fixed_frame_size = fixed_frame_size; data->base_frame_size = data->fixed_frame_size; data->current_frame_size = data->fixed_frame_size; } else { /* adjust sizes in the first frame */ //todo: sometimes mpg123_info.framesize is not correct, manually calculate? (Xing headers?) uint32_t header = (uint32_t)read_32bitBE(start_offset, streamFile); if (header & MPEG_SYNC_BITS) data->base_frame_size = current_frame_size - (header & MPEG_PADDING_BIT ? 1 : 0); else data->base_frame_size = 0; /* todo skip invalid frame? */ data->current_frame_size = current_frame_size; data->fsb_padding = fsb_padding; if (data->fsb_padding) //todo not always ok data->current_padding = (data->current_frame_size % data->fsb_padding) ? data->fsb_padding - (data->current_frame_size % data->fsb_padding) : 0; } } /** * Decode AHX mono frames. * mpg123 expects frames of 0x414 (160kbps, 22050Hz) but they actually vary and are much shorter */ void decode_fake_mpeg2_l2(VGMSTREAMCHANNEL *stream, mpeg_codec_data * data, sample * outbuf, int32_t samples_to_do) { int samples_done = 0; const int frame_size = AHX_EXPECTED_FRAME_SIZE; mpg123_handle *m = data->m; while (samples_done < samples_to_do) { size_t bytes_done; int rc; /* read more raw data */ if (!data->buffer_full) { /* fill buffer up to next frame ending (or file ending) */ int bytes_into_header = 0; const uint8_t header[4] = {0xff,0xf5,0xe0,0xc0}; off_t frame_offset = 0; /* assume that we are starting at a header, skip it and look for the next one */ read_streamfile(data->buffer, stream->offset+frame_offset, 4, stream->streamfile); frame_offset += 4; do { uint8_t byte; byte = read_8bit(stream->offset+frame_offset,stream->streamfile); data->buffer[frame_offset] = byte; frame_offset++; if (byte == header[bytes_into_header]) { bytes_into_header++; } else { /* This might have been the first byte of the header, so * we need to check again. * No need to get more complicated than this, though, since * there are no repeated characters in the search string. */ if (bytes_into_header>0) { frame_offset--; } bytes_into_header=0; } if (bytes_into_header==4) { break; } } while (frame_offset < frame_size); if (bytes_into_header==4) frame_offset-=4; memset(data->buffer+frame_offset,0,frame_size-frame_offset); data->buffer_full = 1; data->buffer_used = 0; stream->offset += frame_offset; } /* feed new raw data to the decoder if needed, copy decodec results to output */ if (!data->buffer_used) { rc = mpg123_decode(m, data->buffer,frame_size, (unsigned char *)(outbuf+samples_done), (samples_to_do-samples_done)*sizeof(sample), &bytes_done); data->buffer_used = 1; } else { rc = mpg123_decode(m, NULL,0, (unsigned char *)(outbuf+samples_done), (samples_to_do-samples_done)*sizeof(sample), &bytes_done); } /* not enough raw data, request more */ if (rc == MPG123_NEED_MORE) { data->buffer_full = 0; } /* update copied samples */ samples_done += bytes_done/sizeof(sample);/* mono */ } } /*********/ /* UTILS */ /*********/ void free_mpeg(mpeg_codec_data *data) { if (!data) return; mpg123_delete(data->m); if (data->interleaved) { int i; for (i=0; i < data->ms_size; i++) { mpg123_delete(data->ms[i]); } free(data->ms); free(data->interleave_buffer); free(data->frame_buffer); } free(data->buffer); free(data); /* The astute reader will note that a call to mpg123_exit is never * made. While is is evilly breaking our contract with mpg123, it * doesn't actually do anything except set the "initialized" flag * to 0. And if we exit we run the risk of turning it off when * someone else in another thread is using it. */ } void reset_mpeg(VGMSTREAM *vgmstream) { off_t input_offset; mpeg_codec_data *data = vgmstream->codec_data; /* input_offset is ignored as we can assume it will be 0 for a seek to sample 0 */ mpg123_feedseek(data->m,0,SEEK_SET,&input_offset); /* reset multistream */ //todo check if stream offsets are properly reset if (data->interleaved) { int i; for (i=0; i < data->ms_size; i++) { mpg123_feedseek(data->ms[i],0,SEEK_SET,&input_offset); vgmstream->loop_ch[i].offset = vgmstream->loop_ch[i].channel_start_offset + input_offset; } data->bytes_in_interleave_buffer = 0; data->bytes_used_in_interleave_buffer = 0; } } void seek_mpeg(VGMSTREAM *vgmstream, int32_t num_sample) { /* won't work for fake or multistream MPEG */ off_t input_offset; mpeg_codec_data *data = vgmstream->codec_data; /* seek multistream */ if (!data->interleaved) { mpg123_feedseek(data->m, num_sample,SEEK_SET,&input_offset); vgmstream->loop_ch[0].offset = vgmstream->loop_ch[0].channel_start_offset + input_offset; } else { int i; /* re-start from 0 */ for (i=0; i < data->ms_size; i++) { mpg123_feedseek(data->ms[i],0,SEEK_SET,&input_offset); vgmstream->loop_ch[i].offset = vgmstream->loop_ch[i].channel_start_offset; } /* manually add skip samples, since we don't really know the correct offset */ //todo call decode with samples_to_do and fake header data->bytes_in_interleave_buffer = 0; data->bytes_used_in_interleave_buffer = 0; } data->buffer_full = 0; data->buffer_used = 0; } long mpeg_bytes_to_samples(long bytes, const mpeg_codec_data *data) { struct mpg123_frameinfo mi; mpg123_handle *m = data->m; if (MPG123_OK != mpg123_info(m, &mi)) return 0; /* In this case just return 0 and expect to fail (if used for num_samples) * We would need to read the number of frames in some frame header or count them to get samples */ if (mi.vbr != MPG123_CBR) //maybe abr_rate could be used return 0; return (int64_t)bytes * mi.rate * 8 / (mi.bitrate * 1000); } /** * disables/enables stderr output, useful for MPEG known to contain recoverable errors */ void mpeg_set_error_logging(mpeg_codec_data * data, int enable) { mpg123_param(data->m, MPG123_ADD_FLAGS, MPG123_QUIET, !enable); if (data->interleaved) { int i; for (i=0; i < data->ms_size; i++) { mpg123_param(data->ms[i], MPG123_ADD_FLAGS, MPG123_QUIET, !enable); } } } #endif