mirror of
https://github.com/vgmstream/vgmstream.git
synced 2024-12-21 10:55:53 +01:00
254 lines
10 KiB
C
254 lines
10 KiB
C
|
#include "../vgmstream.h"
|
||
|
|
||
|
#ifdef VGM_USE_FFMPEG
|
||
|
|
||
|
/* ******************************************** */
|
||
|
/* FAKE RIFF HELPERS */
|
||
|
/* ******************************************** */
|
||
|
/* All helpers copy a RIFF header to buf and returns the number of bytes in buf or -1 when buf is not big enough */
|
||
|
|
||
|
static int ffmpeg_fmt_chunk_swap_endian(uint8_t * chunk, uint16_t codec);
|
||
|
|
||
|
int ffmpeg_make_riff_atrac3(uint8_t * buf, size_t buf_size, size_t sample_count, size_t data_size, int channels, int sample_rate, int block_align, int joint_stereo, int encoder_delay) {
|
||
|
uint16_t codec_ATRAC3 = 0x0270;
|
||
|
size_t riff_size = 4+4+ 4 + 0x28 + 0x10 + 4+4;
|
||
|
|
||
|
if (buf_size < riff_size)
|
||
|
return -1;
|
||
|
|
||
|
memcpy(buf+0x00, "RIFF", 4);
|
||
|
put_32bitLE(buf+0x04, (int32_t)(riff_size-4-4 + data_size)); /* riff size */
|
||
|
memcpy(buf+0x08, "WAVE", 4);
|
||
|
|
||
|
memcpy(buf+0x0c, "fmt ", 4);
|
||
|
put_32bitLE(buf+0x10, 0x20);/*fmt size*/
|
||
|
put_16bitLE(buf+0x14, codec_ATRAC3);
|
||
|
put_16bitLE(buf+0x16, channels);
|
||
|
put_32bitLE(buf+0x18, sample_rate);
|
||
|
put_32bitLE(buf+0x1c, sample_rate*channels / sizeof(sample)); /* average bytes per second (wrong) */
|
||
|
put_32bitLE(buf+0x20, (int16_t)(block_align)); /* block align */
|
||
|
|
||
|
put_16bitLE(buf+0x24, 0x0e); /* extra data size */
|
||
|
put_16bitLE(buf+0x26, 1); /* unknown, always 1 */
|
||
|
put_16bitLE(buf+0x28, 0x0800 * channels); /* unknown (some size? 0x1000=2ch, 0x0800=1ch) */
|
||
|
put_16bitLE(buf+0x2a, 0); /* unknown, always 0 */
|
||
|
put_16bitLE(buf+0x2c, joint_stereo ? 0x0001 : 0x0000);
|
||
|
put_16bitLE(buf+0x2e, joint_stereo ? 0x0001 : 0x0000); /* repeated? */
|
||
|
put_16bitLE(buf+0x30, 1); /* unknown, always 1 (frame_factor?) */
|
||
|
put_16bitLE(buf+0x32, 0); /* unknown, always 0 */
|
||
|
|
||
|
memcpy(buf+0x34, "fact", 4);
|
||
|
put_32bitLE(buf+0x38, 0x8); /* fact size */
|
||
|
put_32bitLE(buf+0x3c, sample_count);
|
||
|
put_32bitLE(buf+0x40, encoder_delay);
|
||
|
|
||
|
memcpy(buf+0x44, "data", 4);
|
||
|
put_32bitLE(buf+0x48, data_size); /* data size */
|
||
|
|
||
|
return riff_size;
|
||
|
}
|
||
|
|
||
|
int ffmpeg_make_riff_xma1(uint8_t * buf, size_t buf_size, size_t sample_count, size_t data_size, int channels, int sample_rate) {
|
||
|
uint16_t codec_XMA1 = 0x0165;
|
||
|
size_t riff_size;
|
||
|
int streams, i;
|
||
|
|
||
|
streams = (channels + 1) / 2;
|
||
|
|
||
|
riff_size = 4+4+ 4 + 0x14 + 0x14*streams + 4+4;
|
||
|
|
||
|
if (buf_size < riff_size)
|
||
|
return -1;
|
||
|
|
||
|
memcpy(buf+0x00, "RIFF", 4);
|
||
|
put_32bitLE(buf+0x04, (int32_t)(riff_size-4-4 + data_size)); /* riff size */
|
||
|
memcpy(buf+0x08, "WAVE", 4);
|
||
|
|
||
|
memcpy(buf+0x0c, "fmt ", 4);
|
||
|
put_32bitLE(buf+0x10, 0xc + 0x14*streams);/*fmt size*/
|
||
|
put_16bitLE(buf+0x14, codec_XMA1);
|
||
|
put_16bitLE(buf+0x16, 16); /* bits per sample */
|
||
|
put_16bitLE(buf+0x18, 0x10D6); /* encoder options */
|
||
|
put_16bitLE(buf+0x1a, 0); /* largest stream skip (wrong, unneeded) */
|
||
|
put_16bitLE(buf+0x1c, streams); /* number of streams */
|
||
|
put_8bit (buf+0x1e, 0); /* loop count */
|
||
|
put_8bit (buf+0x1f, 2); /* version */
|
||
|
|
||
|
for (i = 0; i < streams; i++) {
|
||
|
int stream_channels;
|
||
|
uint32_t speakers;
|
||
|
off_t off = 0x20 + 0x14*i;/* stream riff offset */
|
||
|
|
||
|
/* with odd channels the last stream is mono */
|
||
|
stream_channels = channels / streams + (channels%2 != 0 && i+1 != streams ? 1 : 0);
|
||
|
VGM_LOG("sch=%i, %i, %i\n", stream_channels, channels / streams, (channels%2 != 0 && i+1 != streams ? 1 : 0));
|
||
|
switch(i) { /* per stream, values from xmaencode */
|
||
|
case 0: speakers = stream_channels == 1 ? 0x0001 : 0x0201; break;/* L R */
|
||
|
case 1: speakers = stream_channels == 1 ? 0x0004 : 0x0804; break;/* C LFE */
|
||
|
case 2: speakers = stream_channels == 1 ? 0x0040 : 0x8040; break;/* LB RB */
|
||
|
case 3: speakers = stream_channels == 1 ? 0x0000 : 0x0000; break;/* somehow empty (maybe should use 0x2010 LS RS) */
|
||
|
default: speakers = 0;
|
||
|
}
|
||
|
|
||
|
put_32bitLE(buf+off+0x00, sample_rate*stream_channels / sizeof(sample)); /* average bytes per second (wrong, unneeded) */
|
||
|
put_32bitLE(buf+off+0x04, sample_rate);
|
||
|
put_32bitLE(buf+off+0x08, 0); /* loop start */
|
||
|
put_32bitLE(buf+off+0x0c, 0); /* loop end */
|
||
|
put_8bit (buf+off+0x10, 0); /* loop subframe */
|
||
|
put_8bit (buf+off+0x11, channels);
|
||
|
put_16bitLE(buf+off+0x12, speakers);
|
||
|
}
|
||
|
|
||
|
memcpy(buf+riff_size-4-4, "data", 4);
|
||
|
put_32bitLE(buf+riff_size-4, data_size); /* data size */
|
||
|
|
||
|
return riff_size;
|
||
|
}
|
||
|
|
||
|
int ffmpeg_make_riff_xma2(uint8_t * buf, size_t buf_size, size_t sample_count, size_t data_size, int channels, int sample_rate, int block_count, int block_size) {
|
||
|
uint16_t codec_XMA2 = 0x0166;
|
||
|
size_t riff_size = 4+4+ 4 + 0x3c + 4+4;
|
||
|
size_t bytecount;
|
||
|
int streams;
|
||
|
uint32_t speakers;
|
||
|
|
||
|
/* info from xma2defs.h, xact3wb.h and audiodefs.h */
|
||
|
streams = (channels + 1) / 2;
|
||
|
switch (channels) {
|
||
|
case 1: speakers = 0x04; break; /* 1.0: FC */
|
||
|
case 2: speakers = 0x01 | 0x02; break; /* 2.0: FL FR */
|
||
|
case 3: speakers = 0x01 | 0x02 | 0x08; break; /* 2.1: FL FR LF */
|
||
|
case 4: speakers = 0x01 | 0x02 | 0x10 | 0x20; break; /* 4.0: FL FR BL BR */
|
||
|
case 5: speakers = 0x01 | 0x02 | 0x08 | 0x10 | 0x20; break; /* 4.1: FL FR LF BL BR */
|
||
|
case 6: speakers = 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20; break; /* 5.1: FL FR FC LF BL BR */
|
||
|
case 7: speakers = 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x0100; break; /* 6.1: FL FR FC LF BL BR BC */
|
||
|
case 8: speakers = 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80; break; /* 7.1: FL FR FC LF BL BR FLC FRC */
|
||
|
default: speakers = 0; break;
|
||
|
}
|
||
|
|
||
|
if (buf_size < riff_size)
|
||
|
return -1;
|
||
|
|
||
|
bytecount = sample_count * channels * sizeof(sample);
|
||
|
|
||
|
memcpy(buf+0x00, "RIFF", 4);
|
||
|
put_32bitLE(buf+0x04, (int32_t)(riff_size-4-4 + data_size)); /* riff size */
|
||
|
memcpy(buf+0x08, "WAVE", 4);
|
||
|
|
||
|
memcpy(buf+0x0c, "fmt ", 4);
|
||
|
put_32bitLE(buf+0x10, 0x34);/*fmt size*/
|
||
|
put_16bitLE(buf+0x14, codec_XMA2);
|
||
|
put_16bitLE(buf+0x16, channels);
|
||
|
put_32bitLE(buf+0x18, sample_rate);
|
||
|
put_32bitLE(buf+0x1c, sample_rate*channels / sizeof(sample)); /* average bytes per second (wrong unneeded) */
|
||
|
put_16bitLE(buf+0x20, (int16_t)(channels*sizeof(sample))); /* block align */
|
||
|
put_16bitLE(buf+0x22, 16); /* bits per sample */
|
||
|
|
||
|
put_16bitLE(buf+0x24, 0x22); /* extra data size */
|
||
|
put_16bitLE(buf+0x26, streams); /* number of streams */
|
||
|
put_32bitLE(buf+0x28, speakers); /* speaker position */
|
||
|
put_32bitLE(buf+0x2c, bytecount); /* PCM samples */
|
||
|
put_32bitLE(buf+0x30, block_size); /* XMA block size */
|
||
|
/* (looping values not set, expected to be handled externally) */
|
||
|
put_32bitLE(buf+0x34, 0); /* play begin */
|
||
|
put_32bitLE(buf+0x38, 0); /* play length */
|
||
|
put_32bitLE(buf+0x3c, 0); /* loop begin */
|
||
|
put_32bitLE(buf+0x40, 0); /* loop length */
|
||
|
put_8bit(buf+0x44, 0); /* loop count */
|
||
|
put_8bit(buf+0x45, 4); /* encoder version */
|
||
|
put_16bitLE(buf+0x46, block_count); /* blocks count = entries in seek table */
|
||
|
|
||
|
memcpy(buf+0x48, "data", 4);
|
||
|
put_32bitLE(buf+0x4c, data_size); /* data size */
|
||
|
|
||
|
return riff_size;
|
||
|
}
|
||
|
|
||
|
int ffmpeg_make_riff_xma2_from_fmt(uint8_t * buf, size_t buf_size, off_t fmt_offset, size_t fmt_size, size_t data_size, STREAMFILE *streamFile, int big_endian) {
|
||
|
size_t riff_size = 4+4+ 4 + 4+4+fmt_size + 4+4;
|
||
|
uint8_t chunk[100];
|
||
|
|
||
|
if (buf_size < riff_size || fmt_size > 100)
|
||
|
goto fail;
|
||
|
if (read_streamfile(chunk,fmt_offset,fmt_size, streamFile) != fmt_size)
|
||
|
goto fail;
|
||
|
|
||
|
if (big_endian)
|
||
|
ffmpeg_fmt_chunk_swap_endian(chunk, 0x166);
|
||
|
|
||
|
memcpy(buf+0x00, "RIFF", 4);
|
||
|
put_32bitLE(buf+0x04, (int32_t)(riff_size-4-4 + data_size)); /* riff size */
|
||
|
memcpy(buf+0x08, "WAVE", 4);
|
||
|
|
||
|
memcpy(buf+0x0c, "fmt ", 4);
|
||
|
put_32bitLE(buf+0x10, fmt_size);/*fmt size*/
|
||
|
memcpy(buf+0x14, chunk, fmt_size);
|
||
|
|
||
|
memcpy(buf+0x14+fmt_size, "data", 4);
|
||
|
put_32bitLE(buf+0x14+fmt_size+4, data_size); /* data size */
|
||
|
|
||
|
return riff_size;
|
||
|
|
||
|
fail:
|
||
|
return -1;
|
||
|
}
|
||
|
|
||
|
int ffmpeg_make_riff_xwma(uint8_t * buf, size_t buf_size, int codec, size_t sample_count, size_t data_size, int channels, int sample_rate, int avg_bps, int block_align) {
|
||
|
size_t riff_size = 4+4+ 4 + 0x1a + 4+4;
|
||
|
|
||
|
if (buf_size < riff_size)
|
||
|
return -1;
|
||
|
|
||
|
memcpy(buf+0x00, "RIFF", 4);
|
||
|
put_32bitLE(buf+0x04, (int32_t)(riff_size-4-4 + data_size)); /* riff size */
|
||
|
memcpy(buf+0x08, "XWMA", 4);
|
||
|
|
||
|
memcpy(buf+0x0c, "fmt ", 4);
|
||
|
put_32bitLE(buf+0x10, 0x12);/*fmt size*/
|
||
|
put_16bitLE(buf+0x14, codec);
|
||
|
put_16bitLE(buf+0x16, channels);
|
||
|
put_32bitLE(buf+0x18, sample_rate);
|
||
|
put_32bitLE(buf+0x1c, avg_bps); /* average bits per second, somehow vital for XWMA */
|
||
|
put_16bitLE(buf+0x20, block_align); /* block align */
|
||
|
put_16bitLE(buf+0x22, 16); /* bits per sample */
|
||
|
put_16bitLE(buf+0x24, 0); /* unk */
|
||
|
/* here goes the "dpds" table, but it's not needed by FFmpeg */
|
||
|
|
||
|
memcpy(buf+0x26, "data", 4);
|
||
|
put_32bitLE(buf+0x2a, data_size); /* data size */
|
||
|
|
||
|
return riff_size;
|
||
|
}
|
||
|
|
||
|
|
||
|
static int ffmpeg_fmt_chunk_swap_endian(uint8_t * chunk, uint16_t codec) {
|
||
|
if (codec != 0x166)/* XMA2 */
|
||
|
goto fail;
|
||
|
|
||
|
put_16bitLE(chunk + 0x00, get_16bitBE(chunk + 0x00));/*wFormatTag*/
|
||
|
put_16bitLE(chunk + 0x02, get_16bitBE(chunk + 0x02));/*nChannels*/
|
||
|
put_32bitLE(chunk + 0x04, get_32bitBE(chunk + 0x04));/*nSamplesPerSec*/
|
||
|
put_32bitLE(chunk + 0x08, get_32bitBE(chunk + 0x08));/*nAvgBytesPerSec*/
|
||
|
put_16bitLE(chunk + 0x0c, get_16bitBE(chunk + 0x0c));/*nBlockAlign*/
|
||
|
put_16bitLE(chunk + 0x0e, get_16bitBE(chunk + 0x0e));/*wBitsPerSample*/
|
||
|
put_16bitLE(chunk + 0x10, get_16bitBE(chunk + 0x10));/*cbSize*/
|
||
|
put_16bitLE(chunk + 0x12, get_16bitBE(chunk + 0x12));/*NumStreams*/
|
||
|
put_32bitLE(chunk + 0x14, get_32bitBE(chunk + 0x14));/*ChannelMask*/
|
||
|
put_32bitLE(chunk + 0x18, get_32bitBE(chunk + 0x18));/*SamplesEncoded*/
|
||
|
put_32bitLE(chunk + 0x1c, get_32bitBE(chunk + 0x1c));/*BytesPerBlock*/
|
||
|
put_32bitLE(chunk + 0x20, get_32bitBE(chunk + 0x20));/*PlayBegin*/
|
||
|
put_32bitLE(chunk + 0x24, get_32bitBE(chunk + 0x24));/*PlayLength*/
|
||
|
put_32bitLE(chunk + 0x28, get_32bitBE(chunk + 0x28));/*LoopBegin*/
|
||
|
put_32bitLE(chunk + 0x2c, get_32bitBE(chunk + 0x2c));/*LoopLength*/
|
||
|
/* put_8bit(chunk + 0x30, get_8bit(chunk + 0x30));*//*LoopCount*/
|
||
|
/* put_8bit(chunk + 0x31, get_8bit(chunk + 0x31));*//*EncoderVersion*/
|
||
|
put_16bitLE(chunk + 0x32, get_16bitBE(chunk + 0x32));/*BlockCount*/
|
||
|
|
||
|
return 1;
|
||
|
|
||
|
fail:
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
#endif
|