quakespasm/Quake/snd_mp3.c

/*
 * MP3 decoding support using libmad:  Adapted from the SoX library at
 * http://sourceforge.net/projects/sox/, LGPLv2, Copyright (c) 2007-2009
 * SoX contributors, written by Fabrizio Gennari <fabrizio.ge@tiscali.it>,
 * with the decoding part based on the decoder tutorial program madlld
 * written by Bertrand Petit <madlld@phoe.fmug.org> (BSD license, see at
 * http://www.bsd-dk.dk/~elrond/audio/madlld/).  The tag identification
 * functions were initially adapted from GPL-licensed libid3tag library
 * (see at http://www.underbit.com/products/mad/) then rephrased further.
 * Adapted for use in Quake and Hexen II game engines by O.Sezer:
 * Copyright (C) 2010-2019 O.Sezer <sezero@users.sourceforge.net>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or (at
 * your option) any later version.
 *
 * This program is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
 *
 * See the GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 */

#include "quakedef.h"

#if defined(USE_CODEC_MP3)
#include "snd_codec.h"
#include "snd_codeci.h"
#include "snd_mp3.h"
#include <mad.h>

/* Under Windows, importing data from DLLs is a dicey proposition. This is true
 * when using dlopen, but also true if linking directly against the DLL if the
 * header does not mark the data as __declspec(dllexport), which mad.h does not.
 * Sidestep the issue by defining our own mad_timer_zero. This is needed because
 * mad_timer_zero is used in some of the mad.h macros.
 */
/* Redirect every use of mad_timer_zero (including those hidden inside
 * mad.h macros such as mad_timer_reset) to the file-local object below. */
#define mad_timer_zero mad_timer_zero_stub
static mad_timer_t const mad_timer_zero_stub = {0, 0};

/* MAD returns values with MAD_F_FRACBITS (28) bits of precision, though it's
   not certain that all of them are meaningful. Default to 16 bits, which is
   what most users expect the decoded output to be. */
/* bits per decoded sample, reported through stream->info.bits */
#define MP3_MAD_SAMPLEBITS	16
/* bytes per decoded sample, reported through stream->info.width */
#define MP3_MAD_SAMPLEWIDTH	2
/* size in bytes of the raw MP3 input buffer (mp3_priv_t.mp3_buffer) */
#define MP3_BUFFER_SIZE		(5 * 8192)

/* Private data: per-stream decoder state, allocated in
 * S_MP3_CodecOpenStream() and kept in snd_stream_t->priv. */
typedef struct _mp3_priv_t
{
	unsigned char mp3_buffer[MP3_BUFFER_SIZE];	/* raw MP3 bytes handed to libmad */
	struct mad_stream	Stream;	/* libmad input stream state */
	struct mad_frame	Frame;	/* most recently decoded frame */
	struct mad_synth	Synth;	/* PCM synthesized from Frame */
	mad_timer_t		Timer;	/* accumulated duration of the frames seen so far */
	ptrdiff_t		cursamp;	/* index of the next unread sample in Synth.pcm */
	size_t			FrameCount;	/* number of frames processed so far */
} mp3_priv_t;

/* http://id3.org/ID3v1 :  3 bytes "TAG" identifier and 125 bytes tag data.
 * Returns true when the first three bytes of data[] are "TAG"; only the
 * identifier is examined, never the tag payload.  */
static inline qboolean tag_is_id3v1(const unsigned char *data, size_t length)
{
	if (length < 3)
		return false;	/* too short to hold the identifier */
	return (memcmp(data, "TAG", 3) == 0) ? true : false;
}

/* ID3v1 extended tag: sits just before ID3v1, always 227 bytes.
 * https://www.getid3.org/phpBB3/viewtopic.php?t=1202
 * https://en.wikipedia.org/wiki/ID3v1#Enhanced_tag
 * Not an official standard, and supported by only a few programs.
 * Returns true when data[] starts with the four byte "TAG+" identifier. */
static inline qboolean tag_is_id3v1ext(const unsigned char *data, size_t length)
{
	if (length < 4)
		return false;	/* too short to hold the identifier */
	return (memcmp(data, "TAG+", 4) == 0) ? true : false;
}

#define ID3_TAG_FLAG_FOOTERPRESENT 0x10
/* Returns true when data[] starts with a plausible ID3v2 header.
 * The header is 10 bytes:  http://id3.org/id3v2.4.0-structure  */
static inline qboolean tag_is_id3v2(const unsigned char *data, size_t length)
{
	if (length < 10)
		return false;
	/* bytes 0-2: "ID3" identifier */
	if (data[0] != 'I' || data[1] != 'D' || data[2] != '3')
		return false;
	/* bytes 3-4: version num (major,revision), neither byte may be 0xff. */
	if (data[3] == 0xff || data[4] == 0xff)
		return false;
	/* bytes 6-9 are the ID3v2 tag size: a 32 bit 'synchsafe' integer, i.e.
	 * bit 7 of every byte is zero, leaving 7 bits of information per byte
	 * -> effectively a 28 bit value.  */
	if ((data[6] | data[7] | data[8] | data[9]) & 0x80)
		return false;
	return true;
}

/* Computes the number of bytes occupied by an ID3v2 tag starting at data[0].
 * data    : buffer beginning with the 10 byte ID3v2 header
 * datalen : number of valid bytes in data[]; it only bounds the scan for
 *           trailing padding, so the result may exceed it.
 * Returns header + payload (+ footer, if flagged) + any zero padding that
 * directly follows the tag inside the buffer.  */
static inline long get_id3v2_len(const unsigned char *data, long datalen)
{
	long total = 10; /* the header itself */

	/* payload size: 'synchsafe' integer, 7 significant bits per byte */
	total += (long)((data[6]<<21) + (data[7]<<14) + (data[8]<<7) + data[9]);

	/* ID3v2 header[5] is flags (bits 4-7 only, 0-3 are zero).
	 * bit 4 set: footer is present (a copy of the header but
	 * with "3DI" as ident.)  */
	if (data[5] & ID3_TAG_FLAG_FOOTERPRESENT)
		total += 10;

	/* consume optional padding (always zeroes) */
	while (total < datalen && data[total] == 0)
		total++;

	return total;
}

/* http://wiki.hydrogenaud.io/index.php?title=APEv1_specification
 * http://wiki.hydrogenaud.io/index.php?title=APEv2_specification
 * Header/footer is 32 bytes: bytes 0-7 ident, bytes 8-11 version,
 * bytes 12-15 size, bytes 16-19 item count, bytes 20-23 flags.
 * bytes 24-31 are reserved: must be all zeroes.
 * Multi-byte fields are stored little-endian.
 *
 * Returns true when data[] starts with an APE tag header/footer of
 * version 1000 or 2000 whose reserved bytes are all zero.
 */
static inline qboolean tag_is_apetag(const unsigned char *data, size_t length)
{
	unsigned int v;
	int i;

	if (length < 32) return false;
	if (memcmp(data,"APETAGEX",8) != 0)
		return false;
	/* widen each byte to unsigned before shifting: shifting the promoted
	 * (signed) int left by 24 is undefined for bytes >= 0x80. */
	v = ((unsigned int)data[11]<<24) | ((unsigned int)data[10]<<16) |
	    ((unsigned int)data[9]<<8)   |  (unsigned int)data[8];
	if (v != 2000U && v != 1000U)
		return false;
	for (i = 24; i < 32; ++i)
	{
		if (data[i] != 0)
			return false;	/* reserved area must be zeroed */
	}
	return true;
}

/* Extracts the size and version fields from an APE tag header/footer.
 * data    : the 32 byte header or footer
 * datalen : unused
 * version : receives the version field (bytes 8-11, little-endian)
 * Returns the size field (bytes 12-15, little-endian).  The caller adds
 * the extra 32 bytes of an APEv2 header where one is present.
 * The fields are assembled with unsigned arithmetic, so a size with the
 * top bit set is a large positive value wherever long is wider than
 * 32 bits.
 * NOTE(review): where long is 32 bits such a size still does not fit,
 * so callers should reject negative results.  */
static inline long get_ape_len(const unsigned char *data, long datalen, unsigned int *version)
{
	unsigned int size;

	(void)datalen;
	size     = ((unsigned int)data[15]<<24) | ((unsigned int)data[14]<<16) |
		   ((unsigned int)data[13]<<8)  |  (unsigned int)data[12];
	*version = ((unsigned int)data[11]<<24) | ((unsigned int)data[10]<<16) |
		   ((unsigned int)data[9]<<8)   |  (unsigned int)data[8];
	return (long)size;
}

/* Checks the last 32 bytes of the stream, as currently delimited by
 * stream->fh.length, for an APE tag footer.  When one is found, the tag
 * (and, for APEv2, its verified header) is cut off by shrinking
 * stream->fh.length.
 * buf must have room for at least 32 bytes.
 * Returns 1 if a tag was skipped, 0 if there is none, -1 on a short read
 * or an inconsistent tag.  The file is rewound after every read.  */
static int skip_ape_footer(snd_stream_t *stream, unsigned char *buf)
{
	unsigned int v;
	size_t readsize;
	long len;

	if (stream->fh.length < 32)
		return 0;
	FS_fseek(&stream->fh, -32, SEEK_END);
	readsize = FS_fread(buf, 1, 32, &stream->fh);
	FS_rewind(&stream->fh);
	if (readsize != 32) return -1;
	if (!tag_is_apetag(buf, 32))
		return 0;

	len = get_ape_len(buf, (long)readsize, &v);
	/* a negative or oversized length must never reach fh.length */
	if (len < 0 || len >= stream->fh.length) return -1;
	if (v == 2000U) len += 32; /* header */
	if (len >= stream->fh.length) return -1;
	if (v == 2000U) { /* verify header : */
		FS_fseek(&stream->fh, -len, SEEK_END);
		readsize = FS_fread(buf, 1, 32, &stream->fh);
		FS_rewind(&stream->fh);
		if (readsize != 32) return -1;
		if (!tag_is_apetag(buf, 32)) return -1;
	}
	/* hack fshandle_t->length */
	stream->fh.length -= len;
	Con_DPrintf("MP3: skipped %ld bytes APEv%u tag\n", len, v/1000);
	return 1;
}

/* Detects tags at known positions and hides them from the decoder by
 * adjusting stream->fh.start / stream->fh.length:
 *   - at the start: an ID3v2 tag, or else an APE tag header,
 *   - at the end:   ID3v1, optionally preceded by an APE tag or by an
 *                   extended ID3v1 tag; or a bare APE tag.
 * buf/bufsize is scratch space; it must hold at least 227 bytes.
 * Returns 0 with the file rewound when audio data remains, -1 on read
 * errors, inconsistent tags, or when nothing is left after trimming.  */
static int skip_tags_first(snd_stream_t *stream, unsigned char *buf, size_t bufsize)
{
	long len; size_t readsize;
	int rc;

	readsize = FS_fread(buf, 1, bufsize, &stream->fh);
	if (!readsize || FS_ferror(&stream->fh))
		return -1;

	/* ID3v2 tag is at the start */
	if (tag_is_id3v2(buf, readsize))
	{
		len = get_id3v2_len(buf, (long)readsize);
		if (len >= stream->fh.length) return -1;
		/* hack the fshandle_t start pos and length members */
		stream->fh.start += len;
		stream->fh.length -= len;
		FS_rewind(&stream->fh);
		Con_DPrintf("MP3: skipped %ld bytes ID3v2 tag\n", len);
	}
	/* APE tag _might_ be at the start: read the header */
	else if (tag_is_apetag(buf, readsize))
	{
		unsigned int v;
		len = get_ape_len(buf, (long)readsize, &v);
		/* a negative length would move fh.start backwards */
		if (len < 0 || len >= stream->fh.length) return -1;
		len += 32; /* we're at top: have a header. */
		if (len >= stream->fh.length) return -1;
		/* hack the fshandle_t start pos and length members */
		stream->fh.start += len;
		stream->fh.length -= len;
		FS_rewind(&stream->fh);
		Con_DPrintf("MP3: skipped %ld bytes APEv2 tag\n", len);
	}

	/* ID3v1 tag is at the end */
	if (stream->fh.length >= 128)
	{
		FS_fseek(&stream->fh, -128, SEEK_END);
		readsize = FS_fread(buf, 1, 128, &stream->fh);
		FS_rewind(&stream->fh);
		if (readsize != 128) return -1;
		if (tag_is_id3v1(buf, 128))
		{
			/* hack fshandle_t->length */
			stream->fh.length -= 128;
			Con_DPrintf("MP3: skipped ID3v1 tag\n");

			/* APE tag may be before the ID3v1: read the footer */
			rc = skip_ape_footer(stream, buf);
			if (rc < 0) return -1;
			/* extended ID3v1 just before the ID3v1 tag? (unlikely)  */
			if (rc == 0 && stream->fh.length >= 227)
			{
				FS_fseek(&stream->fh, -227, SEEK_END);
				readsize = FS_fread(buf, 1, 227, &stream->fh);
				FS_rewind(&stream->fh);
				if (readsize != 227) return -1;
				if (tag_is_id3v1ext(buf, 227))
				{
					/* hack fshandle_t->length */
					stream->fh.length -= 227;
					Con_DPrintf("MP3: skipped ID3v1 extended tag\n");
				}
			}
			/* the APE footer position was already examined above */
			goto end;
		}
	}

	/* APE tag may be at the end: read the footer */
	if (skip_ape_footer(stream, buf) < 0)
		return -1;

	end:
	/* leave the file at the start of the audio data on every path, also
	 * when no tag was found and the file was too short for the end checks */
	FS_rewind(&stream->fh);
	return (stream->fh.length > 0)? 0:  -1;
}

/* (Re)fills the buffer that libmad decodes from.  Bytes that libmad has
 * not consumed yet are moved to the front of the buffer first, then the
 * rest of the buffer is topped up from the file.
 * Returns 0 on success, -1 when no further bytes could be read.  */
static int mp3_inputdata(snd_stream_t *stream)
{
	mp3_priv_t *priv = (mp3_priv_t *) stream->priv;
	/* libmad does not consume all the buffer it's given: part of a
	 * truncated frame is left unused at the end.  That tail must be
	 * carried over to the beginning of the buffer and accounted for
	 * when refilling, which means the buffer has to be large enough
	 * for a complete frame at the highest observable bit-rate
	 * (currently 448 kb/s).
	 * TODO: Is 2016 bytes the size of the largest frame?
	 * (448000*(1152/32000))/8
	 */
	const size_t carry = priv->Stream.bufend - priv->Stream.next_frame;
	size_t got;

	memmove(priv->mp3_buffer, priv->Stream.next_frame, carry);

	got = FS_fread(priv->mp3_buffer + carry, 1,
			MP3_BUFFER_SIZE - carry, &stream->fh);
	if (!got)
		return -1;

	mad_stream_buffer(&priv->Stream, priv->mp3_buffer, got+carry);
	priv->Stream.error = MAD_ERROR_NONE;

	return 0;
}

/* Prepares a freshly opened stream for decoding: hides leading/trailing
 * tags, initializes the libmad state in stream->priv, decodes and
 * synthesizes the first valid frame and fills in stream->info (channels,
 * rate, bits, width) from it.  The synthesized frame is kept so that
 * mp3_decode() can hand it out later.
 * Returns 0 on success, -1 on failure.  On failure the libmad state has
 * been finished again, so the caller only has to free stream->priv.  */
static int mp3_startread(snd_stream_t *stream)
{
	mp3_priv_t *p = (mp3_priv_t *) stream->priv;
	size_t ReadSize;

	/* skip tags known to be at start or end and adjust the file */
	if (skip_tags_first(stream, p->mp3_buffer, MP3_BUFFER_SIZE) < 0)
		return -1;

	mad_stream_init(&p->Stream);
	mad_frame_init(&p->Frame);
	mad_synth_init(&p->Synth);
	mad_timer_reset(&p->Timer);

	/* Decode at least one valid frame to find out the input
	 * format.  The decoded frame will be saved off so that it
	 * can be processed later.
	 */
	ReadSize = FS_fread(p->mp3_buffer, 1, MP3_BUFFER_SIZE, &stream->fh);
	if (!ReadSize || FS_ferror(&stream->fh))
		goto fail;

	mad_stream_buffer(&p->Stream, p->mp3_buffer, ReadSize);

	/* Find a valid frame before starting up.  This makes sure
	 * that we have a valid MP3 and also skips past ID3v2 tags
	 * at the beginning of the audio file.
	 */
	p->Stream.error = MAD_ERROR_NONE;
	while (mad_frame_decode(&p->Frame,&p->Stream))
	{
		/* check whether input buffer needs a refill */
		if (p->Stream.error == MAD_ERROR_BUFLEN)
		{
			if (mp3_inputdata(stream) == -1)
				goto fail;/* EOF with no valid data */

			continue;
		}

		/* We know that a valid frame hasn't been found yet
		 * so help libmad out and go back into frame seek mode.
		 */
		mad_stream_sync(&p->Stream);
		p->Stream.error = MAD_ERROR_NONE;
	}

	if (p->Stream.error)
	{
		Con_Printf("MP3: No valid MP3 frame found\n");
		goto fail;
	}

	switch(p->Frame.header.mode)
	{
	case MAD_MODE_SINGLE_CHANNEL:
	case MAD_MODE_DUAL_CHANNEL:
	case MAD_MODE_JOINT_STEREO:
	case MAD_MODE_STEREO:
		stream->info.channels = MAD_NCHANNELS(&p->Frame.header);
		break;
	default:
		Con_Printf("MP3: Cannot determine number of channels\n");
		goto fail;
	}

	p->FrameCount = 1;

	mad_timer_add(&p->Timer,p->Frame.header.duration);
	mad_synth_frame(&p->Synth,&p->Frame);
	stream->info.rate = p->Synth.pcm.samplerate;
	stream->info.bits = MP3_MAD_SAMPLEBITS;
	stream->info.width = MP3_MAD_SAMPLEWIDTH;

	p->cursamp = 0;

	return 0;

fail:
	/* the decode attempts above may have made libmad allocate memory;
	 * give it back, since no mp3_stopread() follows a failed start */
	mad_synth_finish(&p->Synth);
	mad_frame_finish(&p->Frame);
	mad_stream_finish(&p->Stream);
	return -1;
}

/* Read up to len samples from p->Synth
 * If needed, read some more MP3 data, decode them and synth them
 * Place in buf[] as 16 bit host-endian values, channels interleaved.
 * len counts individual sample values, not frames.  Output is always
 * written one whole frame (one value per channel) at a time, so len is
 * rounded down to a multiple of the channel count.
 * Return number of samples read.  */
static int mp3_decode(snd_stream_t *stream, byte *buf, int len)
{
	mp3_priv_t *p = (mp3_priv_t *) stream->priv;
	int donow, i, done = 0;
	mad_fixed_t sample;
	int chan, x;

	if (len <= 0)
		return 0;
	/* the channel loop below cannot stop in the middle of a frame: a
	 * request that is not a multiple of the channel count would make it
	 * write one sample more than the caller has room for. */
	if (stream->info.channels > 1)
		len -= len % stream->info.channels;

	do
	{
		x = (p->Synth.pcm.length - p->cursamp) * stream->info.channels;
		if (x < 0)	/* stale cursor: nothing available, never "negative" */
			x = 0;
		donow = q_min(len, x);
		i = 0;
		while (i < donow)
		{
			for (chan = 0; chan < stream->info.channels; chan++)
			{
				sample = p->Synth.pcm.samples[chan][p->cursamp];
				/* convert from fixed to short,
				 * write in host-endian format. */
				if (sample <= -MAD_F_ONE)
					sample = -0x7FFF;
				else if (sample >= MAD_F_ONE)
					sample = 0x7FFF;
				else
					sample >>= (MAD_F_FRACBITS + 1 - 16);
				if (host_bigendian)
				{
					*buf++ = (sample >> 8) & 0xFF;
					*buf++ = sample & 0xFF;
				}
				else /* assumed LITTLE_ENDIAN. */
				{
					*buf++ = sample & 0xFF;
					*buf++ = (sample >> 8) & 0xFF;
				}
				i++;
			}
			p->cursamp++;
		}

		len -= donow;
		done += donow;

		if (len == 0)
			break;

		/* check whether input buffer needs a refill */
		if (p->Stream.error == MAD_ERROR_BUFLEN)
		{
			if (mp3_inputdata(stream) == -1)
			{
				/* check feof() ?? */
				Con_DPrintf("mp3 EOF\n");
				break;
			}
		}

		if (mad_frame_decode(&p->Frame, &p->Stream))
		{
			if (MAD_RECOVERABLE(p->Stream.error))
			{
				mad_stream_sync(&p->Stream); /* to frame seek mode */
				continue;
			}
			else
			{
				/* BUFLEN: loop around so the refill above runs */
				if (p->Stream.error == MAD_ERROR_BUFLEN)
					continue;
				else
				{
					Con_Printf("MP3: unrecoverable frame level error (%s)\n",
							mad_stream_errorstr(&p->Stream));
					break;
				}
			}
		}
		p->FrameCount++;
		mad_timer_add(&p->Timer, p->Frame.header.duration);
		mad_synth_frame(&p->Synth, &p->Frame);
		p->cursamp = 0;
	} while (1);

	return done;
}

/* Finishes the libmad synth, frame and stream state kept in stream->priv.
 * The private structure itself is not freed here.  Always returns 0.  */
static int mp3_stopread(snd_stream_t *stream)
{
	mp3_priv_t *priv = (mp3_priv_t*) stream->priv;

	/* tear down in the reverse order of initialization */
	mad_synth_finish(&priv->Synth);
	mad_frame_finish(&priv->Frame);
	mad_stream_finish(&priv->Stream);
	return 0;
}

/* Seeks the decoder to a sample position.
 * offset is given in individual sample values (it is divided by the
 * channel count below).  The file is rewound, the libmad state is
 * re-initialized, and frame headers are scanned from the start until the
 * frame holding the target is reached; that frame is decoded and
 * synthesized and p->cursamp is pointed at the target inside it.  If the
 * first 64 frames all share one bitrate, the target position is
 * extrapolated with a file seek instead of scanning every header.
 * Returns 0 on success, -1 if the position could not be reached.  */
static int mp3_madseek(snd_stream_t *stream, unsigned long offset)
{
	mp3_priv_t *p = (mp3_priv_t *) stream->priv;
	size_t   initial_bitrate = p->Frame.header.bitrate;
	size_t   consumed = 0;
	int vbr = 0;		/* Variable Bit Rate, bool */
	qboolean depadded = false;
	unsigned long to_skip_samples = 0;

	/* Reset all */
	FS_rewind(&stream->fh);
	mad_timer_reset(&p->Timer);
	p->FrameCount = 0;
	/* the synth is emptied below: don't keep a cursor into its old PCM */
	p->cursamp = 0;

	/* They were opened in startread */
	mad_synth_finish(&p->Synth);
	mad_frame_finish(&p->Frame);
	mad_stream_finish(&p->Stream);

	mad_stream_init(&p->Stream);
	mad_frame_init(&p->Frame);
	mad_synth_init(&p->Synth);

	offset /= stream->info.channels;
	to_skip_samples = offset;

	while (1)	/* Read data from the MP3 file */
	{
		int bytes_read, padding = 0;
		size_t leftover = p->Stream.bufend - p->Stream.next_frame;

		/* Carry the unconsumed tail over to the front of the buffer.
		 * It starts at next_frame (that is what leftover measures) and
		 * may overlap its destination, hence memmove.  Nothing is
		 * copied on a freshly initialized stream, whose pointers are
		 * still null. */
		if (leftover)
			memmove(p->mp3_buffer, p->Stream.next_frame, leftover);
		bytes_read = FS_fread(p->mp3_buffer + leftover, (size_t) 1,
					MP3_BUFFER_SIZE - leftover, &stream->fh);
		if (bytes_read <= 0)
		{
			Con_DPrintf("seek failure. unexpected EOF (frames=%lu leftover=%lu)\n",
					(unsigned long)p->FrameCount, (unsigned long)leftover);
			break;
		}
		/* skip zero padding at the very start of the data (first pass only) */
		for ( ; !depadded && padding < bytes_read && !p->mp3_buffer[padding]; ++padding)
			;
		depadded = true;
		mad_stream_buffer(&p->Stream, p->mp3_buffer + padding, leftover + bytes_read - padding);

		while (1)	/* Decode frame headers */
		{
			unsigned short samples;	/* PCM samples per channel in this frame */
			p->Stream.error = MAD_ERROR_NONE;

			/* Not an audio frame */
			if (mad_header_decode(&p->Frame.header, &p->Stream) == -1)
			{
				if (p->Stream.error == MAD_ERROR_BUFLEN)
					break;	/* Normal behaviour; get some more data from the file */
				if (!MAD_RECOVERABLE(p->Stream.error))
				{
					Con_DPrintf("unrecoverable MAD error\n");
					break;
				}
				if (p->Stream.error == MAD_ERROR_LOSTSYNC)
				{
					Con_DPrintf("MAD lost sync\n");
				}
				else
				{
					Con_DPrintf("recoverable MAD error\n");
				}
				continue;
			}

			consumed +=  p->Stream.next_frame - p->Stream.this_frame;
			vbr      |= (p->Frame.header.bitrate != initial_bitrate);

			samples = 32 * MAD_NSBSAMPLES(&p->Frame.header);

			p->FrameCount++;
			mad_timer_add(&p->Timer, p->Frame.header.duration);

			if (to_skip_samples <= samples)
			{
				/* target lies inside this frame: decode it for real */
				mad_frame_decode(&p->Frame,&p->Stream);
				mad_synth_frame(&p->Synth, &p->Frame);
				p->cursamp = to_skip_samples;
				return 0;
			}
			else	to_skip_samples -= samples;

			/* If not VBR, we can extrapolate frame size */
			if (p->FrameCount == 64 && !vbr)
			{
				p->FrameCount = offset / samples;
				to_skip_samples = offset % samples;
				if (0 != FS_fseek(&stream->fh, (p->FrameCount * consumed / 64), SEEK_SET))
					return -1;

				/* Reset Stream for refilling buffer */
				mad_stream_finish(&p->Stream);
				mad_stream_init(&p->Stream);
				break;
			}
		}
	}

	return -1;
}

/* Codec-wide initialization hook: nothing to set up here, always
 * reports success.  */
static qboolean S_MP3_CodecInitialize (void)
{
	return true;
}

/* Codec-wide shutdown hook: intentionally empty, as
 * S_MP3_CodecInitialize() acquires nothing.  */
static void S_MP3_CodecShutdown (void)
{
}

/* Allocates the private decoder state for stream and starts decoding.
 * Returns true when the stream is ready to be read.  On any failure a
 * message is printed, everything allocated here is released again,
 * stream->priv is reset to NULL and false is returned.  */
static qboolean S_MP3_CodecOpenStream (snd_stream_t *stream)
{
	int err;

	stream->priv = calloc(1, sizeof(mp3_priv_t));
	if (!stream->priv)
	{
		Con_Printf("Insufficient memory for MP3 audio\n");
		return false;
	}
	err = mp3_startread(stream);
	if (err != 0)
	{
		Con_Printf("%s is not a valid mp3 file\n", stream->name);
	}
	else if (stream->info.channels != 1 && stream->info.channels != 2)
	{
		Con_Printf("Unsupported number of channels %d in %s\n",
					stream->info.channels, stream->name);
		/* the decoder did start: finish its libmad state before the
		 * structure holding it goes away */
		mp3_stopread(stream);
	}
	else
	{
		return true;
	}
	free(stream->priv);
	stream->priv = NULL;	/* don't leave a dangling pointer behind */
	return false;
}

/* Decodes up to `bytes` bytes of PCM into buffer.
 * The byte count is converted to a sample count using stream->info.width
 * for mp3_decode() and the decoded sample count is converted back.
 * Returns the number of bytes actually produced.  */
static int S_MP3_CodecReadStream (snd_stream_t *stream, int bytes, void *buffer)
{
	int samples_wanted, samples_got;

	samples_wanted = bytes / stream->info.width;
	samples_got = mp3_decode(stream, (byte *)buffer, samples_wanted);
	return samples_got * stream->info.width;
}

/* Closes a stream opened by S_MP3_CodecOpenStream(): finishes the libmad
 * state, frees the private data, then hands the stream itself to
 * S_CodecUtilClose().  */
static void S_MP3_CodecCloseStream (snd_stream_t *stream)
{
	mp3_stopread(stream);	/* must run before priv is freed: it reads stream->priv */
	free(stream->priv);
	S_CodecUtilClose(&stream);
}

/* Restarts playback from the beginning by seeking to sample 0.
 * Returns the result of mp3_madseek(): 0 on success, -1 on failure.  */
static int S_MP3_CodecRewindStream (snd_stream_t *stream)
{
	/* An alternative would be a full restart:
	 * mp3_stopread(), FS_rewind() and mp3_startread() again.
	 */
	return mp3_madseek(stream, 0);
}

/* Codec descriptor for MP3, the only non-static symbol of this file.
 * The initializer is positional, so the entries must stay in the order
 * in which snd_codec_t declares its members.  */
snd_codec_t mp3_codec =
{
	CODECTYPE_MP3,
	true,	/* always available. */
	"mp3",	/* NOTE(review): presumably the file extension handled - confirm against snd_codec_t */
	S_MP3_CodecInitialize,
	S_MP3_CodecShutdown,
	S_MP3_CodecOpenStream,
	S_MP3_CodecReadStream,
	S_MP3_CodecRewindStream,
	S_MP3_CodecCloseStream,
	NULL	/* NOTE(review): presumably a link filled in by the codec layer - confirm */
};

#endif	/* USE_CODEC_MP3 */