mpd/src/decoder/plugins/OpusDecoderPlugin.cxx

528 lines
13 KiB
C++
Raw Normal View History

/*
2021-01-01 19:54:25 +01:00
* Copyright 2003-2021 The Music Player Daemon Project
* http://www.musicpd.org
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License along
* with this program; if not, write to the Free Software Foundation, Inc.,
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
*/
#include "OpusDecoderPlugin.h"
#include "OggDecoder.hxx"
#include "OpusDomain.hxx"
#include "OpusHead.hxx"
#include "OpusTags.hxx"
#include "lib/xiph/OggPacket.hxx"
2016-05-14 10:32:13 +02:00
#include "lib/xiph/OggFind.hxx"
2014-01-24 00:02:24 +01:00
#include "../DecoderAPI.hxx"
#include "decoder/Reader.hxx"
#include "input/Reader.hxx"
2013-01-07 22:12:09 +01:00
#include "OggCodec.hxx"
2017-02-08 08:26:58 +01:00
#include "tag/Handler.hxx"
#include "tag/Builder.hxx"
2014-01-24 16:18:21 +01:00
#include "input/InputStream.hxx"
#include "util/RuntimeError.hxx"
#include "Log.hxx"
#include <opus.h>
#include <ogg/ogg.h>
2013-07-30 20:11:57 +02:00
#include <string.h>
namespace {
constexpr opus_int32 opus_sample_rate = 48000;
/**
* Allocate an output buffer for 16 bit PCM samples big enough to hold
* a quarter second, larger than 120ms required by libopus.
*/
constexpr unsigned opus_output_buffer_frames = opus_sample_rate / 4;
gcc_pure
bool
IsOpusHead(const ogg_packet &packet) noexcept
{
return packet.bytes >= 8 && memcmp(packet.packet, "OpusHead", 8) == 0;
}
gcc_pure
bool
IsOpusTags(const ogg_packet &packet) noexcept
{
return packet.bytes >= 8 && memcmp(packet.packet, "OpusTags", 8) == 0;
}
/**
* Convert an EBU R128 value to ReplayGain.
*/
constexpr float
EbuR128ToReplayGain(float ebu_r128) noexcept
{
/* add 5dB to compensate for the different reference levels
between ReplayGain (89dB) and EBU R128 (-23 LUFS) */
return ebu_r128 + 5;
}
bool
mpd_opus_init([[maybe_unused]] const ConfigBlock &block)
{
LogDebug(opus_domain, opus_get_version_string());
return true;
}
class MPDOpusDecoder final : public OggDecoder {
2016-05-09 15:34:39 +02:00
OpusDecoder *opus_decoder = nullptr;
opus_int16 *output_buffer = nullptr;
/**
* The output gain from the Opus header in dB that should be
* applied unconditionally, but is often used specifically for
* ReplayGain. Initialized by OnOggBeginning().
*/
float output_gain;
2020-07-01 20:51:44 +02:00
/**
* The pre-skip value from the Opus header. Initialized by
* OnOggBeginning().
*/
unsigned pre_skip;
/**
* The number of decoded samples which shall be skipped. At
* the beginning of the file, this gets set to #pre_skip (by
* OnOggBeginning()), and may also be set while seeking.
*/
unsigned skip;
2014-11-11 07:41:01 +01:00
/**
* If non-zero, then a previous Opus stream has been found
* already with this number of channels. If opus_decoder is
* nullptr, then its end-of-stream packet has been found
* already.
*/
2016-05-09 15:34:39 +02:00
unsigned previous_channels = 0;
2014-11-11 07:41:01 +01:00
size_t frame_size;
/**
* The granulepos of the next sample to be submitted to
* DecoderClient::SubmitData(). Negative if unkown.
* Initialized by OnOggBeginning().
*/
ogg_int64_t granulepos;
/**
* Was DecoderClient::SubmitReplayGain() called? We need to
* keep track of this, because it will usually be called by
* HandleTags(), but if there is no OpusTags packet, we need
* to submit our #output_gain value from the OpusHead.
*/
bool submitted_replay_gain = false;
public:
explicit MPDOpusDecoder(DecoderReader &reader)
:OggDecoder(reader) {}
~MPDOpusDecoder();
/**
* Has DecoderClient::Ready() been called yet?
*/
[[nodiscard]] bool IsInitialized() const {
return previous_channels != 0;
}
bool Seek(uint64_t where_frame);
private:
void AddGranulepos(ogg_int64_t n) noexcept {
assert(n >= 0);
if (granulepos >= 0)
granulepos += n;
}
void HandleTags(const ogg_packet &packet);
void HandleAudio(const ogg_packet &packet);
protected:
/* virtual methods from class OggVisitor */
void OnOggBeginning(const ogg_packet &packet) override;
void OnOggPacket(const ogg_packet &packet) override;
void OnOggEnd() override;
};
MPDOpusDecoder::~MPDOpusDecoder()
{
delete[] output_buffer;
if (opus_decoder != nullptr)
opus_decoder_destroy(opus_decoder);
}
void
MPDOpusDecoder::OnOggPacket(const ogg_packet &packet)
{
if (IsOpusTags(packet))
HandleTags(packet);
else
HandleAudio(packet);
}
void
MPDOpusDecoder::OnOggBeginning(const ogg_packet &packet)
{
assert(packet.b_o_s);
if (opus_decoder != nullptr || !IsOpusHead(packet))
throw std::runtime_error("BOS packet must be OpusHead");
unsigned channels;
signed output_gain_i;
if (!ScanOpusHeader(packet.packet, packet.bytes, channels, output_gain_i, pre_skip) ||
!audio_valid_channel_count(channels))
throw std::runtime_error("Malformed BOS packet");
/* convert Q7.8 fixed-point to float */
output_gain = float(output_gain_i) / 256.0f;
granulepos = 0;
skip = pre_skip;
assert(opus_decoder == nullptr);
assert(IsInitialized() == (output_buffer != nullptr));
2014-11-11 07:41:01 +01:00
if (IsInitialized() && channels != previous_channels)
throw FormatRuntimeError("Next stream has different channels (%u -> %u)",
previous_channels, channels);
/* TODO: parse attributes from the OpusHead (sample rate,
channels, ...) */
int opus_error;
opus_decoder = opus_decoder_create(opus_sample_rate, channels,
&opus_error);
if (opus_decoder == nullptr)
throw FormatRuntimeError("libopus error: %s",
opus_strerror(opus_error));
if (IsInitialized()) {
2014-11-11 07:41:01 +01:00
/* decoder was already initialized by the previous
stream; skip the rest of this method */
LogDebug(opus_domain, "Found another stream");
return;
2014-11-11 07:41:01 +01:00
}
const auto eos_granulepos = UpdateEndGranulePos();
const auto duration = eos_granulepos >= 0
? SignedSongTime::FromScale<uint64_t>(eos_granulepos,
opus_sample_rate)
: SignedSongTime::Negative();
2014-11-11 07:41:01 +01:00
previous_channels = channels;
2013-08-03 21:00:50 +02:00
const AudioFormat audio_format(opus_sample_rate,
SampleFormat::S16, channels);
client.Ready(audio_format, eos_granulepos > 0, duration);
2013-08-03 21:00:50 +02:00
frame_size = audio_format.GetFrameSize();
if (output_buffer == nullptr)
/* note: if we ever support changing the channel count
in chained streams, we need to reallocate this
buffer instead of keeping it */
output_buffer = new opus_int16[opus_output_buffer_frames
* audio_format.channels];
auto cmd = client.GetCommand();
if (cmd != DecoderCommand::NONE)
throw cmd;
}
void
MPDOpusDecoder::OnOggEnd()
2014-11-11 08:36:22 +01:00
{
if (!IsSeekable() && IsInitialized()) {
2014-11-11 07:41:01 +01:00
/* allow chaining of (unseekable) streams */
assert(opus_decoder != nullptr);
assert(output_buffer != nullptr);
opus_decoder_destroy(opus_decoder);
opus_decoder = nullptr;
} else
throw StopDecoder();
2014-11-11 08:36:22 +01:00
}
inline void
MPDOpusDecoder::HandleTags(const ogg_packet &packet)
{
ReplayGainInfo rgi;
2013-10-25 19:05:49 +02:00
rgi.Clear();
TagBuilder tag_builder;
AddTagHandler h(tag_builder);
if (!ScanOpusTags(packet.packet, packet.bytes, &rgi, h))
return;
if (rgi.IsDefined()) {
/* submit all valid EBU R128 values with output_gain
applied */
if (rgi.track.IsDefined())
rgi.track.gain += EbuR128ToReplayGain(output_gain);
if (rgi.album.IsDefined())
rgi.album.gain += EbuR128ToReplayGain(output_gain);
client.SubmitReplayGain(&rgi);
submitted_replay_gain = true;
}
if (!tag_builder.empty()) {
Tag tag = tag_builder.Commit();
auto cmd = client.SubmitTag(input_stream, std::move(tag));
if (cmd != DecoderCommand::NONE)
throw cmd;
}
}
inline void
MPDOpusDecoder::HandleAudio(const ogg_packet &packet)
{
assert(opus_decoder != nullptr);
if (!submitted_replay_gain) {
/* if we didn't see an OpusTags packet with EBU R128
values, we still need to apply the output gain
value from the OpusHead packet; submit it as "track
gain" value */
ReplayGainInfo rgi;
rgi.Clear();
rgi.track.gain = EbuR128ToReplayGain(output_gain);
client.SubmitReplayGain(&rgi);
submitted_replay_gain = true;
}
int nframes = opus_decode(opus_decoder,
(const unsigned char*)packet.packet,
packet.bytes,
output_buffer, opus_output_buffer_frames,
0);
if (gcc_unlikely(nframes <= 0)) {
if (nframes < 0)
throw FormatRuntimeError("libopus error: %s",
opus_strerror(nframes));
else
return;
}
/* apply the "skip" value */
if (skip >= (unsigned)nframes) {
skip -= nframes;
AddGranulepos(nframes);
return;
}
const opus_int16 *data = output_buffer;
data += skip * previous_channels;
nframes -= skip;
AddGranulepos(skip);
skip = 0;
if (packet.e_o_s && packet.granulepos > 0 && granulepos >= 0) {
/* End Trimming (RFC7845 4.4): "The page with the 'end
of stream' flag set MAY have a granule position
that indicates the page contains less audio data
than would normally be returned by decoding up
through the final packet. This is used to end the
stream somewhere other than an even frame
boundary. [...] The remaining samples are
discarded. */
ogg_int64_t remaining = packet.granulepos - granulepos;
if (remaining <= 0)
return;
if (remaining < nframes)
nframes = remaining;
}
/* submit decoded samples to the DecoderClient */
const size_t nbytes = nframes * frame_size;
auto cmd = client.SubmitData(input_stream,
data, nbytes,
0);
if (cmd != DecoderCommand::NONE)
throw cmd;
if (packet.granulepos > 0) {
granulepos = packet.granulepos;
client.SubmitTimestamp(FloatDuration(granulepos - pre_skip)
/ opus_sample_rate);
} else
AddGranulepos(nframes);
}
2013-01-07 23:05:33 +01:00
bool
MPDOpusDecoder::Seek(uint64_t where_frame)
2013-01-07 23:05:33 +01:00
{
assert(IsSeekable());
2014-05-11 18:34:09 +02:00
assert(input_stream.IsSeekable());
assert(input_stream.KnownSize());
2013-01-07 23:05:33 +01:00
2014-08-26 11:33:45 +02:00
const ogg_int64_t where_granulepos(where_frame);
2013-01-07 23:05:33 +01:00
/* we don't know the exact granulepos after seeking, so let's
set it to -1 - it will be set after the next packet which
declares its granulepos */
granulepos = -1;
try {
SeekGranulePos(where_granulepos);
2020-07-01 20:51:44 +02:00
/* since all frame numbers are offset by the file's
pre-skip value, we need to apply it here as well;
we could just seek to "where_frame+pre_skip" as
well, but I think by decoding those samples and
discard them, we're safer */
skip = pre_skip;
return true;
} catch (...) {
return false;
}
2013-01-07 23:05:33 +01:00
}
void
mpd_opus_stream_decode(DecoderClient &client,
InputStream &input_stream)
{
if (ogg_codec_detect(&client, input_stream) != OGG_CODEC_OPUS)
return;
/* rewind the stream, because ogg_codec_detect() has
moved it */
try {
input_stream.LockRewind();
} catch (...) {
}
DecoderReader reader(client, input_stream);
MPDOpusDecoder d(reader);
while (true) {
try {
d.Visit();
break;
} catch (DecoderCommand cmd) {
if (cmd == DecoderCommand::SEEK) {
if (d.Seek(client.GetSeekFrame()))
client.CommandFinished();
else
client.SeekError();
} else if (cmd != DecoderCommand::NONE)
break;
}
}
}
bool
ReadAndParseOpusHead(OggSyncState &sync, OggStreamState &stream,
unsigned &channels, signed &output_gain, unsigned &pre_skip)
{
ogg_packet packet;
return OggReadPacket(sync, stream, packet) && packet.b_o_s &&
IsOpusHead(packet) &&
2020-07-01 17:48:44 +02:00
ScanOpusHeader(packet.packet, packet.bytes, channels,
output_gain, pre_skip) &&
audio_valid_channel_count(channels);
}
bool
ReadAndVisitOpusTags(OggSyncState &sync, OggStreamState &stream,
TagHandler &handler)
{
ogg_packet packet;
return OggReadPacket(sync, stream, packet) &&
IsOpusTags(packet) &&
ScanOpusTags(packet.packet, packet.bytes,
nullptr,
handler);
}
void
VisitOpusDuration(InputStream &is, OggSyncState &sync, OggStreamState &stream,
ogg_int64_t pre_skip, TagHandler &handler)
{
ogg_packet packet;
if (OggSeekFindEOS(sync, stream, packet, is) &&
packet.granulepos >= pre_skip) {
const auto duration =
SongTime::FromScale<uint64_t>(packet.granulepos,
opus_sample_rate);
handler.OnDuration(duration);
}
}
2013-01-07 23:06:02 +01:00
static bool
mpd_opus_scan_stream(InputStream &is, TagHandler &handler)
{
InputStreamReader reader(is);
OggSyncState oy(reader);
ogg_page first_page;
if (!oy.ExpectPage(first_page))
return false;
OggStreamState os(first_page);
unsigned channels, pre_skip;
signed output_gain;
if (!ReadAndParseOpusHead(oy, os, channels, output_gain, pre_skip) ||
!ReadAndVisitOpusTags(oy, os, handler))
return false;
handler.OnAudioFormat(AudioFormat(opus_sample_rate,
SampleFormat::S16, channels));
VisitOpusDuration(is, oy, os, pre_skip, handler);
return true;
}
const char *const opus_suffixes[] = {
"opus",
"ogg",
"oga",
nullptr
};
const char *const opus_mime_types[] = {
/* the official MIME type (RFC 5334) */
"audio/ogg",
/* deprecated (RFC 5334) */
"application/ogg",
/* deprecated; from an early draft */
"audio/opus",
nullptr
};
} /* anonymous namespace */
constexpr DecoderPlugin opus_decoder_plugin =
DecoderPlugin("opus", mpd_opus_stream_decode, mpd_opus_scan_stream)
.WithInit(mpd_opus_init)
.WithSuffixes(opus_suffixes)
.WithMimeTypes(opus_mime_types);