OpusEncoderPlugin.cxx 9.13 KB
Newer Older
1
/*
Max Kellermann's avatar
Max Kellermann committed
2
 * Copyright 2003-2021 The Music Player Daemon Project
3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20
 * http://www.musicpd.org
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
 */

#include "OpusEncoderPlugin.hxx"
21
#include "OggEncoder.hxx"
22
#include "pcm/AudioFormat.hxx"
23
#include "util/ByteOrder.hxx"
24
#include "util/StringUtil.hxx"
25 26 27 28

#include <opus.h>
#include <ogg/ogg.h>

29
#include <cassert>
30 31
#include <stdexcept>

32
#include <stdlib.h>
33

34
namespace {
35

36
class OpusEncoder final : public OggEncoder {
37
	const AudioFormat audio_format;
38

39
	const size_t frame_size;
40

41 42 43
	const size_t buffer_frames, buffer_size;
	size_t buffer_position = 0;
	uint8_t *const buffer;
44

45
	::OpusEncoder *const enc;
46 47 48

	unsigned char buffer2[1275 * 3 + 7];

49 50
	int lookahead;

51
	ogg_int64_t packetno = 0;
52

53
	ogg_int64_t granulepos = 0;
54

55
public:
56
	OpusEncoder(AudioFormat &_audio_format, ::OpusEncoder *_enc, bool _chaining);
57
	~OpusEncoder() noexcept override;
58

59
	/* virtual methods from class Encoder */
60 61
	void End() override;
	void Write(const void *data, size_t length) override;
62

63 64
	void PreTag() override;
	void SendTag(const Tag &tag) override;
65

66
private:
67 68
	void DoEncode(bool eos);
	void WriteSilence(unsigned fill_frames);
69

70 71 72
	void GenerateHeaders(const Tag *tag) noexcept;
	void GenerateHead() noexcept;
	void GenerateTags(const Tag *tag) noexcept;
73 74
};

75
class PreparedOpusEncoder final : public PreparedEncoder {
76 77 78
	opus_int32 bitrate;
	int complexity;
	int signal;
79
	const bool chaining;
80

81
public:
Max Kellermann's avatar
Max Kellermann committed
82
	explicit PreparedOpusEncoder(const ConfigBlock &block);
83 84

	/* virtual methods from class PreparedEncoder */
85
	Encoder *Open(AudioFormat &audio_format) override;
86

87
	[[nodiscard]] const char *GetMimeType() const noexcept override {
88 89
		return "audio/ogg";
	}
90 91
};

92
PreparedOpusEncoder::PreparedOpusEncoder(const ConfigBlock &block)
93
	:chaining(block.GetBlockValue("opustags", false))
94
{
95
	const char *value = block.GetBlockValue("bitrate", "auto");
96
	if (strcmp(value, "auto") == 0)
97
		bitrate = OPUS_AUTO;
98
	else if (strcmp(value, "max") == 0)
99
		bitrate = OPUS_BITRATE_MAX;
100 101
	else {
		char *endptr;
102
		bitrate = strtoul(value, &endptr, 10);
103
		if (endptr == value || *endptr != 0 ||
104 105
		    bitrate < 500 || bitrate > 512000)
			throw std::runtime_error("Invalid bit rate");
106 107
	}

108
	complexity = block.GetBlockValue("complexity", 10U);
109 110
	if (complexity > 10)
		throw std::runtime_error("Invalid complexity");
111

112
	value = block.GetBlockValue("signal", "auto");
113
	if (strcmp(value, "auto") == 0)
114
		signal = OPUS_AUTO;
115
	else if (strcmp(value, "voice") == 0)
116
		signal = OPUS_SIGNAL_VOICE;
117
	else if (strcmp(value, "music") == 0)
118
		signal = OPUS_SIGNAL_MUSIC;
119 120
	else
		throw std::runtime_error("Invalid signal");
121 122
}

123
PreparedEncoder *
124
opus_encoder_init(const ConfigBlock &block)
125
{
126
	return new PreparedOpusEncoder(block);
127 128
}

129 130
OpusEncoder::OpusEncoder(AudioFormat &_audio_format, ::OpusEncoder *_enc, bool _chaining)
	:OggEncoder(_chaining),
131 132 133 134
	 audio_format(_audio_format),
	 frame_size(_audio_format.GetFrameSize()),
	 buffer_frames(_audio_format.sample_rate / 50),
	 buffer_size(frame_size * buffer_frames),
135
	 buffer(new uint8_t[buffer_size]),
136 137 138
	 enc(_enc)
{
	opus_encoder_ctl(enc, OPUS_GET_LOOKAHEAD(&lookahead));
139
	GenerateHeaders(nullptr);
140 141 142
}

Encoder *
143
PreparedOpusEncoder::Open(AudioFormat &audio_format)
144 145
{
	/* libopus supports only 48 kHz */
146
	audio_format.sample_rate = 48000;
147

148 149
	if (audio_format.channels > 2)
		audio_format.channels = 1;
150

151
	switch (audio_format.format) {
152 153
	case SampleFormat::S16:
	case SampleFormat::FLOAT:
154 155
		break;

156
	case SampleFormat::S8:
157
		audio_format.format = SampleFormat::S16;
158 159 160
		break;

	default:
161
		audio_format.format = SampleFormat::FLOAT;
162 163 164
		break;
	}

165
	int error_code;
166 167 168 169
	auto *enc = opus_encoder_create(audio_format.sample_rate,
					audio_format.channels,
					OPUS_APPLICATION_AUDIO,
					&error_code);
170 171
	if (enc == nullptr)
		throw std::runtime_error(opus_strerror(error_code));
172

173 174 175
	opus_encoder_ctl(enc, OPUS_SET_BITRATE(bitrate));
	opus_encoder_ctl(enc, OPUS_SET_COMPLEXITY(complexity));
	opus_encoder_ctl(enc, OPUS_SET_SIGNAL(signal));
176

177
	return new OpusEncoder(audio_format, enc, chaining);
178 179
}

180
OpusEncoder::~OpusEncoder() noexcept
181
{
182
	delete[] buffer;
183 184 185
	opus_encoder_destroy(enc);
}

186 187
void
OpusEncoder::DoEncode(bool eos)
188
{
189
	assert(buffer_position == buffer_size || eos);
190 191

	opus_int32 result =
192 193
		audio_format.format == SampleFormat::S16
		? opus_encode(enc,
194 195 196 197
		              (const opus_int16 *)buffer,
		              buffer_frames,
		              buffer2,
		              sizeof(buffer2))
198
		: opus_encode_float(enc,
199 200 201 202
		                    (const float *)buffer,
		                    buffer_frames,
		                    buffer2,
		                    sizeof(buffer2));
203 204
	if (result < 0)
		throw std::runtime_error("Opus encoder error");
205

206
	granulepos += buffer_position / frame_size;
207

208
	ogg_packet packet;
209
	packet.packet = buffer2;
210 211 212
	packet.bytes = result;
	packet.b_o_s = false;
	packet.e_o_s = eos;
213 214 215
	packet.granulepos = granulepos;
	packet.packetno = packetno++;
	stream.PacketIn(packet);
216

217
	buffer_position = 0;
218 219
}

220 221
void
OpusEncoder::End()
222
{
223 224
	memset(buffer + buffer_position, 0,
	       buffer_size - buffer_position);
225
	DoEncode(true);
226
	Flush();
227 228
}

229 230
void
OpusEncoder::WriteSilence(unsigned fill_frames)
231 232
{
	size_t fill_bytes = fill_frames * frame_size;
233 234

	while (fill_bytes > 0) {
235
		size_t nbytes = buffer_size - buffer_position;
236 237 238
		if (nbytes > fill_bytes)
			nbytes = fill_bytes;

239 240
		memset(buffer + buffer_position, 0, nbytes);
		buffer_position += nbytes;
241 242
		fill_bytes -= nbytes;

243 244
		if (buffer_position == buffer_size)
			DoEncode(false);
245 246 247
	}
}

248 249
void
OpusEncoder::Write(const void *_data, size_t length)
250
{
Max Kellermann's avatar
Max Kellermann committed
251
	const auto *data = (const uint8_t *)_data;
252

253
	if (lookahead > 0) {
254 255 256
		/* generate some silence at the beginning of the
		   stream */

257
		assert(buffer_position == 0);
258

259
		WriteSilence(lookahead);
260
		lookahead = 0;
261 262
	}

263
	while (length > 0) {
264
		size_t nbytes = buffer_size - buffer_position;
265 266 267
		if (nbytes > length)
			nbytes = length;

268
		memcpy(buffer + buffer_position, data, nbytes);
269 270
		data += nbytes;
		length -= nbytes;
271
		buffer_position += nbytes;
272

273 274
		if (buffer_position == buffer_size)
			DoEncode(false);
275 276 277
	}
}

278
void
279
OpusEncoder::GenerateHeaders(const Tag *tag) noexcept
280 281 282 283 284
{
	GenerateHead();
	GenerateTags(tag);
}

285
void
286
OpusEncoder::GenerateHead() noexcept
287 288 289 290
{
	unsigned char header[19];
	memcpy(header, "OpusHead", 8);
	header[8] = 1;
291 292 293
	header[9] = audio_format.channels;
	*(uint16_t *)(header + 10) = ToLE16(lookahead);
	*(uint32_t *)(header + 12) = ToLE32(audio_format.sample_rate);
294 295 296 297 298 299
	header[16] = 0;
	header[17] = 0;
	header[18] = 0;

	ogg_packet packet;
	packet.packet = header;
300
	packet.bytes = sizeof(header);
301 302 303
	packet.b_o_s = true;
	packet.e_o_s = false;
	packet.granulepos = 0;
304 305
	packet.packetno = packetno++;
	stream.PacketIn(packet);
306
	// flush not needed because libogg autoflushes on b_o_s flag
307 308
}

309
void
310
OpusEncoder::GenerateTags(const Tag *tag) noexcept
311 312 313 314
{
	const char *version = opus_get_version_string();
	size_t version_length = strlen(version);

315
	// len("OpusTags") + 4 byte version length + len(version) + 4 byte tag count
316
	size_t comments_size = 8 + 4 + version_length + 4;
317 318 319 320 321 322 323 324 325
	uint32_t tag_count = 0;
	if (tag) {
		for (const auto &item: *tag) {
			++tag_count;
			// 4 byte length + len(tagname) + len('=') + len(value)
			comments_size += 4 + strlen(tag_item_names[item.type]) + 1 + strlen(item.value);
		}
	}

Max Kellermann's avatar
Max Kellermann committed
326
	auto *comments = new unsigned char[comments_size];
327 328
	unsigned char *p = comments;

329
	memcpy(comments, "OpusTags", 8);
330
	*(uint32_t *)(comments + 8) = ToLE32(version_length);
331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358
	p += 12;

	memcpy(p, version, version_length);
	p += version_length;

	tag_count = ToLE32(tag_count);
	memcpy(p, &tag_count, 4);
	p += 4;

	if (tag) {
		for (const auto &item: *tag) {
			size_t tag_name_len = strlen(tag_item_names[item.type]);
			size_t tag_val_len = strlen(item.value);
			uint32_t tag_len_le = ToLE32(tag_name_len + 1 + tag_val_len);

			memcpy(p, &tag_len_le, 4);
			p += 4;

			ToUpperASCII((char *)p, tag_item_names[item.type], tag_name_len + 1);
			p += tag_name_len;

			*p++ = '=';

			memcpy(p, item.value, tag_val_len);
			p += tag_val_len;
		}
	}
	assert(comments + comments_size == p);
359 360 361 362 363 364 365

	ogg_packet packet;
	packet.packet = comments;
	packet.bytes = comments_size;
	packet.b_o_s = false;
	packet.e_o_s = false;
	packet.granulepos = 0;
366 367
	packet.packetno = packetno++;
	stream.PacketIn(packet);
368
	Flush();
369

370
	delete[] comments;
371 372
}

373 374
void
OpusEncoder::PreTag()
375
{
376 377 378 379 380
	End();
	packetno = 0;
	granulepos = 0; // not really required, but useful to prevent wraparound
	opus_encoder_ctl(enc, OPUS_RESET_STATE);
}
381

382 383 384 385 386 387
void
OpusEncoder::SendTag(const Tag &tag)
{
	stream.Reinitialize(GenerateOggSerial());
	opus_encoder_ctl(enc, OPUS_GET_LOOKAHEAD(&lookahead));
	GenerateHeaders(&tag);
388
}
389

390
} // namespace
391

392
const EncoderPlugin opus_encoder_plugin = {
393 394 395
	"opus",
	opus_encoder_init,
};