forked from sbooth/SFBAudioEngine
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathSFBFLACEncoder.mm
495 lines (393 loc) · 17.7 KB
/
SFBFLACEncoder.mm
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
//
// Copyright (c) 2020-2025 Stephen F. Booth <[email protected]>
// Part of https://github.com/sbooth/SFBAudioEngine
// MIT license
//
#import <algorithm>
#import <memory>
#import <os/log.h>
#import <FLAC/metadata.h>
#import <FLAC/stream_encoder.h>
#import "SFBFLACEncoder.h"
/// Encoder name returned by `+[SFBFLACEncoder encoderName]`
SFBAudioEncoderName const SFBAudioEncoderNameFLAC = @"org.sbooth.AudioEngine.Encoder.FLAC";
/// Encoder name returned by `+[SFBOggFLACEncoder encoderName]`
SFBAudioEncoderName const SFBAudioEncoderNameOggFLAC = @"org.sbooth.AudioEngine.Encoder.OggFLAC";
/// Settings key for the FLAC compression level (`NSNumber`); values outside 0 through 8 are ignored when the encoder is opened
SFBAudioEncodingSettingsKey const SFBAudioEncodingSettingsKeyFLACCompressionLevel = @"Compression Level";
/// Settings key controlling libFLAC's encoding verification (`NSNumber` read as a boolean)
SFBAudioEncodingSettingsKey const SFBAudioEncodingSettingsKeyFLACVerifyEncoding = @"Verify Encoding";
namespace {

/// Value stored in the `length` field of the padding metadata block created when the encoder is opened
constexpr uint32_t kDefaultPaddingSize = 8 * 1024;

/// Deleter releasing a `FLAC__StreamEncoder` through `FLAC__stream_encoder_delete`
struct flac__stream_encoder_deleter {
    void operator()(FLAC__StreamEncoder *streamEncoder) const noexcept
    {
        FLAC__stream_encoder_delete(streamEncoder);
    }
};

/// Deleter releasing a `FLAC__StreamMetadata` through `FLAC__metadata_object_delete`
struct flac__stream_metadata_deleter {
    void operator()(FLAC__StreamMetadata *block) const noexcept
    {
        FLAC__metadata_object_delete(block);
    }
};

/// Owning pointer to a libFLAC stream encoder
using flac__stream_encoder_unique_ptr = std::unique_ptr<FLAC__StreamEncoder, flac__stream_encoder_deleter>;
/// Owning pointer to a libFLAC metadata block
using flac__stream_metadata_unique_ptr = std::unique_ptr<FLAC__StreamMetadata, flac__stream_metadata_deleter>;

} /* namespace */
/// Private state shared by the FLAC and Ogg FLAC encoders
@interface SFBFLACEncoder ()
{
@private
/// The libFLAC stream encoder; non-null only while the encoder is open (see `-isOpen`)
flac__stream_encoder_unique_ptr _flac;
/// Seektable template; only created when `_estimatedFramesToEncode` is greater than zero
flac__stream_metadata_unique_ptr _seektable;
/// Padding metadata block
flac__stream_metadata_unique_ptr _padding;
/// Non-owning array of metadata block pointers passed to `FLAC__stream_encoder_set_metadata`
FLAC__StreamMetadata *_metadata [2];
@package
/// Position reported by `-framePosition`; written by the libFLAC write callback
AVAudioFramePosition _framePosition;
}
/// Initializes `encoder` for output through this object's callbacks.
/// `SFBOggFLACEncoder` overrides this method to initialize an Ogg FLAC stream instead of a native FLAC stream.
/// @param encoder An allocated, configured, and not yet initialized libFLAC encoder
/// @param error An optional pointer to an `NSError` object to receive error information
/// @return `YES` if libFLAC reported successful initialization, `NO` otherwise
- (BOOL)initializeFLACStreamEncoder:(FLAC__StreamEncoder *)encoder error:(NSError **)error;
@end
#pragma mark FLAC Callbacks
namespace {
/// libFLAC read callback: reads back up to `*bytes` bytes from the encoder's output source.
///
/// On success `*bytes` is updated to the number of bytes actually read.
/// @return `ABORT` if the read fails, `END_OF_STREAM` if nothing was read and the source is at EOF, `CONTINUE` otherwise
FLAC__StreamEncoderReadStatus read_callback(const FLAC__StreamEncoder *encoder, FLAC__byte buffer[], size_t *bytes, void *client_data) noexcept
{
#pragma unused(encoder)
    NSCParameterAssert(client_data != NULL);

    SFBFLACEncoder *owner = (__bridge SFBFLACEncoder *)client_data;
    SFBOutputSource *source = owner->_outputSource;

    const auto requested = static_cast<NSInteger>(*bytes);
    NSInteger received;
    const BOOL succeeded = [source readBytes:buffer length:requested bytesRead:&received error:nil];
    if(!succeeded)
        return FLAC__STREAM_ENCODER_READ_STATUS_ABORT;

    *bytes = static_cast<size_t>(received);

    // An empty read only signals the end of the stream when the source agrees
    const bool exhausted = (received == 0) && source.atEOF;
    return exhausted ? FLAC__STREAM_ENCODER_READ_STATUS_END_OF_STREAM : FLAC__STREAM_ENCODER_READ_STATUS_CONTINUE;
}
/// libFLAC write callback: writes `bytes` bytes of encoded data to the encoder's output source.
///
/// A failed or short write is reported as a fatal error. When `samples` is non-zero the
/// owning encoder's `_framePosition` is updated from `current_frame`.
// NOTE(review): libFLAC documents `current_frame` as the number of the frame being encoded,
// not a sample position — confirm this is the intended unit for `_framePosition`.
FLAC__StreamEncoderWriteStatus write_callback(const FLAC__StreamEncoder *encoder, const FLAC__byte buffer[], size_t bytes, uint32_t samples, uint32_t current_frame, void *client_data) noexcept
{
#pragma unused(encoder)
    NSCParameterAssert(client_data != nullptr);

    SFBFLACEncoder *owner = (__bridge SFBFLACEncoder *)client_data;
    SFBOutputSource *sink = owner->_outputSource;

    const auto expected = static_cast<NSInteger>(bytes);
    NSInteger written;
    if(![sink writeBytes:static_cast<const void *>(buffer) length:expected bytesWritten:&written error:nil])
        return FLAC__STREAM_ENCODER_WRITE_STATUS_FATAL_ERROR;

    // A partial write is treated the same as a failed write
    if(written != expected)
        return FLAC__STREAM_ENCODER_WRITE_STATUS_FATAL_ERROR;

    if(samples > 0)
        owner->_framePosition = current_frame;

    return FLAC__STREAM_ENCODER_WRITE_STATUS_OK;
}
/// libFLAC seek callback: repositions the encoder's output source to `absolute_byte_offset`.
/// @return `UNSUPPORTED` if the output source does not support seeking, `ERROR` if the seek fails, `OK` otherwise
FLAC__StreamEncoderSeekStatus seek_callback(const FLAC__StreamEncoder *encoder, FLAC__uint64 absolute_byte_offset, void *client_data) noexcept
{
#pragma unused(encoder)
    NSCParameterAssert(client_data != nullptr);

    SFBFLACEncoder *owner = (__bridge SFBFLACEncoder *)client_data;
    SFBOutputSource *target = owner->_outputSource;

    if(!target.supportsSeeking)
        return FLAC__STREAM_ENCODER_SEEK_STATUS_UNSUPPORTED;

    const auto destination = static_cast<NSInteger>(absolute_byte_offset);
    const BOOL moved = [target seekToOffset:destination error:nil];
    return moved ? FLAC__STREAM_ENCODER_SEEK_STATUS_OK : FLAC__STREAM_ENCODER_SEEK_STATUS_ERROR;
}
/// libFLAC tell callback: reports the current offset of the encoder's output source.
///
/// `*absolute_byte_offset` is only written when the offset was obtained successfully.
/// @return `ERROR` if the offset could not be obtained, `OK` otherwise
FLAC__StreamEncoderTellStatus tell_callback(const FLAC__StreamEncoder *encoder, FLAC__uint64 *absolute_byte_offset, void *client_data) noexcept
{
#pragma unused(encoder)
    NSCParameterAssert(client_data != nullptr);

    SFBFLACEncoder *owner = (__bridge SFBFLACEncoder *)client_data;
    SFBOutputSource *source = owner->_outputSource;

    NSInteger position;
    const BOOL known = [source getOffset:&position error:nil];
    if(!known)
        return FLAC__STREAM_ENCODER_TELL_STATUS_ERROR;

    *absolute_byte_offset = static_cast<FLAC__uint64>(position);
    return FLAC__STREAM_ENCODER_TELL_STATUS_OK;
}
/// libFLAC metadata callback; intentionally does nothing and ignores all of its arguments.
void metadata_callback(const FLAC__StreamEncoder * /* encoder */, const FLAC__StreamMetadata * /* metadata */, void * /* client_data */) noexcept
{
}
} /* namespace */
@implementation SFBFLACEncoder
/// Registers this class with `SFBAudioEncoder` when the class is loaded.
+ (void)load
{
    // Inside a class method `self` is the class object itself
    [SFBAudioEncoder registerSubclass:self];
}
/// Returns the path extensions handled by this encoder: `flac`.
+ (NSSet *)supportedPathExtensions
{
    return [NSSet setWithObjects:@"flac", nil];
}
/// Returns the MIME types handled by this encoder: `audio/flac`.
+ (NSSet *)supportedMIMETypes
{
    return [NSSet setWithObjects:@"audio/flac", nil];
}
/// Returns the name identifying this encoder, `SFBAudioEncoderNameFLAC`.
+ (SFBAudioEncoderName)encoderName
{
return SFBAudioEncoderNameFLAC;
}
/// Always returns `YES`.
- (BOOL)encodingIsLossless
{
return YES;
}
/// Returns the PCM format this encoder processes for audio in `sourceFormat`.
///
/// The processing format is interleaved, native-endian signed integer PCM with the source's
/// sample rate and channel count. Each sample occupies a 32-bit container; the bit depth is the
/// source bit depth rounded up to a whole number of bytes. 32-bit samples are packed, smaller
/// bit depths are high-aligned within the container.
/// @param sourceFormat The format of the audio to be encoded
/// @return The processing format, or `nil` if `sourceFormat` is floating point, has fewer than 1
/// or more than 8 channels, or has a bit depth of 0 or greater than 32
- (AVAudioFormat *)processingFormatForSourceFormat:(AVAudioFormat *)sourceFormat
{
    NSParameterAssert(sourceFormat != nil);

    const AudioStreamBasicDescription *sourceDescription = sourceFormat.streamDescription;
    const AVAudioChannelCount channelCount = sourceFormat.channelCount;

    // Floating-point samples and channel counts outside 1 through 8 are not supported
    if((sourceDescription->mFormatFlags & kAudioFormatFlagIsFloat) || channelCount < 1 || channelCount > 8)
        return nil;

    // Samples are carried in 32-bit containers and later shifted right by (32 - bit depth),
    // so a missing bit depth or one wider than the container cannot be represented
    if(sourceDescription->mBitsPerChannel < 1 || sourceDescription->mBitsPerChannel > 32)
        return nil;

    // Set up the processing format
    AudioStreamBasicDescription streamDescription{};

    streamDescription.mFormatID = kAudioFormatLinearPCM;
#pragma clang diagnostic push
#pragma clang diagnostic ignored "-Wdeprecated-anon-enum-enum-conversion"
    streamDescription.mFormatFlags = kAudioFormatFlagsNativeEndian | kAudioFormatFlagIsSignedInteger;
#pragma clang diagnostic pop

    streamDescription.mSampleRate = sourceFormat.sampleRate;
    streamDescription.mChannelsPerFrame = channelCount;

    // Round the bit depth up to a whole number of bytes
    streamDescription.mBitsPerChannel = ((sourceDescription->mBitsPerChannel + 7) / 8) * 8;
    if(streamDescription.mBitsPerChannel == 32)
        streamDescription.mFormatFlags |= kAudioFormatFlagIsPacked;
    else
        streamDescription.mFormatFlags |= kAudioFormatFlagIsAlignedHigh;

    // One 32-bit container per channel, one frame per packet
    streamDescription.mBytesPerPacket = sizeof(int32_t) * streamDescription.mChannelsPerFrame;
    streamDescription.mFramesPerPacket = 1;
    streamDescription.mBytesPerFrame = streamDescription.mBytesPerPacket / streamDescription.mFramesPerPacket;

    AVAudioChannelLayout *channelLayout = nil;
    switch(channelCount) {
        case 1: channelLayout = [AVAudioChannelLayout layoutWithLayoutTag:kAudioChannelLayoutTag_Mono]; break;
        case 2: channelLayout = [AVAudioChannelLayout layoutWithLayoutTag:kAudioChannelLayoutTag_Stereo]; break;
        case 3: channelLayout = [AVAudioChannelLayout layoutWithLayoutTag:kAudioChannelLayoutTag_MPEG_3_0_A]; break;
        case 4: channelLayout = [AVAudioChannelLayout layoutWithLayoutTag:kAudioChannelLayoutTag_WAVE_4_0_B]; break;
        case 5: channelLayout = [AVAudioChannelLayout layoutWithLayoutTag:kAudioChannelLayoutTag_WAVE_5_0_B]; break;
        case 6: channelLayout = [AVAudioChannelLayout layoutWithLayoutTag:kAudioChannelLayoutTag_WAVE_5_1_B]; break;
        case 7: channelLayout = [AVAudioChannelLayout layoutWithLayoutTag:kAudioChannelLayoutTag_WAVE_6_1]; break;
        case 8: channelLayout = [AVAudioChannelLayout layoutWithLayoutTag:kAudioChannelLayoutTag_WAVE_7_1]; break;
    }

    return [[AVAudioFormat alloc] initWithStreamDescription:&streamDescription channelLayout:channelLayout];
}
/// Opens the encoder: creates and configures a libFLAC stream encoder, attaches a padding block
/// (and a seektable template when the number of frames to encode is known), initializes the
/// stream via `-initializeFLACStreamEncoder:error:`, and publishes the output format.
///
/// The encoder and metadata blocks are only stored in the instance once every step has succeeded.
/// @param error An optional pointer to an `NSError` object to receive error information
/// @return `YES` on success, `NO` otherwise
- (BOOL)openReturningError:(NSError **)error
{
    if(![super openReturningError:error])
        return NO;

    // Failure helpers: populate `error` when requested and evaluate to NO
    const auto outOfMemory = [error]() -> BOOL {
        if(error)
            *error = [NSError errorWithDomain:NSPOSIXErrorDomain code:ENOMEM userInfo:nil];
        return NO;
    };
    const auto internalError = [error]() -> BOOL {
        if(error)
            *error = [NSError errorWithDomain:SFBAudioEncoderErrorDomain code:SFBAudioEncoderErrorCodeInternalError userInfo:nil];
        return NO;
    };

    // Create FLAC encoder
    flac__stream_encoder_unique_ptr encoder{FLAC__stream_encoder_new()};
    if(!encoder)
        return outOfMemory();

    // Output format
    // As long as the FLAC encoder is non-null and uninitialized these setters will succeed
    FLAC__stream_encoder_set_sample_rate(encoder.get(), static_cast<uint32_t>(_processingFormat.sampleRate));
    FLAC__stream_encoder_set_channels(encoder.get(), _processingFormat.channelCount);
    FLAC__stream_encoder_set_bits_per_sample(encoder.get(), _processingFormat.streamDescription->mBitsPerChannel);
    if(_estimatedFramesToEncode > 0)
        FLAC__stream_encoder_set_total_samples_estimate(encoder.get(), static_cast<FLAC__uint64>(_estimatedFramesToEncode));

    // Encoder compression level; only 0 through 8 are accepted, anything else is ignored
    NSNumber *requestedLevel = [_settings objectForKey:SFBAudioEncodingSettingsKeyFLACCompressionLevel];
    if(requestedLevel != nil) {
        const unsigned int level = requestedLevel.unsignedIntValue;
        if(level > 8)
            os_log_info(gSFBAudioEncoderLog, "Ignoring invalid FLAC compression level: %d", level);
        else if(!FLAC__stream_encoder_set_compression_level(encoder.get(), level)) {
            os_log_error(gSFBAudioEncoderLog, "FLAC__stream_encoder_set_compression_level failed: %{public}s", FLAC__stream_encoder_get_resolved_state_string(encoder.get()));
            return internalError();
        }
    }

    // Optional verification of the encoded output
    NSNumber *verifySetting = [_settings objectForKey:SFBAudioEncodingSettingsKeyFLACVerifyEncoding];
    if(verifySetting != nil)
        FLAC__stream_encoder_set_verify(encoder.get(), verifySetting.boolValue != 0);

    // Create the padding metadata block
    flac__stream_metadata_unique_ptr paddingBlock{FLAC__metadata_object_new(FLAC__METADATA_TYPE_PADDING)};
    if(!paddingBlock) {
        os_log_error(gSFBAudioEncoderLog, "FLAC__metadata_object_new failed");
        return outOfMemory();
    }
    paddingBlock->length = kDefaultPaddingSize;

    // Create a seektable when possible
    flac__stream_metadata_unique_ptr seekTemplate;
    if(_estimatedFramesToEncode > 0) {
        seekTemplate.reset(FLAC__metadata_object_new(FLAC__METADATA_TYPE_SEEKTABLE));
        if(!seekTemplate) {
            os_log_error(gSFBAudioEncoderLog, "FLAC__metadata_object_new failed");
            return outOfMemory();
        }

        // Append seekpoints (one every 10 seconds)
        const auto spacing = static_cast<uint32_t>(10 * _processingFormat.sampleRate);
        const auto totalFrames = static_cast<FLAC__uint64>(_estimatedFramesToEncode);
        if(!FLAC__metadata_object_seektable_template_append_spaced_points_by_samples(seekTemplate.get(), spacing, totalFrames)) {
            os_log_error(gSFBAudioEncoderLog, "FLAC__metadata_object_seektable_template_append_spaced_points_by_samples failed");
            return outOfMemory();
        }

        // Sort the table
        if(!FLAC__metadata_object_seektable_template_sort(seekTemplate.get(), false)) {
            os_log_error(gSFBAudioEncoderLog, "FLAC__metadata_object_seektable_template_sort failed");
            return outOfMemory();
        }
    }

    // Hand the metadata blocks to the encoder: padding first, then the seektable if present
    _metadata[0] = paddingBlock.get();
    if(seekTemplate)
        _metadata[1] = seekTemplate.get();

    if(!FLAC__stream_encoder_set_metadata(encoder.get(), _metadata, seekTemplate ? 2 : 1)) {
        os_log_error(gSFBAudioEncoderLog, "FLAC__stream_encoder_set_metadata failed: %{public}s", FLAC__stream_encoder_get_resolved_state_string(encoder.get()));
        return internalError();
    }

    // Initialize the FLAC encoder
    if(![self initializeFLACStreamEncoder:encoder.get() error:error])
        return NO;

    // Describe the encoded output
    AudioStreamBasicDescription outputDescription{};
    outputDescription.mFormatID = kAudioFormatFLAC;
    outputDescription.mSampleRate = _processingFormat.sampleRate;
    outputDescription.mChannelsPerFrame = _processingFormat.channelCount;
    outputDescription.mBitsPerChannel = _processingFormat.streamDescription->mBitsPerChannel;

    // The format flags record the source bit depth; other depths leave the flags at zero
    switch(outputDescription.mBitsPerChannel) {
        case 16: outputDescription.mFormatFlags = kAppleLosslessFormatFlag_16BitSourceData; break;
        case 20: outputDescription.mFormatFlags = kAppleLosslessFormatFlag_20BitSourceData; break;
        case 24: outputDescription.mFormatFlags = kAppleLosslessFormatFlag_24BitSourceData; break;
        case 32: outputDescription.mFormatFlags = kAppleLosslessFormatFlag_32BitSourceData; break;
    }

    outputDescription.mFramesPerPacket = FLAC__stream_encoder_get_blocksize(encoder.get());
    _outputFormat = [[AVAudioFormat alloc] initWithStreamDescription:&outputDescription channelLayout:_processingFormat.channelLayout];

    // Everything succeeded; transfer ownership to the instance
    _flac = std::move(encoder);
    _seektable = std::move(seekTemplate);
    _padding = std::move(paddingBlock);

    return YES;
}
/// Closes the encoder, releasing the libFLAC encoder and its metadata blocks before
/// forwarding to the superclass.
/// @param error An optional pointer to an `NSError` object to receive error information
/// @return The result of the superclass implementation
- (BOOL)closeReturningError:(NSError **)error
{
    // The metadata blocks were handed to the encoder when it was opened, so release the encoder first
    _flac = nullptr;
    _seektable = nullptr;
    _padding = nullptr;

    return [super closeReturningError:error];
}
/// Returns `YES` while a libFLAC encoder is held, i.e. between a successful open and the next close.
- (BOOL)isOpen
{
    return _flac ? YES : NO;
}
/// Returns the position most recently recorded by the libFLAC write callback.
- (AVAudioFramePosition)framePosition
{
return _framePosition;
}
/// Encodes up to `frameLength` frames of interleaved audio from `buffer`.
///
/// `frameLength` is clamped to the buffer's frame length; encoding zero frames succeeds trivially.
/// @param buffer A buffer in the encoder's processing format
/// @param frameLength The number of frames to encode
/// @param error An optional pointer to an `NSError` object to receive error information
/// @return `YES` on success, `NO` if libFLAC rejects the samples
- (BOOL)encodeFromBuffer:(AVAudioPCMBuffer *)buffer frameLength:(AVAudioFrameCount)frameLength error:(NSError **)error
{
    NSParameterAssert(buffer != nil);
    NSParameterAssert([buffer.format isEqual:_processingFormat]);

    // Never consume more frames than the buffer contains
    frameLength = std::min(frameLength, buffer.frameLength);
    if(frameLength == 0)
        return YES;

    // libFLAC consumes signed 32-bit samples whose values lie within the range of the
    // stream's bit depth (e.g. [-32768, 32767] for 16-bit audio), so samples that are
    // high-aligned in the processing format must be shifted down before the handoff.

    // Probably unnecessary sanity check
    static_assert(std::is_same_v<int32_t, FLAC__int32>, "int32_t and FLAC__int32 are different types");
    // Ensure implementation-defined right shift for negative numbers is arithmetic
    static_assert(~0 >> 1 == ~0, "signed right shift is not arithmetic");

    const auto description = _processingFormat.streamDescription;
    const auto bitsPerSample = description->mBitsPerChannel;

    // 32-bit samples already span the full container and pass straight through
    if(bitsPerSample == 32) {
        const auto samples = static_cast<int32_t *>(buffer.audioBufferList->mBuffers[0].mData);
        if(!FLAC__stream_encoder_process_interleaved(_flac.get(), samples, frameLength)) {
            os_log_error(gSFBAudioEncoderLog, "FLAC__stream_encoder_process_interleaved failed: %{public}s", FLAC__stream_encoder_get_resolved_state_string(_flac.get()));
            if(error)
                *error = [NSError errorWithDomain:SFBAudioEncoderErrorDomain code:SFBAudioEncoderErrorCodeInternalError userInfo:nil];
            return NO;
        }
        return YES;
    }

    // Narrower samples are converted in chunks through a fixed-size scratch buffer
    int32_t scratch [512];
    const AVAudioFrameCount framesPerChunk = sizeof(scratch) / description->mBytesPerFrame;
    const auto shift = 32 - bitsPerSample;
    const auto samplesPerFrame = buffer.stride;
    const auto base = reinterpret_cast<uintptr_t>(buffer.audioBufferList->mBuffers[0].mData);

    for(AVAudioFrameCount framesDone = 0; framesDone < frameLength; ) {
        const auto frameCount = std::min(framesPerChunk, frameLength - framesDone);
        const auto byteOffset = framesDone * description->mBytesPerFrame;
        const auto src = static_cast<int32_t *>(reinterpret_cast<void *>(base + byteOffset));

        // Shift from high alignment, sign extending in the process
        for(AVAudioFrameCount i = 0; i < frameCount * samplesPerFrame; ++i)
            scratch[i] = src[i] >> shift;

        if(!FLAC__stream_encoder_process_interleaved(_flac.get(), scratch, frameCount)) {
            os_log_error(gSFBAudioEncoderLog, "FLAC__stream_encoder_process_interleaved failed: %{public}s", FLAC__stream_encoder_get_resolved_state_string(_flac.get()));
            if(error)
                *error = [NSError errorWithDomain:SFBAudioEncoderErrorDomain code:SFBAudioEncoderErrorCodeInternalError userInfo:nil];
            return NO;
        }

        framesDone += frameCount;
    }

    return YES;
}
/// Finishes encoding by calling `FLAC__stream_encoder_finish`.
/// @param error An optional pointer to an `NSError` object to receive error information
/// @return `YES` if libFLAC reported success, `NO` otherwise
- (BOOL)finishEncodingReturningError:(NSError **)error
{
    if(FLAC__stream_encoder_finish(_flac.get()))
        return YES;

    os_log_error(gSFBAudioEncoderLog, "FLAC__stream_encoder_finish failed: %{public}s", FLAC__stream_encoder_get_resolved_state_string(_flac.get()));
    if(error)
        *error = [NSError errorWithDomain:SFBAudioEncoderErrorDomain code:SFBAudioEncoderErrorCodeInternalError userInfo:nil];
    return NO;
}
/// Initializes `encoder` as a native FLAC stream that delivers its output through this
/// object's write, seek, tell, and metadata callbacks.
/// @param encoder An allocated, configured, and not yet initialized libFLAC encoder
/// @param error An optional pointer to an `NSError` object to receive error information
/// @return `YES` if libFLAC reported successful initialization, `NO` otherwise
- (BOOL)initializeFLACStreamEncoder:(FLAC__StreamEncoder *)encoder error:(NSError **)error
{
    NSParameterAssert(encoder != nullptr);

    const auto status = FLAC__stream_encoder_init_stream(encoder, write_callback, seek_callback, tell_callback, metadata_callback, (__bridge void *)self);
    if(status == FLAC__STREAM_ENCODER_INIT_STATUS_OK)
        return YES;

    os_log_error(gSFBAudioEncoderLog, "FLAC__stream_encoder_init_stream failed: %{public}s", FLAC__stream_encoder_get_resolved_state_string(encoder));
    if(error)
        *error = [NSError errorWithDomain:SFBAudioEncoderErrorDomain code:SFBAudioEncoderErrorCodeInternalError userInfo:nil];
    return NO;
}
@end
/// Encoder producing FLAC audio in an Ogg container.
@implementation SFBOggFLACEncoder

/// Registers this class with `SFBAudioEncoder` when the class is loaded.
+ (void)load
{
    // Inside a class method `self` is the class object itself
    [SFBAudioEncoder registerSubclass:self];
}

/// Returns the path extensions handled by this encoder: `oga`.
+ (NSSet *)supportedPathExtensions
{
    return [NSSet setWithObjects:@"oga", nil];
}

/// Returns the MIME types handled by this encoder: `audio/ogg; codecs=flac`.
+ (NSSet *)supportedMIMETypes
{
    return [NSSet setWithObjects:@"audio/ogg; codecs=flac", nil];
}

/// Returns the name identifying this encoder, `SFBAudioEncoderNameOggFLAC`.
+ (SFBAudioEncoderName)encoderName
{
    return SFBAudioEncoderNameOggFLAC;
}

/// Always returns `YES`.
- (BOOL)encodingIsLossless
{
    return YES;
}

/// Initializes `encoder` as an Ogg FLAC stream with a random serial number, delivering its
/// output through the read, write, seek, tell, and metadata callbacks.
/// @param encoder An allocated, configured, and not yet initialized libFLAC encoder
/// @param error An optional pointer to an `NSError` object to receive error information
/// @return `YES` if libFLAC reported successful initialization, `NO` otherwise
- (BOOL)initializeFLACStreamEncoder:(FLAC__StreamEncoder *)encoder error:(NSError **)error
{
    NSParameterAssert(encoder != nullptr);

    // As long as the FLAC encoder is non-null and uninitialized this setter will succeed
    const auto serialNumber = static_cast<int>(arc4random());
    FLAC__stream_encoder_set_ogg_serial_number(encoder, serialNumber);

    const auto status = FLAC__stream_encoder_init_ogg_stream(encoder, read_callback, write_callback, seek_callback, tell_callback, metadata_callback, (__bridge void *)self);
    if(status == FLAC__STREAM_ENCODER_INIT_STATUS_OK)
        return YES;

    os_log_error(gSFBAudioEncoderLog, "FLAC__stream_encoder_init_ogg_stream failed: %{public}s", FLAC__stream_encoder_get_resolved_state_string(encoder));
    if(error)
        *error = [NSError errorWithDomain:SFBAudioEncoderErrorDomain code:SFBAudioEncoderErrorCodeInternalError userInfo:nil];
    return NO;
}

@end