LibAudio: Add a FLAC encoder

This encoder can handle all integer formats and sample rates, though only two channels well. It uses fixed LPC and performs a close-to-optimal parameter search on the LPC order and residual Rice parameter, leading to decent compression already.
2025-07-27 16:57:46 +00:00 · 2023-07-05 00:10:35 +02:00 · 2023-07-05 00:10:35 +02:00 · 625aac2367
commit 625aac2367
parent 252b1328ea
7 changed files with 795 additions and 0 deletions
--- a/Userland/Libraries/LibAudio/FlacWriter.h
+++ b/Userland/Libraries/LibAudio/FlacWriter.h
@ -0,0 +1,118 @@
+/*
+ * Copyright (c) 2023, kleines Filmröllchen <filmroellchen@serenityos.org>
+ *
+ * SPDX-License-Identifier: BSD-2-Clause
+ */
+
+#pragma once
+
+#include <AK/MaybeOwned.h>
+#include <AK/Noncopyable.h>
+#include <AK/RefPtr.h>
+#include <AK/Stream.h>
+#include <AK/StringView.h>
+#include <LibAudio/Encoder.h>
+#include <LibAudio/FlacTypes.h>
+#include <LibAudio/Sample.h>
+#include <LibAudio/SampleFormats.h>
+#include <LibCore/Forward.h>
+
+namespace Audio {
+
+// Encodes the sign representation method used in Rice coding.
+// Numbers alternate between positive and negative: 0, 1, -1, 2, -2, 3, -3, 4, -4, 5, -5, ...
+ALWAYS_INLINE u32 signed_to_rice(i32 x);
+
+// Encode a single number encoded with exponential golomb encoding of the specified order (k).
+ALWAYS_INLINE ErrorOr<void> encode_unsigned_exp_golomb(u8 k, i32 value, BigEndianOutputBitStream& bit_stream);
+
+size_t count_exp_golomb_bits_in(u8 k, ReadonlySpan<i64> residuals);
+
+void predict_fixed_lpc(FlacFixedLPC order, ReadonlySpan<i64> samples, Span<i64> predicted_output);
+
+// A simple FLAC encoder that writes FLAC files compatible with the streamable subset.
+// The encoder currently has the following simple output properties:
+// FIXME: All frames have a fixed sample size, see below.
+// FIXME: All frames are encoded with the best fixed LPC predictor.
+// FIXME: All residuals are encoded in one Rice partition.
+class FlacWriter : public Encoder {
+    AK_MAKE_NONCOPYABLE(FlacWriter);
+    AK_MAKE_NONMOVABLE(FlacWriter);
+
+    /// Tunable static parameters. Please try to improve these; only some have already been well-tuned!
+
+    // Constant block size.
+    static constexpr size_t block_size = 1024;
+    // Used as a percentage to check residual costs before the estimated "necessary" estimation point.
+    // We usually over-estimate residual costs, so this prevents us from overshooting the actual bail point.
+    static constexpr double residual_cost_margin = 0.07;
+    // At what sample index to first estimate residuals, so that the residual parameter can "stabilize" through more encoded values.
+    static constexpr size_t first_residual_estimation = 16;
+    // How many samples to advance at minimum before estimating residuals again.
+    static constexpr size_t min_residual_estimation_step = 20;
+    // After how many useless (i.e. worse than current optimal) Rice parameters to abort parameter search.
+    // Note that due to the zig-zag search, we start with searching the parameters that are most likely to be good.
+    static constexpr size_t useless_parameter_threshold = 2;
+
+    enum class WriteState {
+        // Header has not been written at all, audio data cannot be written.
+        HeaderUnwritten,
+        // Header was written, i.e. sample format is finalized,
+        // but audio data has not been finalized and therefore some header information is still missing.
+        FormatFinalized,
+        // File is fully finalized, no more sample data can be written.
+        FullyFinalized,
+    };
+
+public:
+    static ErrorOr<NonnullOwnPtr<FlacWriter>> create(NonnullOwnPtr<SeekableStream> stream, u32 sample_rate = 44100, u8 num_channels = 2, u16 bits_per_sample = 16);
+    virtual ~FlacWriter();
+
+    virtual ErrorOr<void> write_samples(ReadonlySpan<Sample> samples) override;
+
+    virtual ErrorOr<void> finalize() override;
+
+    u32 sample_rate() const { return m_sample_rate; }
+    u8 num_channels() const { return m_num_channels; }
+    PcmSampleFormat sample_format() const { return integer_sample_format_for(m_bits_per_sample).value(); }
+    Stream const& output_stream() const { return *m_stream; }
+
+    ErrorOr<void> set_num_channels(u8 num_channels);
+    ErrorOr<void> set_sample_rate(u32 sample_rate);
+    ErrorOr<void> set_bits_per_sample(u16 bits_per_sample);
+    ErrorOr<void> finalize_header_format();
+
+private:
+    FlacWriter(NonnullOwnPtr<SeekableStream>);
+    ErrorOr<void> write_header();
+
+    ErrorOr<void> write_frame();
+    ErrorOr<void> write_subframe(ReadonlySpan<i64> subframe, BigEndianOutputBitStream& bit_stream);
+    ErrorOr<void> write_lpc_subframe(FlacLPCEncodedSubframe lpc_subframe, BigEndianOutputBitStream& bit_stream);
+    ErrorOr<void> write_verbatim_subframe(ReadonlySpan<i64> subframe, BigEndianOutputBitStream& bit_stream);
+    // Assumes 4-bit k for now.
+    ErrorOr<void> write_rice_partition(u8 k, ReadonlySpan<i64> residuals, BigEndianOutputBitStream& bit_stream);
+
+    // Aborts encoding once the costs exceed the previous minimum, thereby speeding up the encoder's parameter search.
+    // In this case, an empty Optional is returned.
+    ErrorOr<Optional<FlacLPCEncodedSubframe>> encode_fixed_lpc(FlacFixedLPC order, ReadonlySpan<i64> subframe, size_t current_min_cost);
+
+    NonnullOwnPtr<SeekableStream> m_stream;
+    WriteState m_state { WriteState::HeaderUnwritten };
+
+    Vector<Sample, block_size> m_sample_buffer {};
+    size_t m_current_frame { 0 };
+
+    u32 m_sample_rate;
+    u8 m_num_channels;
+    u16 m_bits_per_sample;
+
+    // Data updated during encoding; written to the header at the end.
+    u32 m_max_frame_size { 0 };
+    u32 m_min_frame_size { NumericLimits<u32>::max() };
+    size_t m_sample_count { 0 };
+    // Remember where the STREAMINFO block was written in the stream.
+    size_t m_streaminfo_start_index;
+};
+
+}