AK: Increase LittleEndianOutputBitStream's buffer size and remove loops

This is very similar to the LittleEndianInputBitStream bit buffer change
from 8e834d4bb2.

We currently buffer one byte of data for the underlying stream, and when
we put bits into that buffer, we do so one bit at a time.

This replaces the u8 buffer with a u64. Instead of looping over the bits
one by one, we perform bitwise operations to write the desired number of
bits.

Using the "enwik8" file as a test (100MB uncompressed, commonly used in
benchmarks: https://www.mattmahoney.net/dc/enwik8.zip), compression time
decreases from:

    13.62s to 10.9s on Serenity (cold)
    13.62s to 9.22s on Serenity (warm)
    2.93s to 2.32s on Linux

One caveat is that callers must now explicitly flush any leftover bits
when they are done with the stream. The one-byte buffer implementation
implicitly flushed its data every time the output became byte-aligned,
because reaching a byte boundary meant the buffered byte was full. That
is no longer the case with a 64-bit buffer. For now, this should be fine,
as the one user of this class, DEFLATE, already has a "flush everything
now that we're done" finalizer.
This commit is contained in:
Timothy Flynn 2023-04-01 16:19:21 -04:00 committed by Andreas Kling
parent d74fa5e283
commit eed956b473
3 changed files with 84 additions and 49 deletions

View file

@ -117,9 +117,18 @@ private:
MaybeOwned<Stream> m_stream;
};
/// A stream wrapper class that allows you to read arbitrary amounts of bits
/// in little-endian order from another stream.
class LittleEndianInputBitStream : public Stream {
class LittleEndianBitStream : public Stream {
protected:
using BufferType = u64;
static constexpr size_t bits_per_byte = 8u;
static constexpr size_t bit_buffer_size = sizeof(BufferType) * bits_per_byte;
/// Stores the given stream (moved in) as the underlying stream for this bit stream.
/// Declared in the protected section, so it is only reachable from derived classes.
explicit LittleEndianBitStream(MaybeOwned<Stream> stream)
: m_stream(move(stream))
{
}
template<Unsigned T>
static constexpr T lsb_mask(T bits)
{
@ -129,9 +138,26 @@ class LittleEndianInputBitStream : public Stream {
return bits == 0 ? 0 : max >> (digits - bits);
}
/// Returns the bit buffer shifted right by m_bit_offset, so that the bit at
/// position m_bit_offset ends up in the least significant bit of the result.
ALWAYS_INLINE BufferType lsb_aligned_buffer() const
{
// Shifting by the full width of the buffer type is undefined behavior in C++,
// so an offset equal to the buffer size is answered with 0 directly.
if (m_bit_offset == bit_buffer_size)
return 0;
return m_bit_buffer >> m_bit_offset;
}
/// Whether m_bit_count is currently a whole multiple of bits_per_byte.
ALWAYS_INLINE bool is_aligned_to_byte_boundary() const
{
auto const bits_past_boundary = m_bit_count % bits_per_byte;
return bits_past_boundary == 0;
}
MaybeOwned<Stream> m_stream;
BufferType m_bit_buffer { 0 };
u8 m_bit_offset { 0 };
u8 m_bit_count { 0 };
};
/// A stream wrapper class that allows you to read arbitrary amounts of bits
/// in little-endian order from another stream.
class LittleEndianInputBitStream : public LittleEndianBitStream {
public:
explicit LittleEndianInputBitStream(MaybeOwned<Stream> stream)
: m_stream(move(stream))
: LittleEndianBitStream(move(stream))
{
}
@ -217,17 +243,7 @@ public:
return remaining_bits;
}
/// Whether we are (accidentally or intentionally) at a byte boundary right now.
ALWAYS_INLINE bool is_aligned_to_byte_boundary() const { return m_bit_count % bits_per_byte == 0; }
private:
using BufferType = u64;
ALWAYS_INLINE BufferType lsb_aligned_buffer() const
{
return m_bit_offset == bit_buffer_size ? 0 : m_bit_buffer >> m_bit_offset;
}
ErrorOr<void> refill_buffer_from_stream()
{
size_t bits_to_read = bit_buffer_size - m_bit_count;
@ -242,15 +258,6 @@ private:
return {};
}
static constexpr size_t bits_per_byte = 8u;
static constexpr size_t bit_buffer_size = sizeof(BufferType) * bits_per_byte;
MaybeOwned<Stream> m_stream;
BufferType m_bit_buffer { 0 };
u8 m_bit_offset { 0 };
u8 m_bit_count { 0 };
};
/// A stream wrapper class that allows you to write arbitrary amounts of bits
@ -333,10 +340,10 @@ private:
/// A stream wrapper class that allows you to write arbitrary amounts of bits
/// in little-endian order to another stream.
class LittleEndianOutputBitStream : public Stream {
class LittleEndianOutputBitStream : public LittleEndianBitStream {
public:
explicit LittleEndianOutputBitStream(MaybeOwned<Stream> stream)
: m_stream(move(stream))
: LittleEndianBitStream(move(stream))
{
}
@ -347,28 +354,52 @@ public:
virtual ErrorOr<size_t> write_some(ReadonlyBytes bytes) override
{
VERIFY(m_bit_offset == 0);
VERIFY(is_aligned_to_byte_boundary());
if (m_bit_count > 0)
TRY(flush_buffer_to_stream());
return m_stream->write_some(bytes);
}
template<Unsigned T>
ErrorOr<void> write_bits(T value, size_t bit_count)
ErrorOr<void> write_bits(T value, size_t count)
{
VERIFY(m_bit_offset <= 7);
if (m_bit_count == bit_buffer_size) {
TRY(flush_buffer_to_stream());
} else if (auto remaining = bit_buffer_size - m_bit_count; count >= remaining) {
m_bit_buffer |= (static_cast<BufferType>(value) & lsb_mask<BufferType>(remaining)) << m_bit_count;
m_bit_count = bit_buffer_size;
size_t input_offset = 0;
while (input_offset < bit_count) {
u8 next_bit = (value >> input_offset) & 1;
input_offset++;
if (remaining != sizeof(value) * bits_per_byte)
value >>= remaining;
count -= remaining;
m_current_byte |= next_bit << m_bit_offset;
m_bit_offset++;
TRY(flush_buffer_to_stream());
}
if (m_bit_offset > 7) {
TRY(m_stream->write_value(m_current_byte));
m_bit_offset = 0;
m_current_byte = 0;
}
if (count == 0)
return {};
m_bit_buffer |= static_cast<BufferType>(value) << m_bit_count;
m_bit_count += count;
return {};
}
ALWAYS_INLINE ErrorOr<void> flush_buffer_to_stream()
{
auto bytes_to_write = m_bit_count / bits_per_byte;
TRY(m_stream->write_until_depleted({ &m_bit_buffer, bytes_to_write }));
if (m_bit_count == bit_buffer_size) {
m_bit_buffer = 0;
m_bit_count = 0;
} else {
auto bits_written = bytes_to_write * bits_per_byte;
m_bit_buffer >>= bits_written;
m_bit_count -= bits_written;
}
return {};
@ -390,23 +421,16 @@ public:
size_t bit_offset() const
{
return m_bit_offset;
return m_bit_count;
}
ErrorOr<void> align_to_byte_boundary()
{
if (m_bit_offset == 0)
return {};
if (auto offset = m_bit_count % bits_per_byte; offset != 0)
TRY(write_bits<u8>(0u, bits_per_byte - offset));
TRY(write_bits(0u, 8 - m_bit_offset));
VERIFY(m_bit_offset == 0);
return {};
}
private:
MaybeOwned<Stream> m_stream;
u8 m_current_byte { 0 };
size_t m_bit_offset { 0 };
};
}

View file

@ -22,6 +22,8 @@ TEST_CASE(little_endian_bit_stream_input_output_match)
{
MUST(bit_write_stream.write_bits(0b1111u, 4));
MUST(bit_write_stream.write_bits(0b1111u, 4));
MUST(bit_write_stream.flush_buffer_to_stream());
auto result = MUST(bit_read_stream.read_bits(4));
EXPECT_EQ(0b1111u, result);
result = MUST(bit_read_stream.read_bits(4));
@ -30,6 +32,8 @@ TEST_CASE(little_endian_bit_stream_input_output_match)
{
MUST(bit_write_stream.write_bits(0b0000u, 4));
MUST(bit_write_stream.write_bits(0b0000u, 4));
MUST(bit_write_stream.flush_buffer_to_stream());
auto result = MUST(bit_read_stream.read_bits(4));
EXPECT_EQ(0b0000u, result);
result = MUST(bit_read_stream.read_bits(4));
@ -40,6 +44,8 @@ TEST_CASE(little_endian_bit_stream_input_output_match)
{
MUST(bit_write_stream.write_bits(0b1000u, 4));
MUST(bit_write_stream.write_bits(0b1000u, 4));
MUST(bit_write_stream.flush_buffer_to_stream());
auto result = MUST(bit_read_stream.read_bits(4));
EXPECT_EQ(0b1000u, result);
result = MUST(bit_read_stream.read_bits(4));
@ -50,6 +56,8 @@ TEST_CASE(little_endian_bit_stream_input_output_match)
{
MUST(bit_write_stream.write_bits(0b1000u, 4));
MUST(bit_write_stream.write_bits(0b0100u, 4));
MUST(bit_write_stream.flush_buffer_to_stream());
auto result = MUST(bit_read_stream.read_bits(4));
EXPECT_EQ(0b1000u, result);
result = MUST(bit_read_stream.read_bits(4));
@ -59,6 +67,8 @@ TEST_CASE(little_endian_bit_stream_input_output_match)
// Test a pattern that spans multiple bytes.
{
MUST(bit_write_stream.write_bits(0b1101001000100001u, 16));
MUST(bit_write_stream.flush_buffer_to_stream());
auto result = MUST(bit_read_stream.read_bits(16));
EXPECT_EQ(0b1101001000100001u, result);
}

View file

@ -1050,6 +1050,7 @@ ErrorOr<void> DeflateCompressor::final_flush()
VERIFY(!m_finished);
m_finished = true;
TRY(flush());
TRY(m_output_stream->flush_buffer_to_stream());
return {};
}