doxygen/Lz4Decompressor_8cpp_source.html

/*

 * Copyright (C) 2020 Niek Linnenbank

 *

 * This program is free software: you can redistribute it and/or modify

 * it under the terms of the GNU General Public License as published by

 * the Free Software Foundation, either version 3 of the License, or

 * (at your option) any later version.

 *

 * This program is distributed in the hope that it will be useful,

 * but WITHOUT ANY WARRANTY; without even the implied warranty of

 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

 * GNU General Public License for more details.

 *

 * You should have received a copy of the GNU General Public License

 * along with this program.  If not, see <http://www.gnu.org/licenses/>.

 */


#include <FreeNOS/User.h>

#include <Log.h>

#include <ByteOrder.h>

#include <MemoryBlock.h>

#include "Lz4Decompressor.h"


/**
 * Construct a decompressor over a caller-provided input buffer.
 *
 * Only the pointer and size are recorded here; nothing is read from the
 * input until initialize() is called. All header-derived fields start
 * out at their defaults.
 *
 * @param data Pointer to the compressed input data
 * @param size Size of the compressed input data in bytes
 */
Lz4Decompressor::Lz4Decompressor(const void *data, const Size size) :
    m_inputData(static_cast<const u8 *>(data)),
    m_inputSize(size),
    m_frameDescSize(3),         // same base value initialize() resets to
    m_blockChecksums(false),
    m_contentChecksum(false),
    m_contentSize(0),
    m_blockMaximumSize(0)
{
}


/**
 * Parse and validate the frame header of the input data.
 *
 * Checks the magic value and the version bits, rejects frames with
 * inter-dependent blocks or without a (non-zero) content size, and
 * records the checksum flags, content size, descriptor size and the
 * maximum block size for later use.
 *
 * @return Success when the header was accepted, InvalidArgument when
 *         the input is too small or a header field has an invalid
 *         value, NotSupported when the frame uses inter-dependent
 *         blocks or carries no non-zero content size.
 */
Lz4Decompressor::Result Lz4Decompressor::initialize()
{
    // Byte offsets of the header fields that follow the 32-bit magic
    const Size flgOffset = sizeof(u32);
    const Size bdOffset = flgOffset + sizeof(u8);
    const Size contentSizeOffset = flgOffset + (sizeof(u8) * 2);

    // Start from the base descriptor size; optional fields add to it below
    m_frameDescSize = 3;

    // Refuse input smaller than the minimum accepted size
    if (m_inputSize < 27)
    {
        ERROR("invalid size of input data: " << m_inputSize);
        return InvalidArgument;
    }

    // The input must begin with the LZ4 frame magic
    const u32 magic = readLe32(m_inputData);
    if (magic != FrameMagic)
    {
        ERROR("invalid magic value " << magic << " != " << FrameMagic);
        return InvalidArgument;
    }

    // FLG byte: version bits and the feature flags
    const u8 flg = m_inputData[flgOffset];

    // Only the supported frame version is accepted
    const u8 version = flg >> FrameVersionShift;
    if (version != FrameVersion)
    {
        ERROR("invalid version value " << version << " != " << FrameVersion);
        return InvalidArgument;
    }

    // Blocks that depend on earlier blocks cannot be decoded by this code
    if (((flg >> FrameBlockIndShift) & 0x1) == 0)
    {
        ERROR("inter-dependent blocks not supported");
        return NotSupported;
    }

    // Remember whether each block is followed by a checksum
    m_blockChecksums = ((flg >> FrameBlockChkShift) & 0x1) != 0;

    // Optional 64-bit content size, stored directly after the BD byte
    const bool hasContentSize = ((flg >> FrameContentSzShift) & 0x1) != 0;
    if (hasContentSize)
    {
        m_contentSize = readLe64(m_inputData + contentSizeOffset);
        m_frameDescSize += 8;
    }

    // A content size of zero (or an absent one) is rejected
    if (m_contentSize == 0)
    {
        ERROR("content size must not be zero");
        return NotSupported;
    }

    // Remember whether the frame carries a content checksum
    m_contentChecksum = ((flg >> FrameContentChkShift) & 0x1) != 0;

    // An optional dictionary identifier enlarges the descriptor by 4 bytes
    const bool hasDictId = ((flg >> FrameDictIdShift) & 0x1) != 0;
    if (hasDictId)
    {
        m_frameDescSize += 4;
    }

    // BD byte: its upper bits select the maximum block size
    const u8 bd = m_inputData[bdOffset];
    const int blockSizeCode = bd >> 4;

    if (blockSizeCode == 4)
    {
        m_blockMaximumSize = KiloByte(64);
    }
    else if (blockSizeCode == 5)
    {
        m_blockMaximumSize = KiloByte(256);
    }
    else if (blockSizeCode == 6)
    {
        m_blockMaximumSize = MegaByte(1);
    }
    else if (blockSizeCode == 7)
    {
        m_blockMaximumSize = MegaByte(4);
    }
    else
    {
        ERROR("invalid maximum block size value: " << blockSizeCode);
        return InvalidArgument;
    }

    return Success;
}


/**
 * Get the size of the uncompressed data.
 *
 * @return Content size in bytes as read from the frame header by
 *         initialize(), or zero when no content size was read.
 */
u64 Lz4Decompressor::getUncompressedSize() const
{
    return this->m_contentSize;
}


/**
 * Decode the data blocks of the frame into an output buffer.
 *
 * Blocks are processed in order, starting directly after the frame
 * header, until the output buffer is full, the input is exhausted or
 * the EndMark is found. Compressed blocks are passed to decompress(),
 * uncompressed blocks are copied as-is. At most size bytes are written
 * for uncompressed blocks; a block that does not fit completely is
 * truncated to the remaining output space.
 *
 * @param buffer Output buffer receiving the uncompressed data
 * @param size Size of the output buffer in bytes
 *
 * @return Success when decoding stopped normally, InvalidArgument when
 *         a block header or block payload extends beyond the input data.
 */
Lz4Decompressor::Result Lz4Decompressor::read(void *buffer,
                                              const Size size) const
{
    // Highest bit of the block size word marks an uncompressed block.
    // Built from an unsigned literal to avoid shifting into the sign bit.
    const u32 uncompressedFlag = 1u << 31;

    // Skip the magic value and the frame descriptor
    const u8 *input = m_inputData + m_frameDescSize + sizeof(u32);
    const u8 *inputEnd = m_inputData + m_inputSize;
    u8 *output = static_cast<u8 *>(buffer);
    Size copied = 0;

    while (copied < size && input < inputEnd)
    {
        // The block size word itself must lie inside the input
        if (static_cast<Size>(inputEnd - input) < sizeof(u32))
        {
            ERROR("truncated block header");
            return InvalidArgument;
        }

        // Fetch the next block
        const u32 blockSizeByte = readLe32(input);
        const u32 blockSize = blockSizeByte & ~uncompressedFlag;
        const bool isCompressed = (blockSizeByte & uncompressedFlag) == 0;
        Size uncompSize;

        // Last block has the EndMark as size value
        if (blockSize == EndMark)
        {
            break;
        }
        assert(blockSize <= m_blockMaximumSize);
        input += sizeof(u32);

        // The block payload must lie inside the input as well
        const Size inputLeft = static_cast<Size>(inputEnd - input);
        if (blockSize > inputLeft)
        {
            ERROR("block of " << blockSize << " bytes exceeds remaining input of " << inputLeft << " bytes");
            return InvalidArgument;
        }

        // Decompress the block
        if (isCompressed)
        {
            uncompSize = decompress(input, blockSize, output, size - copied);
        }
        // Return data as-is when the block is not compressed
        else
        {
            // Never write beyond the space left in the output buffer
            const Size outputLeft = size - copied;
            uncompSize = blockSize < outputLeft ? blockSize : outputLeft;
            MemoryBlock::copy(output, input, uncompSize);
        }

        // Move to the next block
        copied += uncompSize;
        output += uncompSize;
        input += blockSize;

        if (m_blockChecksums)
        {
            // A missing trailing checksum ends the input; stop here
            // instead of advancing the pointer beyond the buffer.
            if (static_cast<Size>(inputEnd - input) < sizeof(u32))
            {
                break;
            }
            input += sizeof(u32);
        }
    }

    return Success;
}


/**
 * Decode a variable-length length value.
 *
 * A 4-bit initial value below 0xf is the final value. Otherwise extra
 * bytes are read from next and added to the value, until a byte lower
 * than 0xff has been consumed.
 *
 * @param initial Initial 4-bit value taken from the token
 * @param next Pointer to the first possible extra length byte
 * @param byteCount On output, the number of extra bytes consumed from
 *                  next. Set to zero when no extra bytes were needed.
 *
 * @return The decoded value
 *
 * @note The number of bytes read from next is not bounded by this
 *       function; the caller is responsible for the input limits.
 */
inline const u32 Lz4Decompressor::integerDecode(const u32 initial,
                                                const u8 *next,
                                                Size &byteCount) const
{
    u32 value = initial;

    // Short form: the value fits in the token nibble, nothing is consumed.
    // Assign the out-parameter explicitly so the result does not depend
    // on the caller having zeroed it beforehand.
    if (initial < 0xf)
    {
        byteCount = 0;
        return initial;
    }

    // Long form: accumulate bytes until one is lower than 0xff
    for (byteCount = 1; ; byteCount++)
    {
        const u8 byte = *next++;
        value += byte;

        if (byte < 0xff)
        {
            break;
        }
    }

    return value;
}


/**
 * Decompress a single block of compressed data.
 *
 * The block is a series of sequences. Each sequence starts with a token
 * byte, followed by an optional extended literal length, the literals,
 * a 16-bit little-endian match offset and an optional extended match
 * length. Literals are copied from the input, matches are copied from
 * output that was already produced for this block.
 *
 * Writes are limited to outputSize bytes: a literal run or match that
 * does not fit completely is truncated and decoding stops. Decoding
 * also stops, after logging an error, when the literals or the match
 * offset would be read from beyond the end of the block.
 *
 * @param input Pointer to the compressed block data
 * @param inputSize Size of the compressed block in bytes
 * @param output Buffer receiving the uncompressed data
 * @param outputSize Number of bytes available in the output buffer
 *
 * @return Number of bytes written to the output buffer
 */
const u32 Lz4Decompressor::decompress(const u8 *input,
                                      const Size inputSize,
                                      u8 *output,
                                      const Size outputSize) const
{
    const u8 *inputEnd = input + inputSize;
    Size outputOffset = 0;

    // Decompress the whole block
    while (input < inputEnd && outputOffset < outputSize)
    {
        u32 literalBytes = 0;
        u32 matchBytes = 0;

        // Read the token
        const u8 token = *input;
        input++;

        // Read literals count
        const u32 literalsCount = integerDecode(token >> 4, input, literalBytes);
        if (literalBytes > static_cast<Size>(inputEnd - input))
        {
            ERROR("literal length runs past the end of the block");
            break;
        }
        input += literalBytes;
        DEBUG("token = " << token << " literalsCount = " << literalsCount << " literalBytes = " << literalBytes);

        // Copy literals
        if (literalsCount > 0)
        {
            const Size inputLeft = static_cast<Size>(inputEnd - input);
            const Size outputLeft = outputSize - outputOffset;

            // Literals must be fully contained in the block
            if (literalsCount > inputLeft)
            {
                ERROR("literals run past the end of the block");
                break;
            }

            // Never write beyond the space left in the output buffer
            const Size literalsToCopy = literalsCount < outputLeft ? literalsCount : outputLeft;
            MemoryBlock::copy(output + outputOffset, input, literalsToCopy);
            input += literalsCount;
            outputOffset += literalsToCopy;

            // Output buffer is full: nothing more can be stored
            if (literalsToCopy < literalsCount)
            {
                break;
            }
        }

        // End of block reached? Last 5 bytes are only literals
        if (input >= inputEnd)
        {
            break;
        }

        // Read match offset
        if (static_cast<Size>(inputEnd - input) < sizeof(u16))
        {
            ERROR("truncated match offset");
            break;
        }
        const u16 off = readLe16(input);
        assert(off <= outputOffset);
        const u32 matchOffset = outputOffset - off;
        input += sizeof(u16);

        // Read match length, stored with a bias of 4
        const u32 matchCount = integerDecode(token & 0xf, input, matchBytes) + 4u;
        input += matchBytes;

        // Copy the match from previous decoded bytes, limited to the
        // space left in the output buffer.
        // NOTE(review): source and destination overlap when the offset is
        // smaller than the match length; this relies on MemoryBlock::copy
        // copying forward byte by byte - confirm against its implementation.
        DEBUG("matchOffset = " << matchOffset << " matchCount = " << matchCount);
        const Size matchSpace = outputSize - outputOffset;
        const Size matchToCopy = matchCount < matchSpace ? matchCount : matchSpace;
        MemoryBlock::copy(output + outputOffset, output + matchOffset, matchToCopy);
        outputOffset += matchToCopy;
    }

    assert(outputOffset <= m_blockMaximumSize);
    return outputOffset;
}


ByteOrder.h

Log.h

Lz4Decompressor.h

MemoryBlock.h

Lz4Decompressor::initialize
Result initialize()
Initialize the decompressor.
Definition Lz4Decompressor.cpp:35

Lz4Decompressor::m_contentSize
u64 m_contentSize
Content size as specified in the frame header.
Definition Lz4Decompressor.h:160

Lz4Decompressor::m_inputSize
const Size m_inputSize
Total size in bytes of the compressed input data.
Definition Lz4Decompressor.h:148

Lz4Decompressor::integerDecode
const u32 integerDecode(const u32 initial, const u8 *next, Size &byteCount) const
Decode input data as integer (little-endian, 32-bit unsigned)
Definition Lz4Decompressor.cpp:179

Lz4Decompressor::m_blockMaximumSize
Size m_blockMaximumSize
Maximum block size in bytes of the uncompressed content.
Definition Lz4Decompressor.h:163

Lz4Decompressor::getUncompressedSize
u64 getUncompressedSize() const
Get size of the uncompressed data.
Definition Lz4Decompressor.cpp:125

Lz4Decompressor::m_inputData
const u8 * m_inputData
Compressed input data.
Definition Lz4Decompressor.h:145

Lz4Decompressor::m_frameDescSize
Size m_frameDescSize
Size of the frame descriptor in bytes.
Definition Lz4Decompressor.h:151

Lz4Decompressor::m_blockChecksums
bool m_blockChecksums
True if blocks have checksums enabled.
Definition Lz4Decompressor.h:154

Lz4Decompressor::EndMark
static const u32 EndMark
EndMark marks the end of the data stream.
Definition Lz4Decompressor.h:63

Lz4Decompressor::m_contentChecksum
bool m_contentChecksum
True if the input data buffer contains content checksum.
Definition Lz4Decompressor.h:157

Lz4Decompressor::Lz4Decompressor
Lz4Decompressor(const void *data, const Size size)
Constructor function.
Definition Lz4Decompressor.cpp:24

Lz4Decompressor::FrameVersionShift
@ FrameVersionShift
Definition Lz4Decompressor.h:56

Lz4Decompressor::FrameContentSzShift
@ FrameContentSzShift
Definition Lz4Decompressor.h:53

Lz4Decompressor::FrameBlockIndShift
@ FrameBlockIndShift
Definition Lz4Decompressor.h:55

Lz4Decompressor::FrameDictIdShift
@ FrameDictIdShift
Definition Lz4Decompressor.h:51

Lz4Decompressor::FrameContentChkShift
@ FrameContentChkShift
Definition Lz4Decompressor.h:52

Lz4Decompressor::FrameBlockChkShift
@ FrameBlockChkShift
Definition Lz4Decompressor.h:54

Lz4Decompressor::decompress
const u32 decompress(const u8 *input, const Size inputSize, u8 *output, const Size outputSize) const
Decompress a block of compressed data.
Definition Lz4Decompressor.cpp:204

Lz4Decompressor::Result
Result
Result codes.
Definition Lz4Decompressor.h:71

Lz4Decompressor::Success
@ Success
Definition Lz4Decompressor.h:72

Lz4Decompressor::InvalidArgument
@ InvalidArgument
Definition Lz4Decompressor.h:74

Lz4Decompressor::NotSupported
@ NotSupported
Definition Lz4Decompressor.h:75

Lz4Decompressor::FrameMagic
static const u32 FrameMagic
Magic number value marks the start of the frame header.
Definition Lz4Decompressor.h:44

Lz4Decompressor::read
Result read(void *buffer, const Size size) const
Reads compressed data.
Definition Lz4Decompressor.cpp:130

Lz4Decompressor::FrameVersion
static const u8 FrameVersion
Current supported version of the LZ4 algorithm.
Definition Lz4Decompressor.h:60

MemoryBlock::copy
static Size copy(void *dest, const void *src, Size count)
Copy memory from one place to another.
Definition MemoryBlock.cpp:41

assert
#define assert(exp)
Insert program diagnostics.
Definition assert.h:60

u32
unsigned int u32
Unsigned 32-bit number.
Definition Types.h:53

MegaByte
#define MegaByte(v)
Convert megabytes to bytes.
Definition Macros.h:57

ERROR
#define ERROR(msg)
Output an error message.
Definition Log.h:61

readLe16
const u16 readLe16(const void *data)
Read 16-bit little endian integer.
Definition ByteOrder.h:356

readLe64
const u64 readLe64(const void *data)
Read 64-bit little endian integer.
Definition ByteOrder.h:328

u16
unsigned short u16
Unsigned 16-bit number.
Definition Types.h:56

KiloByte
#define KiloByte(v)
Convert kilobytes to bytes.
Definition Macros.h:54

Size
unsigned int Size
Any sane size indicator cannot go negative.
Definition Types.h:128

u64
unsigned long long u64
Unsigned 64-bit number.
Definition Types.h:50

readLe32
const u32 readLe32(const void *data)
Read 32-bit little endian integer.
Definition ByteOrder.h:342

DEBUG
#define DEBUG(msg)
Output a debug message to standard output.
Definition Log.h:89

u8
unsigned char u8
Unsigned 8-bit number.
Definition Types.h:59