Skip to content

Commit

Permalink
log
Browse files Browse the repository at this point in the history
Signed-off-by: Lloyd-Pottiger <yan1579196623@gmail.com>
  • Loading branch information
Lloyd-Pottiger committed May 17, 2024
1 parent f0269b0 commit 2c92c81
Show file tree
Hide file tree
Showing 3 changed files with 47 additions and 5 deletions.
29 changes: 25 additions & 4 deletions dbms/src/IO/Compression/CompressionCodecIntegerLightweight.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -52,6 +52,12 @@ UInt32 CompressionCodecIntegerLightweight::getMaxCompressedDataSize(UInt32 uncom
return 1 + 1 + LZ4_COMPRESSBOUND(uncompressed_size);
}

CompressionCodecIntegerLightweight::~CompressionCodecIntegerLightweight()
{
if (ctx.isCompression())
LOG_INFO(Logger::get(), "lightweight codec: {}", ctx.toDebugString());
}

template <typename T>
size_t CompressionCodecIntegerLightweight::compressDataForType(const char * source, UInt32 source_size, char * dest)
const
Expand Down Expand Up @@ -166,6 +172,18 @@ void CompressionCodecIntegerLightweight::decompressDataForType(
}
}

String CompressionCodecIntegerLightweight::CompressContext::toDebugString() const
{
return fmt::format(
"lz4: {} times, {} -> {}, lightweight: {} times, {} -> {}",
lz4_counter,
lz4_uncompressed_size,
lz4_compressed_size,
lw_counter,
lw_uncompressed_size,
lw_compressed_size);
}

void CompressionCodecIntegerLightweight::CompressContext::update(size_t uncompressed_size, size_t compressed_size)
{
if (mode == Mode::LZ4)
Expand Down Expand Up @@ -219,7 +237,10 @@ void CompressionCodecIntegerLightweight::CompressContext::analyze(std::span<cons
}

if (!needAnalyze())
{
RUNTIME_CHECK(mode == Mode::LZ4);
return;
}

// Check CONSTANT
T min_value = *std::min_element(values.begin(), values.end());
Expand Down Expand Up @@ -261,7 +282,7 @@ void CompressionCodecIntegerLightweight::CompressContext::analyze(std::span<cons
}

// RLE
std::vector<std::pair<T, UInt8>> rle;
Compression::RLEPairs<T> rle;
if (needAnalyzeRLE())
{
rle.reserve(values.size());
Expand All @@ -281,8 +302,8 @@ void CompressionCodecIntegerLightweight::CompressContext::analyze(std::span<cons
// Assume that the compression ratio of LZ4 is 3.0
// The official document says that the compression ratio of LZ4 is 2.1, https://github.com/lz4/lz4
size_t estimate_lz_size = values.size() * sizeof(T) / 3;
size_t rle_size = Compression::RLEPairsSize(rle);
if (rle_size < delta_for_size && rle_size < for_size && rle_size < estimate_lz_size)
size_t rle_size = rle.empty() ? std::numeric_limits<size_t>::max() : Compression::RLEPairsSize(rle);
if (needAnalyzeRLE() && rle_size < delta_for_size && rle_size < for_size && rle_size < estimate_lz_size)
{
state = std::move(rle);
mode = Mode::RLE;
Expand All @@ -293,7 +314,7 @@ void CompressionCodecIntegerLightweight::CompressContext::analyze(std::span<cons
state = FORState<T>{std::move(values_copy), min_value, for_width};
mode = Mode::FOR;
}
else if (delta_for_size < estimate_lz_size)
else if (needAnalyzeDelta() && delta_for_size < estimate_lz_size)
{
state = DeltaFORState<T>{std::move(deltas), min_delta, delta_for_width};
mode = Mode::DELTA_FOR;
Expand Down
5 changes: 5 additions & 0 deletions dbms/src/IO/Compression/CompressionCodecIntegerLightweight.h
Original file line number Diff line number Diff line change
Expand Up @@ -29,6 +29,8 @@ class CompressionCodecIntegerLightweight : public ICompressionCodec

UInt8 getMethodByte() const override;

~CompressionCodecIntegerLightweight() override;

protected:
UInt32 doCompressData(const char * source, UInt32 source_size, char * dest) const override;
void doDecompressData(const char * source, UInt32 source_size, char * dest, UInt32 uncompressed_size)
Expand Down Expand Up @@ -93,6 +95,9 @@ class CompressionCodecIntegerLightweight : public ICompressionCodec

void update(size_t uncompressed_size, size_t compressed_size);

String toDebugString() const;
bool isCompression() const { return lz4_counter > 0 || lw_counter > 0; }

Mode mode = Mode::LZ4;

private:
Expand Down
18 changes: 17 additions & 1 deletion dbms/src/Storages/DeltaMerge/File/DMFileWriter.h
Original file line number Diff line number Diff line change
Expand Up @@ -65,9 +65,25 @@ class DMFileWriter
/*flags*/ -1,
/*mode*/ 0666,
max_compress_block_size))
, compressed_buf(CompressedWriteBuffer<>::build(*plain_file, compression_settings, !dmfile->configuration))
, minmaxes(do_index ? std::make_shared<MinMaxIndex>(*type) : nullptr)
{
// TODO: better, now only for test
if (type->isInteger())
{
assert(compression_settings.settings.size() == 1);
CompressionSettings settings(CompressionMethod::Lightweight);
auto & setting = settings.settings[0];
setting.type_bytes_size = type->getSizeOfValueInMemory();
compressed_buf = CompressedWriteBuffer<>::build(*plain_file, settings, !dmfile->configuration);
}
else
{
compressed_buf = CompressedWriteBuffer<>::build( //
*plain_file,
compression_settings,
!dmfile->configuration);
}

if (!dmfile->useMetaV2())
{
mark_file = ChecksumWriteBufferBuilder::
Expand Down

0 comments on commit 2c92c81

Please sign in to comment.