summary | refs | log | tree | commit | diff
path: root/Userland/Libraries/LibCompress
diff options
context:
space:
mode:
author Tim Schumacher <timschumi@gmx.de> 2023-05-13 17:55:31 +0200
committer Andreas Kling <kling@serenityos.org> 2023-05-17 09:08:53 +0200
commit df071d8a76fd254c0b03424c3279a90433c6586d (patch)
tree 4cca7bd91faac4a25eb86e672d0bed87702da029 /Userland/Libraries/LibCompress
parent e8067ac2ee2e08c3c8d19e386003be175492cec7 (diff)
download serenity-df071d8a76fd254c0b03424c3279a90433c6586d.zip
LibCompress: Add a lot of debug logging to LZMA
Diffstat (limited to 'Userland/Libraries/LibCompress')
-rw-r--r-- Userland/Libraries/LibCompress/Lzma.cpp 58
1 files changed, 53 insertions, 5 deletions
diff --git a/Userland/Libraries/LibCompress/Lzma.cpp b/Userland/Libraries/LibCompress/Lzma.cpp
index 73e2a64ce5..f5b8751f98 100644
--- a/Userland/Libraries/LibCompress/Lzma.cpp
+++ b/Userland/Libraries/LibCompress/Lzma.cpp
@@ -322,6 +322,8 @@ ErrorOr<u8> LzmaDecompressor::decode_bit_with_probability(Probability& probabili
u32 bound = (m_range_decoder_range >> probability_bit_count) * probability;
+ dbgln_if(LZMA_DEBUG, "Decoding bit {} with probability = {:#x}, bound = {:#x}, code = {:#x}, range = {:#x}", m_range_decoder_code < bound ? 0 : 1, probability, bound, m_range_decoder_code, m_range_decoder_range);
+
if (m_range_decoder_code < bound) {
probability += ((1 << probability_bit_count) - probability) >> probability_shift_width;
m_range_decoder_range = bound;
@@ -342,6 +344,8 @@ ErrorOr<void> LzmaCompressor::encode_bit_with_probability(Probability& probabili
u32 bound = (m_range_encoder_range >> probability_bit_count) * probability;
+ dbgln_if(LZMA_DEBUG, "Encoding bit {} with probability = {:#x}, bound = {:#x}, code = {:#x}, range = {:#x}", value, probability, bound, m_range_encoder_code, m_range_encoder_range);
+
if (value == 0) {
probability += ((1 << probability_bit_count) - probability) >> probability_shift_width;
m_range_encoder_range = bound;
@@ -372,6 +376,8 @@ ErrorOr<u16> LzmaDecompressor::decode_symbol_using_bit_tree(size_t bit_count, Sp
tree_index = (tree_index << 1) | next_bit;
}
+ dbgln_if(LZMA_DEBUG, "Decoded value {:#x} with {} bits using bit tree", result, bit_count);
+
return result;
}
@@ -381,6 +387,8 @@ ErrorOr<void> LzmaCompressor::encode_symbol_using_bit_tree(size_t bit_count, Spa
VERIFY(probability_tree.size() >= 1ul << bit_count);
VERIFY(value <= (1 << bit_count) - 1);
+ auto original_value = value;
+
// Shift value to make the first sent byte the most significant bit. This makes the shifting logic a lot easier to read.
value <<= sizeof(u16) * 8 - bit_count;
@@ -393,6 +401,8 @@ ErrorOr<void> LzmaCompressor::encode_symbol_using_bit_tree(size_t bit_count, Spa
tree_index = (tree_index << 1) | next_bit;
}
+ dbgln_if(LZMA_DEBUG, "Encoded value {:#x} with {} bits using bit tree", original_value, bit_count);
+
return {};
}
@@ -410,6 +420,8 @@ ErrorOr<u16> LzmaDecompressor::decode_symbol_using_reverse_bit_tree(size_t bit_c
tree_index = (tree_index << 1) | next_bit;
}
+ dbgln_if(LZMA_DEBUG, "Decoded value {:#x} with {} bits using reverse bit tree", result, bit_count);
+
return result;
}
@@ -419,6 +431,8 @@ ErrorOr<void> LzmaCompressor::encode_symbol_using_reverse_bit_tree(size_t bit_co
VERIFY(probability_tree.size() >= 1ul << bit_count);
VERIFY(value <= (1 << bit_count) - 1);
+ auto original_value = value;
+
size_t tree_index = 1;
for (size_t i = 0; i < bit_count; i++) {
@@ -428,6 +442,8 @@ ErrorOr<void> LzmaCompressor::encode_symbol_using_reverse_bit_tree(size_t bit_co
tree_index = (tree_index << 1) | next_bit;
}
+ dbgln_if(LZMA_DEBUG, "Encoded value {:#x} with {} bits using reverse bit tree", original_value, bit_count);
+
return {};
}
@@ -463,6 +479,8 @@ ErrorOr<void> LzmaDecompressor::decode_literal_to_output_buffer()
auto read_bytes = TRY(m_dictionary->read_with_seekback({ &matched_byte, sizeof(matched_byte) }, current_repetition_offset()));
VERIFY(read_bytes.size() == sizeof(matched_byte));
+ dbgln_if(LZMA_DEBUG, "Decoding literal using match byte {:#x}", matched_byte);
+
do {
u8 match_bit = (matched_byte >> 7) & 1;
matched_byte <<= 1;
@@ -484,6 +502,8 @@ ErrorOr<void> LzmaDecompressor::decode_literal_to_output_buffer()
VERIFY(written_bytes == sizeof(actual_result));
m_total_processed_bytes += sizeof(actual_result);
+ dbgln_if(LZMA_DEBUG, "Decoded literal {:#x} in state {} using literal state {:#x} (previous byte is {:#x})", actual_result, m_state, literal_state, previous_byte);
+
return {};
}
@@ -505,6 +525,7 @@ ErrorOr<void> LzmaCompressor::encode_literal(u8 literal)
Span<Probability> selected_probability_table = m_literal_probabilities.span().slice(literal_probability_table_size * literal_state, literal_probability_table_size);
+ auto original_literal = literal;
u16 result = 1;
if (m_state >= 7) {
@@ -512,6 +533,8 @@ ErrorOr<void> LzmaCompressor::encode_literal(u8 literal)
auto read_bytes = TRY(m_dictionary->read_with_seekback({ &matched_byte, sizeof(matched_byte) }, current_repetition_offset() + m_dictionary->used_space() + 1));
VERIFY(read_bytes.size() == sizeof(matched_byte));
+ dbgln_if(LZMA_DEBUG, "Encoding literal using match byte {:#x}", matched_byte);
+
do {
u8 const match_bit = (matched_byte >> 7) & 1;
matched_byte <<= 1;
@@ -538,6 +561,8 @@ ErrorOr<void> LzmaCompressor::encode_literal(u8 literal)
m_total_processed_bytes += sizeof(literal);
+ dbgln_if(LZMA_DEBUG, "Encoded literal {:#x} in state {} using literal state {:#x} (previous byte is {:#x})", original_literal, m_state, literal_state, previous_byte);
+
update_state_after_literal();
return {};
@@ -851,14 +876,18 @@ ErrorOr<LzmaDecompressor::MatchType> LzmaDecompressor::decode_match_type()
//
// IsMatch[state2] decode
// 0 - the Literal"
- if (TRY(decode_bit_with_probability(m_is_match_probabilities[state2])) == 0)
+ if (TRY(decode_bit_with_probability(m_is_match_probabilities[state2])) == 0) {
+ dbgln_if(LZMA_DEBUG, "Decoded match type 'Literal'");
return MatchType::Literal;
+ }
// " 1 - the Match
// IsRep[state] decode
// 0 - Simple Match"
- if (TRY(decode_bit_with_probability(m_is_rep_probabilities[m_state])) == 0)
+ if (TRY(decode_bit_with_probability(m_is_rep_probabilities[m_state])) == 0) {
+ dbgln_if(LZMA_DEBUG, "Decoded match type 'SimpleMatch'");
return MatchType::SimpleMatch;
+ }
// " 1 - Rep Match
// IsRepG0[state] decode
@@ -866,26 +895,34 @@ ErrorOr<LzmaDecompressor::MatchType> LzmaDecompressor::decode_match_type()
if (TRY(decode_bit_with_probability(m_is_rep_g0_probabilities[m_state])) == 0) {
// " IsRep0Long[state2] decode
// 0 - Short Rep Match"
- if (TRY(decode_bit_with_probability(m_is_rep0_long_probabilities[state2])) == 0)
+ if (TRY(decode_bit_with_probability(m_is_rep0_long_probabilities[state2])) == 0) {
+ dbgln_if(LZMA_DEBUG, "Decoded match type 'ShortRepMatch'");
return MatchType::ShortRepMatch;
+ }
// " 1 - Rep Match 0"
+ dbgln_if(LZMA_DEBUG, "Decoded match type 'RepMatch0'");
return MatchType::RepMatch0;
}
// " 1 -
// IsRepG1[state] decode
// 0 - Rep Match 1"
- if (TRY(decode_bit_with_probability(m_is_rep_g1_probabilities[m_state])) == 0)
+ if (TRY(decode_bit_with_probability(m_is_rep_g1_probabilities[m_state])) == 0) {
+ dbgln_if(LZMA_DEBUG, "Decoded match type 'RepMatch1'");
return MatchType::RepMatch1;
+ }
// " 1 -
// IsRepG2[state] decode
// 0 - Rep Match 2"
- if (TRY(decode_bit_with_probability(m_is_rep_g2_probabilities[m_state])) == 0)
+ if (TRY(decode_bit_with_probability(m_is_rep_g2_probabilities[m_state])) == 0) {
+ dbgln_if(LZMA_DEBUG, "Decoded match type 'RepMatch2'");
return MatchType::RepMatch2;
+ }
// " 1 - Rep Match 3"
+ dbgln_if(LZMA_DEBUG, "Decoded match type 'RepMatch3'");
return MatchType::RepMatch3;
}
@@ -896,12 +933,14 @@ ErrorOr<void> LzmaCompressor::encode_match_type(MatchType match_type)
if (match_type == MatchType::Literal) {
TRY(encode_bit_with_probability(m_is_match_probabilities[state2], 0));
+ dbgln_if(LZMA_DEBUG, "Encoded match type 'Literal'");
return {};
}
TRY(encode_bit_with_probability(m_is_match_probabilities[state2], 1));
if (match_type == MatchType::SimpleMatch) {
TRY(encode_bit_with_probability(m_is_rep_probabilities[m_state], 0));
+ dbgln_if(LZMA_DEBUG, "Encoded match type 'SimpleMatch'");
return {};
}
TRY(encode_bit_with_probability(m_is_rep_probabilities[m_state], 1));
@@ -909,21 +948,30 @@ ErrorOr<void> LzmaCompressor::encode_match_type(MatchType match_type)
if (match_type == MatchType::ShortRepMatch || match_type == MatchType::RepMatch0) {
TRY(encode_bit_with_probability(m_is_rep_g0_probabilities[m_state], 0));
TRY(encode_bit_with_probability(m_is_rep0_long_probabilities[state2], match_type == MatchType::RepMatch0));
+ if constexpr (LZMA_DEBUG) {
+ if (match_type == RepMatch0)
+ dbgln("Encoded match type 'RepMatch0'");
+ else
+ dbgln("Encoded match type 'ShortRepMatch'");
+ }
return {};
}
TRY(encode_bit_with_probability(m_is_rep_g0_probabilities[m_state], 1));
if (match_type == MatchType::RepMatch1) {
TRY(encode_bit_with_probability(m_is_rep_g1_probabilities[m_state], 0));
+ dbgln_if(LZMA_DEBUG, "Encoded match type 'RepMatch1'");
return {};
}
TRY(encode_bit_with_probability(m_is_rep_g1_probabilities[m_state], 1));
if (match_type == MatchType::RepMatch2) {
TRY(encode_bit_with_probability(m_is_rep_g2_probabilities[m_state], 0));
+ dbgln_if(LZMA_DEBUG, "Encoded match type 'RepMatch2'");
return {};
}
TRY(encode_bit_with_probability(m_is_rep_g2_probabilities[m_state], 1));
+ dbgln_if(LZMA_DEBUG, "Encoded match type 'RepMatch3'");
return {};
}