/* * Copyright (c) 2021, Matthew Olsson * * SPDX-License-Identifier: BSD-2-Clause */ #include #include #include #include #include namespace PDF { ErrorOr Filter::decode(ReadonlyBytes bytes, DeprecatedFlyString const& encoding_type, RefPtr decode_parms) { int predictor = 1; int columns = 1; int colors = 1; int bits_per_component = 8; if (decode_parms) { if (decode_parms->contains(CommonNames::Predictor)) predictor = decode_parms->get_value(CommonNames::Predictor).get(); if (decode_parms->contains(CommonNames::Columns)) columns = decode_parms->get_value(CommonNames::Columns).get(); if (decode_parms->contains(CommonNames::Colors)) colors = decode_parms->get_value(CommonNames::Colors).get(); if (decode_parms->contains(CommonNames::BitsPerComponent)) bits_per_component = decode_parms->get_value(CommonNames::BitsPerComponent).get(); } if (encoding_type == CommonNames::ASCIIHexDecode) return decode_ascii_hex(bytes); if (encoding_type == CommonNames::ASCII85Decode) return decode_ascii85(bytes); if (encoding_type == CommonNames::LZWDecode) return decode_lzw(bytes); if (encoding_type == CommonNames::FlateDecode) return decode_flate(bytes, predictor, columns, colors, bits_per_component); if (encoding_type == CommonNames::RunLengthDecode) return decode_run_length(bytes); if (encoding_type == CommonNames::CCITTFaxDecode) return decode_ccitt(bytes); if (encoding_type == CommonNames::JBIG2Decode) return decode_jbig2(bytes); if (encoding_type == CommonNames::DCTDecode) return decode_dct(bytes); if (encoding_type == CommonNames::JPXDecode) return decode_jpx(bytes); if (encoding_type == CommonNames::Crypt) return decode_crypt(bytes); return AK::Error::from_string_literal("Unrecognized filter encoding"); } ErrorOr Filter::decode_ascii_hex(ReadonlyBytes bytes) { if (bytes.size() % 2 == 0) return decode_hex(bytes); // FIXME: Integrate this padding into AK/Hex? auto output = TRY(ByteBuffer::create_zeroed(bytes.size() / 2 + 1)); for (size_t i = 0; i < bytes.size() / 2; ++i) { auto const c1 = decode_hex_digit(static_cast(bytes[i * 2])); if (c1 >= 16) return AK::Error::from_string_literal("Hex string contains invalid digit"); auto const c2 = decode_hex_digit(static_cast(bytes[i * 2 + 1])); if (c2 >= 16) return AK::Error::from_string_literal("Hex string contains invalid digit"); output[i] = (c1 << 4) + c2; } // Process last byte with a padded zero output[output.size() - 1] = decode_hex_digit(static_cast(bytes[bytes.size() - 1])) * 16; return { move(output) }; }; ErrorOr Filter::decode_ascii85(ReadonlyBytes bytes) { Vector buff; buff.ensure_capacity(bytes.size()); size_t byte_index = 0; while (byte_index < bytes.size()) { if (bytes[byte_index] == ' ') { byte_index++; continue; } if (bytes[byte_index] == 'z') { byte_index++; for (int i = 0; i < 4; i++) buff.append(0); continue; } u32 number = 0; if (byte_index + 5 >= bytes.size()) { auto to_write = bytes.size() - byte_index; for (int i = 0; i < 5; i++) { auto byte = byte_index >= bytes.size() ? 'u' : bytes[byte_index++]; if (byte == ' ') { i--; continue; } number = number * 85 + byte - 33; } for (size_t i = 0; i < to_write - 1; i++) buff.append(reinterpret_cast(&number)[3 - i]); break; } else { for (int i = 0; i < 5; i++) { auto byte = bytes[byte_index++]; if (byte == ' ') { i--; continue; } number = number * 85 + byte - 33; } } for (int i = 0; i < 4; i++) buff.append(reinterpret_cast(&number)[3 - i]); } return ByteBuffer::copy(buff.span()); }; ErrorOr Filter::decode_png_prediction(Bytes bytes, int bytes_per_row) { int number_of_rows = bytes.size() / bytes_per_row; ByteBuffer decoded; decoded.ensure_capacity(bytes.size() - number_of_rows); auto empty_row = TRY(ByteBuffer::create_zeroed(bytes_per_row)); auto previous_row = empty_row.data(); for (int row_index = 0; row_index < number_of_rows; ++row_index) { auto row = bytes.data() + row_index * bytes_per_row; u8 algorithm_tag = row[0]; switch (algorithm_tag) { case 0: break; case 1: for (int i = 2; i < bytes_per_row; ++i) row[i] += row[i - 1]; break; case 2: for (int i = 1; i < bytes_per_row; ++i) row[i] += previous_row[i]; break; case 3: for (int i = 1; i < bytes_per_row; ++i) { u8 left = 0; if (i > 1) left = row[i - 1]; u8 above = previous_row[i]; row[i] += (left + above) / 2; } break; case 4: for (int i = 1; i < bytes_per_row; ++i) { u8 left = 0; u8 upper_left = 0; if (i > 1) { left = row[i - 1]; upper_left = previous_row[i - 1]; } u8 above = previous_row[i]; u8 p = left + above - upper_left; int left_distance = abs(p - left); int above_distance = abs(p - above); int upper_left_distance = abs(p - upper_left); u8 paeth = min(left_distance, min(above_distance, upper_left_distance)); row[i] += paeth; } break; default: return AK::Error::from_string_literal("Unknown PNG algorithm tag"); } previous_row = row; decoded.append(row + 1, bytes_per_row - 1); } return decoded; } ErrorOr Filter::decode_lzw(ReadonlyBytes) { dbgln("LZW decoding is not supported"); VERIFY_NOT_REACHED(); }; ErrorOr Filter::decode_flate(ReadonlyBytes bytes, int predictor, int columns, int colors, int bits_per_component) { auto buff = Compress::DeflateDecompressor::decompress_all(bytes.slice(2)).value(); if (predictor == 1) return buff; // Check if we are dealing with a PNG prediction if (predictor == 2) return AK::Error::from_string_literal("The TIFF predictor is not supported"); if (predictor < 10 || predictor > 15) return AK::Error::from_string_literal("Invalid predictor value"); // Rows are always a whole number of bytes long, starting with an algorithm tag int bytes_per_row = AK::ceil_div(columns * colors * bits_per_component, 8) + 1; if (buff.size() % bytes_per_row) return AK::Error::from_string_literal("Flate input data is not divisible into columns"); return decode_png_prediction(buff, bytes_per_row); }; ErrorOr Filter::decode_run_length(ReadonlyBytes bytes) { constexpr size_t END_OF_DECODING = 128; ByteBuffer buffer {}; while (true) { VERIFY(bytes.size() > 0); auto length = bytes[0]; bytes = bytes.slice(1); if (length == END_OF_DECODING) { VERIFY(bytes.is_empty()); break; } if (length < 128) { TRY(buffer.try_append(bytes.slice(0, length + 1))); bytes = bytes.slice(length + 1); } else { VERIFY(bytes.size() > 1); auto byte_to_append = bytes[0]; bytes = bytes.slice(1); size_t n_chars = 257 - length; for (size_t i = 0; i < n_chars; ++i) { TRY(buffer.try_append(byte_to_append)); } } } return buffer; }; ErrorOr Filter::decode_ccitt(ReadonlyBytes) { // FIXME: Support CCITT decoding TODO(); }; ErrorOr Filter::decode_jbig2(ReadonlyBytes) { // FIXME: Support JBIG2 decoding TODO(); }; ErrorOr Filter::decode_dct(ReadonlyBytes bytes) { if (Gfx::JPGImageDecoderPlugin::sniff({ bytes.data(), bytes.size() }).release_value_but_fixme_should_propagate_errors()) { auto decoder = Gfx::JPGImageDecoderPlugin::create({ bytes.data(), bytes.size() }).release_value_but_fixme_should_propagate_errors(); if (decoder->initialize()) { auto frame = TRY(decoder->frame(0)); return frame.image->serialize_to_byte_buffer(); } } return AK::Error::from_string_literal("Not a JPG image!"); }; ErrorOr Filter::decode_jpx(ReadonlyBytes) { // FIXME: Support JPX decoding TODO(); }; ErrorOr Filter::decode_crypt(ReadonlyBytes) { // FIXME: Support Crypt decoding TODO(); }; }