// Copyright (c) the JPEG XL Project Authors. All rights reserved. // // Use of this source code is governed by a BSD-style // license that can be found in the LICENSE file. #include "lib/jxl/jpeg/enc_jpeg_data.h" #include #include #include "lib/jxl/jpeg/enc_jpeg_data_reader.h" #include "lib/jxl/sanitizers.h" namespace jxl { namespace jpeg { namespace { constexpr int BITS_IN_JSAMPLE = 8; using ByteSpan = Span; // TODO(eustas): move to jpeg_data, to use from codec_jpg as well. // See if there is a canonically chunked ICC profile and mark corresponding // app-tags with AppMarkerType::kICC. Status DetectIccProfile(JPEGData& jpeg_data) { JXL_DASSERT(jpeg_data.app_data.size() == jpeg_data.app_marker_type.size()); size_t num_icc = 0; size_t num_icc_jpeg = 0; for (size_t i = 0; i < jpeg_data.app_data.size(); i++) { const auto& app = jpeg_data.app_data[i]; size_t pos = 0; if (app[pos++] != 0xE2) continue; // At least APPn + size; otherwise it should be intermarker-data. JXL_DASSERT(app.size() >= 3); size_t tag_length = (app[pos] << 8) + app[pos + 1]; pos += 2; JXL_DASSERT(app.size() == tag_length + 1); // Empty payload is 2 bytes for tag length itself + signature if (tag_length < 2 + sizeof kIccProfileTag) continue; if (memcmp(&app[pos], kIccProfileTag, sizeof kIccProfileTag) != 0) continue; pos += sizeof kIccProfileTag; uint8_t chunk_id = app[pos++]; uint8_t num_chunks = app[pos++]; if (chunk_id != num_icc + 1) continue; if (num_icc_jpeg == 0) num_icc_jpeg = num_chunks; if (num_icc_jpeg != num_chunks) continue; num_icc++; jpeg_data.app_marker_type[i] = AppMarkerType::kICC; } if (num_icc != num_icc_jpeg) { return JXL_FAILURE("Invalid ICC chunks"); } return true; } bool GetMarkerPayload(const uint8_t* data, size_t size, ByteSpan* payload) { if (size < 3) { return false; } size_t hi = data[1]; size_t lo = data[2]; size_t internal_size = (hi << 8u) | lo; // Second byte of marker is not counted towards size. if (internal_size != size - 1) { return false; } // cut second marker byte and "length" from payload. *payload = ByteSpan(data, size); payload->remove_prefix(3); return true; } Status DetectBlobs(jpeg::JPEGData& jpeg_data) { JXL_DASSERT(jpeg_data.app_data.size() == jpeg_data.app_marker_type.size()); bool have_exif = false, have_xmp = false; for (size_t i = 0; i < jpeg_data.app_data.size(); i++) { auto& marker = jpeg_data.app_data[i]; if (marker.empty() || marker[0] != kApp1) { continue; } ByteSpan payload; if (!GetMarkerPayload(marker.data(), marker.size(), &payload)) { // Something is wrong with this marker; does not care. continue; } if (!have_exif && payload.size() >= sizeof kExifTag && !memcmp(payload.data(), kExifTag, sizeof kExifTag)) { jpeg_data.app_marker_type[i] = AppMarkerType::kExif; have_exif = true; } if (!have_xmp && payload.size() >= sizeof kXMPTag && !memcmp(payload.data(), kXMPTag, sizeof kXMPTag)) { jpeg_data.app_marker_type[i] = AppMarkerType::kXMP; have_xmp = true; } } return true; } Status ParseChunkedMarker(const jpeg::JPEGData& src, uint8_t marker_type, const ByteSpan& tag, PaddedBytes* output, bool allow_permutations = false) { output->clear(); std::vector chunks; std::vector presence; size_t expected_number_of_parts = 0; bool is_first_chunk = true; size_t ordinal = 0; for (const auto& marker : src.app_data) { if (marker.empty() || marker[0] != marker_type) { continue; } ByteSpan payload; if (!GetMarkerPayload(marker.data(), marker.size(), &payload)) { // Something is wrong with this marker; does not care. continue; } if ((payload.size() < tag.size()) || memcmp(payload.data(), tag.data(), tag.size()) != 0) { continue; } payload.remove_prefix(tag.size()); if (payload.size() < 2) { return JXL_FAILURE("Chunk is too small."); } uint8_t index = payload[0]; uint8_t total = payload[1]; ordinal++; if (!allow_permutations) { if (index != ordinal) return JXL_FAILURE("Invalid chunk order."); } payload.remove_prefix(2); JXL_RETURN_IF_ERROR(total != 0); if (is_first_chunk) { is_first_chunk = false; expected_number_of_parts = total; // 1-based indices; 0-th element is added for convenience. chunks.resize(total + 1); presence.resize(total + 1); } else { JXL_RETURN_IF_ERROR(expected_number_of_parts == total); } if (index == 0 || index > total) { return JXL_FAILURE("Invalid chunk index."); } if (presence[index]) { return JXL_FAILURE("Duplicate chunk."); } presence[index] = true; chunks[index] = payload; } for (size_t i = 0; i < expected_number_of_parts; ++i) { // 0-th element is not used. size_t index = i + 1; if (!presence[index]) { return JXL_FAILURE("Missing chunk."); } output->append(chunks[index]); } return true; } Status SetBlobsFromJpegData(const jpeg::JPEGData& jpeg_data, Blobs* blobs) { for (size_t i = 0; i < jpeg_data.app_data.size(); i++) { auto& marker = jpeg_data.app_data[i]; if (marker.empty() || marker[0] != kApp1) { continue; } ByteSpan payload; if (!GetMarkerPayload(marker.data(), marker.size(), &payload)) { // Something is wrong with this marker; does not care. continue; } if (payload.size() >= sizeof kExifTag && !memcmp(payload.data(), kExifTag, sizeof kExifTag)) { if (blobs->exif.empty()) { blobs->exif.resize(payload.size() - sizeof kExifTag); memcpy(blobs->exif.data(), payload.data() + sizeof kExifTag, payload.size() - sizeof kExifTag); } else { JXL_WARNING( "ReJPEG: multiple Exif blobs, storing only first one in the JPEG " "XL container\n"); } } if (payload.size() >= sizeof kXMPTag && !memcmp(payload.data(), kXMPTag, sizeof kXMPTag)) { if (blobs->xmp.empty()) { blobs->xmp.resize(payload.size() - sizeof kXMPTag); memcpy(blobs->xmp.data(), payload.data() + sizeof kXMPTag, payload.size() - sizeof kXMPTag); } else { JXL_WARNING( "ReJPEG: multiple XMP blobs, storing only first one in the JPEG " "XL container\n"); } } } return true; } static inline bool IsJPG(const Span bytes) { return bytes.size() >= 2 && bytes[0] == 0xFF && bytes[1] == 0xD8; } } // namespace Status SetColorEncodingFromJpegData(const jpeg::JPEGData& jpg, ColorEncoding* color_encoding) { PaddedBytes icc_profile; if (!ParseChunkedMarker(jpg, kApp2, ByteSpan(kIccProfileTag), &icc_profile)) { JXL_WARNING("ReJPEG: corrupted ICC profile\n"); icc_profile.clear(); } if (icc_profile.empty()) { bool is_gray = (jpg.components.size() == 1); *color_encoding = ColorEncoding::SRGB(is_gray); return true; } return color_encoding->SetICC(std::move(icc_profile)); } Status EncodeJPEGData(JPEGData& jpeg_data, PaddedBytes* bytes, const CompressParams& cparams) { jpeg_data.app_marker_type.resize(jpeg_data.app_data.size(), AppMarkerType::kUnknown); JXL_RETURN_IF_ERROR(DetectIccProfile(jpeg_data)); JXL_RETURN_IF_ERROR(DetectBlobs(jpeg_data)); BitWriter writer; JXL_RETURN_IF_ERROR(Bundle::Write(jpeg_data, &writer, 0, nullptr)); writer.ZeroPadToByte(); *bytes = std::move(writer).TakeBytes(); BrotliEncoderState* brotli_enc = BrotliEncoderCreateInstance(nullptr, nullptr, nullptr); int effort = cparams.brotli_effort; if (effort < 0) effort = 11 - static_cast(cparams.speed_tier); BrotliEncoderSetParameter(brotli_enc, BROTLI_PARAM_QUALITY, effort); size_t total_data = 0; for (size_t i = 0; i < jpeg_data.app_data.size(); i++) { if (jpeg_data.app_marker_type[i] != AppMarkerType::kUnknown) { continue; } total_data += jpeg_data.app_data[i].size(); } for (size_t i = 0; i < jpeg_data.com_data.size(); i++) { total_data += jpeg_data.com_data[i].size(); } for (size_t i = 0; i < jpeg_data.inter_marker_data.size(); i++) { total_data += jpeg_data.inter_marker_data[i].size(); } total_data += jpeg_data.tail_data.size(); size_t initial_size = bytes->size(); size_t brotli_capacity = BrotliEncoderMaxCompressedSize(total_data); BrotliEncoderSetParameter(brotli_enc, BROTLI_PARAM_SIZE_HINT, total_data); bytes->resize(bytes->size() + brotli_capacity); size_t enc_size = 0; auto br_append = [&](const std::vector& data, bool last) { size_t available_in = data.size(); const uint8_t* in = data.data(); uint8_t* out = &(*bytes)[initial_size + enc_size]; do { uint8_t* out_before = out; msan::MemoryIsInitialized(in, available_in); JXL_CHECK(BrotliEncoderCompressStream( brotli_enc, last ? BROTLI_OPERATION_FINISH : BROTLI_OPERATION_PROCESS, &available_in, &in, &brotli_capacity, &out, &enc_size)); msan::UnpoisonMemory(out_before, out - out_before); } while (BrotliEncoderHasMoreOutput(brotli_enc) || available_in > 0); }; for (size_t i = 0; i < jpeg_data.app_data.size(); i++) { if (jpeg_data.app_marker_type[i] != AppMarkerType::kUnknown) { continue; } br_append(jpeg_data.app_data[i], /*last=*/false); } for (size_t i = 0; i < jpeg_data.com_data.size(); i++) { br_append(jpeg_data.com_data[i], /*last=*/false); } for (size_t i = 0; i < jpeg_data.inter_marker_data.size(); i++) { br_append(jpeg_data.inter_marker_data[i], /*last=*/false); } br_append(jpeg_data.tail_data, /*last=*/true); BrotliEncoderDestroyInstance(brotli_enc); bytes->resize(initial_size + enc_size); return true; } Status DecodeImageJPG(const Span bytes, CodecInOut* io) { if (!IsJPG(bytes)) return false; io->frames.clear(); io->frames.reserve(1); io->frames.emplace_back(&io->metadata.m); io->Main().jpeg_data = make_unique(); jpeg::JPEGData* jpeg_data = io->Main().jpeg_data.get(); if (!jpeg::ReadJpeg(bytes.data(), bytes.size(), jpeg::JpegReadMode::kReadAll, jpeg_data)) { return JXL_FAILURE("Error reading JPEG"); } JXL_RETURN_IF_ERROR( SetColorEncodingFromJpegData(*jpeg_data, &io->metadata.m.color_encoding)); JXL_RETURN_IF_ERROR(SetBlobsFromJpegData(*jpeg_data, &io->blobs)); size_t nbcomp = jpeg_data->components.size(); if (nbcomp != 1 && nbcomp != 3) { return JXL_FAILURE("Cannot recompress JPEGs with neither 1 nor 3 channels"); } YCbCrChromaSubsampling cs; if (nbcomp == 3) { uint8_t hsample[3], vsample[3]; for (size_t i = 0; i < nbcomp; i++) { hsample[i] = jpeg_data->components[i].h_samp_factor; vsample[i] = jpeg_data->components[i].v_samp_factor; } JXL_RETURN_IF_ERROR(cs.Set(hsample, vsample)); } else if (nbcomp == 1) { uint8_t hsample[3], vsample[3]; for (size_t i = 0; i < 3; i++) { hsample[i] = jpeg_data->components[0].h_samp_factor; vsample[i] = jpeg_data->components[0].v_samp_factor; } JXL_RETURN_IF_ERROR(cs.Set(hsample, vsample)); } bool is_rgb = false; { const auto& markers = jpeg_data->marker_order; // If there is a JFIF marker, this is YCbCr. Otherwise... if (std::find(markers.begin(), markers.end(), 0xE0) == markers.end()) { // Try to find an 'Adobe' marker. size_t app_markers = 0; size_t i = 0; for (; i < markers.size(); i++) { // This is an APP marker. if ((markers[i] & 0xF0) == 0xE0) { JXL_CHECK(app_markers < jpeg_data->app_data.size()); // APP14 marker if (markers[i] == 0xEE) { const auto& data = jpeg_data->app_data[app_markers]; if (data.size() == 15 && data[3] == 'A' && data[4] == 'd' && data[5] == 'o' && data[6] == 'b' && data[7] == 'e') { // 'Adobe' marker. is_rgb = data[14] == 0; break; } } app_markers++; } } if (i == markers.size()) { // No 'Adobe' marker, guess from component IDs. is_rgb = nbcomp == 3 && jpeg_data->components[0].id == 'R' && jpeg_data->components[1].id == 'G' && jpeg_data->components[2].id == 'B'; } } } io->Main().chroma_subsampling = cs; io->Main().color_transform = (!is_rgb || nbcomp == 1) ? ColorTransform::kYCbCr : ColorTransform::kNone; io->metadata.m.SetIntensityTarget(kDefaultIntensityTarget); io->metadata.m.SetUintSamples(BITS_IN_JSAMPLE); io->SetFromImage(Image3F(jpeg_data->width, jpeg_data->height), io->metadata.m.color_encoding); SetIntensityTarget(io); return true; } } // namespace jpeg } // namespace jxl