// Copyright (c) the JPEG XL Project Authors. All rights reserved. // // Use of this source code is governed by a BSD-style // license that can be found in the LICENSE file. #include #include #include #include #include #if defined(_WIN32) || defined(_WIN64) #include "third_party/dirent.h" #else #include #include #endif #include #include #include #include #include #include #if JPEGXL_ENABLE_JPEG #include "lib/extras/enc/jpg.h" #endif #include "lib/jxl/aux_out.h" #include "lib/jxl/base/data_parallel.h" #include "lib/jxl/base/file_io.h" #include "lib/jxl/base/override.h" #include "lib/jxl/base/span.h" #include "lib/jxl/base/thread_pool_internal.h" #include "lib/jxl/codec_in_out.h" #include "lib/jxl/enc_ans.h" #include "lib/jxl/enc_cache.h" #include "lib/jxl/enc_color_management.h" #include "lib/jxl/enc_external_image.h" #include "lib/jxl/enc_file.h" #include "lib/jxl/enc_params.h" #include "lib/jxl/encode_internal.h" #include "lib/jxl/jpeg/enc_jpeg_data.h" #include "lib/jxl/modular/encoding/context_predict.h" namespace { const size_t kMaxWidth = 50000; const size_t kMaxHeight = 50000; const size_t kMaxPixels = 20 * (1 << 20); // 20 MP const size_t kMaxBitDepth = 24; // The maximum reasonable bit depth supported. std::mutex stderr_mutex; typedef std::function PixelGenerator; // ImageSpec needs to be a packed struct to allow us to use the raw memory of // the struct for hashing to create a consistent. #pragma pack(push, 1) struct ImageSpec { bool Validate() const { if (width > kMaxWidth || height > kMaxHeight || width * height > kMaxPixels) { return false; } if (bit_depth > kMaxBitDepth || bit_depth == 0) return false; if (num_frames == 0) return false; // JPEG doesn't support all formats, so reconstructible JPEG isn't always // valid. if (is_reconstructible_jpeg && (bit_depth != 8 || num_channels != 3 || alpha_bit_depth != 0 || num_frames != 1)) return false; return true; } friend std::ostream& operator<<(std::ostream& o, const ImageSpec& spec) { o << "ImageSpec<" << "size=" << spec.width << "x" << spec.height << " * chan=" << spec.num_channels << " depth=" << spec.bit_depth << " alpha=" << spec.alpha_bit_depth << " (premult=" << spec.alpha_is_premultiplied << ") x frames=" << spec.num_frames << " seed=" << spec.seed << ", speed=" << static_cast(spec.params.speed_tier) << ", butteraugli=" << spec.params.butteraugli_distance << ", modular_mode=" << spec.params.modular_mode << ", lossy_palette=" << spec.params.lossy_palette << ", noise=" << spec.params.noise << ", preview=" << spec.params.preview << ", fuzzer_friendly=" << spec.fuzzer_friendly << ", is_reconstructible_jpeg=" << spec.is_reconstructible_jpeg << ", orientation=" << static_cast(spec.orientation) << ">"; return o; } void SpecHash(uint8_t hash[16]) const { const uint8_t* from = reinterpret_cast(this); std::seed_seq hasher(from, from + sizeof(*this)); uint32_t* to = reinterpret_cast(hash); hasher.generate(to, to + 4); } uint64_t width = 256; uint64_t height = 256; // Number of channels *not* including alpha. uint64_t num_channels = 3; uint64_t bit_depth = 8; // Bit depth for the alpha channel. A value of 0 means no alpha channel. uint64_t alpha_bit_depth = 8; int32_t alpha_is_premultiplied = false; // Whether the ANS fuzzer friendly setting is currently enabled. uint32_t fuzzer_friendly = false; // Number of frames, all the frames will have the same size. uint64_t num_frames = 1; // The seed for the PRNG. uint32_t seed = 7777; // Flags used for compression. These are mapped to the CompressedParams. struct CjxlParams { float butteraugli_distance = 1.f; // Must not use Weighted - see force_no_wp jxl::Predictor modular_predictor = jxl::Predictor::Gradient; jxl::ColorTransform color_transform = jxl::ColorTransform::kXYB; jxl::SpeedTier speed_tier = jxl::SpeedTier::kTortoise; bool modular_mode = false; bool lossy_palette = false; bool noise = false; bool preview = false; // CjxlParams is packed; re-add padding when sum of sizes of members is not // multiple of 4. // uint8_t padding_[0] = {}; } params; uint32_t is_reconstructible_jpeg = false; // Use 0xFFFFFFFF if any random spec is good; otherwise set the desired value. uint32_t override_decoder_spec = 0xFFFFFFFF; // Orientation. uint8_t orientation = 0; uint8_t padding_[3] = {}; }; #pragma pack(pop) static_assert(sizeof(ImageSpec) % 4 == 0, "Add padding to ImageSpec."); bool GenerateFile(const char* output_dir, const ImageSpec& spec, bool regenerate, bool quiet) { // Compute a checksum of the ImageSpec to name the file. This is just to keep // the output of this program repeatable. uint8_t checksum[16]; spec.SpecHash(checksum); std::string hash_str(sizeof(checksum) * 2, ' '); static const char* hex_chars = "0123456789abcdef"; for (size_t i = 0; i < sizeof(checksum); i++) { hash_str[2 * i] = hex_chars[checksum[i] >> 4]; hash_str[2 * i + 1] = hex_chars[checksum[i] % 0x0f]; } std::string output_fn = std::string(output_dir) + "/" + hash_str + ".jxl"; // Don't regenerate files if they already exist on disk to speed-up // consecutive calls when --regenerate is not used. struct stat st; if (!regenerate && stat(output_fn.c_str(), &st) == 0 && S_ISREG(st.st_mode)) { return true; } if (!quiet) { std::unique_lock lock(stderr_mutex); std::cerr << "Generating " << spec << " as " << hash_str << std::endl; } jxl::CodecInOut io; if (spec.bit_depth == 32) { io.metadata.m.SetFloat32Samples(); } else { io.metadata.m.SetUintSamples(spec.bit_depth); } io.metadata.m.SetAlphaBits(spec.alpha_bit_depth, spec.alpha_is_premultiplied); io.metadata.m.orientation = spec.orientation; io.dec_pixels = spec.width * spec.height; io.frames.clear(); io.frames.reserve(spec.num_frames); jxl::ColorEncoding c; if (spec.num_channels == 1) { c = jxl::ColorEncoding::LinearSRGB(true); } else if (spec.num_channels == 3) { c = jxl::ColorEncoding::SRGB(); } uint8_t hash[16]; spec.SpecHash(hash); std::mt19937 mt(spec.seed); // Compress the image. jxl::PaddedBytes compressed; std::uniform_int_distribution<> dis(1, 6); PixelGenerator gen = [&]() -> uint8_t { return dis(mt); }; for (uint32_t frame = 0; frame < spec.num_frames; frame++) { jxl::ImageBundle ib(&io.metadata.m); const bool has_alpha = spec.alpha_bit_depth != 0; const size_t bytes_per_sample = jxl::DivCeil(io.metadata.m.bit_depth.bits_per_sample, 8); const size_t bytes_per_pixel = bytes_per_sample * (io.metadata.m.color_encoding.Channels() + has_alpha); const size_t row_size = spec.width * bytes_per_pixel; std::vector img_data(row_size * spec.height, 0); for (size_t y = 0; y < spec.height; y++) { size_t pos = row_size * y; for (size_t x = 0; x < spec.width; x++) { for (size_t b = 0; b < bytes_per_pixel; b++) { img_data[pos++] = gen(); } } } const jxl::Span span(img_data.data(), img_data.size()); JXL_RETURN_IF_ERROR(ConvertFromExternal( span, spec.width, spec.height, io.metadata.m.color_encoding, bytes_per_pixel / bytes_per_sample, /*alpha_is_premultiplied=*/spec.alpha_is_premultiplied, io.metadata.m.bit_depth.bits_per_sample, JXL_LITTLE_ENDIAN, false /* flipped_y */, nullptr, &ib, /*float_in=*/false, /*align=*/0)); io.frames.push_back(std::move(ib)); } jxl::CompressParams params; params.speed_tier = spec.params.speed_tier; #if JPEGXL_ENABLE_JPEG if (spec.is_reconstructible_jpeg) { // If this image is supposed to be a reconstructible JPEG, collect the JPEG // metadata and encode it in the beginning of the compressed bytes. std::vector jpeg_bytes; JXL_RETURN_IF_ERROR(EncodeImageJPG( &io, jxl::extras::JpegEncoder::kLibJpeg, /*quality=*/70, jxl::YCbCrChromaSubsampling(), /*pool=*/nullptr, &jpeg_bytes)); JXL_RETURN_IF_ERROR(jxl::jpeg::DecodeImageJPG( jxl::Span(jpeg_bytes.data(), jpeg_bytes.size()), &io)); jxl::PaddedBytes jpeg_data; JXL_RETURN_IF_ERROR( EncodeJPEGData(*io.Main().jpeg_data, &jpeg_data, params)); std::vector header; header.insert(header.end(), jxl::kContainerHeader, jxl::kContainerHeader + sizeof(jxl::kContainerHeader)); jxl::AppendBoxHeader(jxl::MakeBoxType("jbrd"), jpeg_data.size(), false, &header); header.insert(header.end(), jpeg_data.data(), jpeg_data.data() + jpeg_data.size()); jxl::AppendBoxHeader(jxl::MakeBoxType("jxlc"), 0, true, &header); compressed.append(header); } #endif params.modular_mode = spec.params.modular_mode; params.color_transform = spec.params.color_transform; params.butteraugli_distance = spec.params.butteraugli_distance; params.options.predictor = {spec.params.modular_predictor}; params.lossy_palette = spec.params.lossy_palette; if (spec.params.preview) params.preview = jxl::Override::kOn; if (spec.params.noise) params.noise = jxl::Override::kOn; jxl::AuxOut aux_out; jxl::PassesEncoderState passes_encoder_state; // EncodeFile replaces output; pass a temporary storage for it. jxl::PaddedBytes compressed_image; bool ok = jxl::EncodeFile(params, &io, &passes_encoder_state, &compressed_image, jxl::GetJxlCms(), &aux_out, nullptr); if (!ok) return false; compressed.append(compressed_image); // Append 4 bytes with the flags used by djxl_fuzzer to select the decoding // output. std::uniform_int_distribution<> dis256(0, 255); if (spec.override_decoder_spec == 0xFFFFFFFF) { for (size_t i = 0; i < 4; ++i) compressed.push_back(dis256(mt)); } else { for (size_t i = 0; i < 4; ++i) { compressed.push_back(spec.override_decoder_spec >> (8 * i)); } } if (!jxl::WriteFile(compressed, output_fn)) return 1; if (!quiet) { std::unique_lock lock(stderr_mutex); std::cerr << "Stored " << output_fn << " size: " << compressed.size() << std::endl; } return true; } std::vector CompressParamsList() { std::vector ret; { ImageSpec::CjxlParams params; params.butteraugli_distance = 1.5; ret.push_back(params); } { // Lossless ImageSpec::CjxlParams params; params.modular_mode = true; params.color_transform = jxl::ColorTransform::kNone; params.butteraugli_distance = 0.f; params.modular_predictor = {jxl::Predictor::Weighted}; ret.push_back(params); } return ret; } void Usage() { fprintf(stderr, "Use: fuzzer_corpus [-r] [-q] [-j THREADS] [output_dir]\n" "\n" " -r Regenerate files if already exist.\n" " -q Be quiet.\n" " -j THREADS Number of parallel jobs to run.\n"); } } // namespace int main(int argc, const char** argv) { const char* dest_dir = nullptr; bool regenerate = false; bool quiet = false; int num_threads = std::thread::hardware_concurrency(); for (int optind = 1; optind < argc;) { if (!strcmp(argv[optind], "-r")) { regenerate = true; optind++; } else if (!strcmp(argv[optind], "-q")) { quiet = true; optind++; } else if (!strcmp(argv[optind], "-j")) { optind++; if (optind < argc) { num_threads = atoi(argv[optind++]); } else { fprintf(stderr, "-j needs an argument value.\n"); Usage(); return 1; } } else if (dest_dir == nullptr) { dest_dir = argv[optind++]; } else { fprintf(stderr, "Unknown parameter: \"%s\".\n", argv[optind]); Usage(); return 1; } } if (!dest_dir) { dest_dir = "corpus"; } struct stat st; memset(&st, 0, sizeof(st)); if (stat(dest_dir, &st) != 0 || !S_ISDIR(st.st_mode)) { fprintf(stderr, "Output path \"%s\" is not a directory.\n", dest_dir); Usage(); return 1; } // Create the corpus directory if doesn't already exist. std::mt19937 mt(77777); std::vector> image_sizes = { {8, 8}, {32, 32}, {128, 128}, // Degenerated cases. {10000, 1}, {10000, 2}, {1, 10000}, {2, 10000}, // Large case. {555, 256}, {257, 513}, }; const std::vector params_list = CompressParamsList(); ImageSpec spec; // The ans_fuzzer_friendly setting is not thread safe and therefore done in // an outer loop. This determines whether to use fuzzer-friendly ANS encoding. for (uint32_t fuzzer_friendly = 0; fuzzer_friendly < 2; ++fuzzer_friendly) { jxl::SetANSFuzzerFriendly(fuzzer_friendly); spec.fuzzer_friendly = fuzzer_friendly; std::vector specs; for (auto img_size : image_sizes) { spec.width = img_size.first; spec.height = img_size.second; for (uint32_t bit_depth : {1, 2, 8, 16}) { spec.bit_depth = bit_depth; for (uint32_t num_channels : {1, 3}) { spec.num_channels = num_channels; for (uint32_t alpha_bit_depth : {0, 8, 16}) { spec.alpha_bit_depth = alpha_bit_depth; if (bit_depth == 16 && alpha_bit_depth == 8) { // This mode is not supported in CopyTo(). continue; } for (uint32_t num_frames : {1, 3}) { spec.num_frames = num_frames; for (uint32_t preview : {0, 1}) { #if JPEGXL_ENABLE_JPEG for (bool reconstructible_jpeg : {false, true}) { spec.is_reconstructible_jpeg = reconstructible_jpeg; #else // JPEGXL_ENABLE_JPEG spec.is_reconstructible_jpeg = false; #endif // JPEGXL_ENABLE_JPEG for (const auto& params : params_list) { spec.params = params; spec.params.preview = preview; if (alpha_bit_depth) { spec.alpha_is_premultiplied = mt() % 2; } if (spec.width * spec.height > 1000) { // Increase the encoder speed for larger images. spec.params.speed_tier = jxl::SpeedTier::kWombat; } spec.seed = mt() % 777777; // Pick the orientation at random. It is orthogonal to all // other features. Valid values are 1 to 8. spec.orientation = 1 + (mt() % 8); if (!spec.Validate()) { if (!quiet) { std::cerr << "Skipping " << spec << std::endl; } } else { specs.push_back(spec); } } #if JPEGXL_ENABLE_JPEG } #endif // JPEGXL_ENABLE_JPEG } } } } } } specs.emplace_back(ImageSpec()); specs.back().params.lossy_palette = true; specs.back().override_decoder_spec = 0; specs.emplace_back(ImageSpec()); specs.back().params.noise = true; specs.back().override_decoder_spec = 0; jxl::ThreadPoolInternal pool{num_threads}; if (!RunOnPool( &pool, 0, specs.size(), jxl::ThreadPool::NoInit, [&specs, dest_dir, regenerate, quiet](const uint32_t task, size_t /* thread */) { const ImageSpec& spec = specs[task]; GenerateFile(dest_dir, spec, regenerate, quiet); }, "FuzzerCorpus")) { std::cerr << "Error generating fuzzer corpus" << std::endl; return 1; } } std::cerr << "Finished generating fuzzer corpus" << std::endl; return 0; }