// Copyright (c) the JPEG XL Project Authors. All rights reserved. // // Use of this source code is governed by a BSD-style // license that can be found in the LICENSE file. #ifndef LIB_JXL_IMAGE_H_ #define LIB_JXL_IMAGE_H_ // SIMD/multicore-friendly planar image representation with row accessors. #include #include #include #include #include #include #include // std::move #include "lib/jxl/base/cache_aligned.h" #include "lib/jxl/base/compiler_specific.h" #include "lib/jxl/base/status.h" #include "lib/jxl/common.h" namespace jxl { // Helper function to create rows that are multiples of SIMD vector size. size_t VectorSize(); // Type-independent parts of Plane<> - reduces code duplication and facilitates // moving member function implementations to cc file. struct PlaneBase { PlaneBase() : xsize_(0), ysize_(0), orig_xsize_(0), orig_ysize_(0), bytes_per_row_(0), bytes_(nullptr) {} PlaneBase(size_t xsize, size_t ysize, size_t sizeof_t); // Copy construction/assignment is forbidden to avoid inadvertent copies, // which can be very expensive. Use CopyImageTo() instead. PlaneBase(const PlaneBase& other) = delete; PlaneBase& operator=(const PlaneBase& other) = delete; // Move constructor (required for returning Image from function) PlaneBase(PlaneBase&& other) noexcept = default; // Move assignment (required for std::vector) PlaneBase& operator=(PlaneBase&& other) noexcept = default; void Swap(PlaneBase& other); // Useful for pre-allocating image with some padding for alignment purposes // and later reporting the actual valid dimensions. May also be used to // un-shrink the image. Caller is responsible for ensuring xsize/ysize are <= // the original dimensions. void ShrinkTo(const size_t xsize, const size_t ysize) { JXL_CHECK(xsize <= orig_xsize_); JXL_CHECK(ysize <= orig_ysize_); xsize_ = static_cast(xsize); ysize_ = static_cast(ysize); // NOTE: we can't recompute bytes_per_row for more compact storage and // better locality because that would invalidate the image contents. } // How many pixels. JXL_INLINE size_t xsize() const { return xsize_; } JXL_INLINE size_t ysize() const { return ysize_; } // NOTE: do not use this for copying rows - the valid xsize may be much less. JXL_INLINE size_t bytes_per_row() const { return bytes_per_row_; } // Raw access to byte contents, for interfacing with other libraries. // Unsigned char instead of char to avoid surprises (sign extension). JXL_INLINE uint8_t* bytes() { void* p = bytes_.get(); return static_cast(JXL_ASSUME_ALIGNED(p, 64)); } JXL_INLINE const uint8_t* bytes() const { const void* p = bytes_.get(); return static_cast(JXL_ASSUME_ALIGNED(p, 64)); } protected: // Returns pointer to the start of a row. JXL_INLINE void* VoidRow(const size_t y) const { #if defined(ADDRESS_SANITIZER) || defined(MEMORY_SANITIZER) || \ defined(THREAD_SANITIZER) if (y >= ysize_) { JXL_ABORT("Row(%" PRIu64 ") in (%u x %u) image\n", (uint64_t)y, xsize_, ysize_); } #endif void* row = bytes_.get() + y * bytes_per_row_; return JXL_ASSUME_ALIGNED(row, 64); } enum class Padding { // Allow Load(d, row + x) for x = 0; x < xsize(); x += Lanes(d). Default. kRoundUp, // Allow LoadU(d, row + x) for x = xsize() - 1. This requires an extra // vector to be initialized. If done by default, this would suppress // legitimate msan warnings. We therefore require users to explicitly call // InitializePadding before using unaligned loads (e.g. convolution). kUnaligned }; // Initializes the minimum bytes required to suppress msan warnings from // legitimate (according to Padding mode) vector loads/stores on the right // border, where some lanes are uninitialized and assumed to be unused. void InitializePadding(size_t sizeof_t, Padding padding); // (Members are non-const to enable assignment during move-assignment.) uint32_t xsize_; // In valid pixels, not including any padding. uint32_t ysize_; uint32_t orig_xsize_; uint32_t orig_ysize_; size_t bytes_per_row_; // Includes padding. CacheAlignedUniquePtr bytes_; }; // Single channel, aligned rows separated by padding. T must be POD. // // 'Single channel' (one 2D array per channel) simplifies vectorization // (repeating the same operation on multiple adjacent components) without the // complexity of a hybrid layout (8 R, 8 G, 8 B, ...). In particular, clients // can easily iterate over all components in a row and Image requires no // knowledge of the pixel format beyond the component type "T". // // 'Aligned' means each row is aligned to the L1 cache line size. This prevents // false sharing between two threads operating on adjacent rows. // // 'Padding' is still relevant because vectors could potentially be larger than // a cache line. By rounding up row sizes to the vector size, we allow // reading/writing ALIGNED vectors whose first lane is a valid sample. This // avoids needing a separate loop to handle remaining unaligned lanes. // // This image layout could also be achieved with a vector and a row accessor // function, but a class wrapper with support for "deleter" allows wrapping // existing memory allocated by clients without copying the pixels. It also // provides convenient accessors for xsize/ysize, which shortens function // argument lists. Supports move-construction so it can be stored in containers. template class Plane : public PlaneBase { public: using T = ComponentType; static constexpr size_t kNumPlanes = 1; Plane() = default; Plane(const size_t xsize, const size_t ysize) : PlaneBase(xsize, ysize, sizeof(T)) {} void InitializePaddingForUnalignedAccesses() { InitializePadding(sizeof(T), Padding::kUnaligned); } JXL_INLINE T* Row(const size_t y) { return static_cast(VoidRow(y)); } // Returns pointer to const (see above). JXL_INLINE const T* Row(const size_t y) const { return static_cast(VoidRow(y)); } // Documents that the access is const. JXL_INLINE const T* ConstRow(const size_t y) const { return static_cast(VoidRow(y)); } // Returns number of pixels (some of which are padding) per row. Useful for // computing other rows via pointer arithmetic. WARNING: this must // NOT be used to determine xsize. JXL_INLINE intptr_t PixelsPerRow() const { return static_cast(bytes_per_row_ / sizeof(T)); } }; using ImageSB = Plane; using ImageB = Plane; using ImageS = Plane; // signed integer or half-float using ImageU = Plane; using ImageI = Plane; using ImageF = Plane; using ImageD = Plane; // Also works for Image3 and mixed argument types. template bool SameSize(const Image1& image1, const Image2& image2) { return image1.xsize() == image2.xsize() && image1.ysize() == image2.ysize(); } template class Image3; // Rectangular region in image(s). Factoring this out of Image instead of // shifting the pointer by x0/y0 allows this to apply to multiple images with // different resolutions (e.g. color transform and quantization field). // Can compare using SameSize(rect1, rect2). template class RectT { public: // Most windows are xsize_max * ysize_max, except those on the borders where // begin + size_max > end. constexpr RectT(T xbegin, T ybegin, size_t xsize_max, size_t ysize_max, T xend, T yend) : x0_(xbegin), y0_(ybegin), xsize_(ClampedSize(xbegin, xsize_max, xend)), ysize_(ClampedSize(ybegin, ysize_max, yend)) {} // Construct with origin and known size (typically from another Rect). constexpr RectT(T xbegin, T ybegin, size_t xsize, size_t ysize) : x0_(xbegin), y0_(ybegin), xsize_(xsize), ysize_(ysize) {} // Construct a rect that covers a whole image/plane/ImageBundle etc. template explicit RectT(const ImageT& image) : RectT(0, 0, image.xsize(), image.ysize()) {} RectT() : RectT(0, 0, 0, 0) {} RectT(const RectT&) = default; RectT& operator=(const RectT&) = default; // Construct a subrect that resides in an image/plane/ImageBundle etc. template RectT Crop(const ImageT& image) const { return Intersection(RectT(image)); } // Construct a subrect that resides in the [0, ysize) x [0, xsize) region of // the current rect. RectT Crop(size_t area_xsize, size_t area_ysize) const { return Intersection(RectT(0, 0, area_xsize, area_ysize)); } // Returns a rect that only contains `num` lines with offset `y` from `y0()`. RectT Lines(size_t y, size_t num) const { JXL_DASSERT(y + num <= ysize_); return RectT(x0_, y0_ + y, xsize_, num); } RectT Line(size_t y) const { return Lines(y, 1); } JXL_MUST_USE_RESULT RectT Intersection(const RectT& other) const { return RectT(std::max(x0_, other.x0_), std::max(y0_, other.y0_), xsize_, ysize_, std::min(x1(), other.x1()), std::min(y1(), other.y1())); } JXL_MUST_USE_RESULT RectT Translate(int64_t x_offset, int64_t y_offset) const { return RectT(x0_ + x_offset, y0_ + y_offset, xsize_, ysize_); } template V* Row(Plane* image, size_t y) const { JXL_DASSERT(y + y0_ >= 0); return image->Row(y + y0_) + x0_; } template const V* Row(const Plane* image, size_t y) const { JXL_DASSERT(y + y0_ >= 0); return image->Row(y + y0_) + x0_; } template V* PlaneRow(Image3* image, const size_t c, size_t y) const { JXL_DASSERT(y + y0_ >= 0); return image->PlaneRow(c, y + y0_) + x0_; } template const V* ConstRow(const Plane& image, size_t y) const { JXL_DASSERT(y + y0_ >= 0); return image.ConstRow(y + y0_) + x0_; } template const V* ConstPlaneRow(const Image3& image, size_t c, size_t y) const { JXL_DASSERT(y + y0_ >= 0); return image.ConstPlaneRow(c, y + y0_) + x0_; } bool IsInside(const RectT& other) const { return x0_ >= other.x0() && x1() <= other.x1() && y0_ >= other.y0() && y1() <= other.y1(); } // Returns true if this Rect fully resides in the given image. ImageT could be // Plane or Image3; however if ImageT is Rect, results are nonsensical. template bool IsInside(const ImageT& image) const { return IsInside(RectT(image)); } T x0() const { return x0_; } T y0() const { return y0_; } size_t xsize() const { return xsize_; } size_t ysize() const { return ysize_; } T x1() const { return x0_ + xsize_; } T y1() const { return y0_ + ysize_; } RectT ShiftLeft(size_t shiftx, size_t shifty) const { return RectT(x0_ * (1 << shiftx), y0_ * (1 << shifty), xsize_ << shiftx, ysize_ << shifty); } RectT ShiftLeft(size_t shift) const { return ShiftLeft(shift, shift); } // Requires x0(), y0() to be multiples of 1< CeilShiftRight(size_t shiftx, size_t shifty) const { JXL_ASSERT(x0_ % (1 << shiftx) == 0); JXL_ASSERT(y0_ % (1 << shifty) == 0); return RectT(x0_ / (1 << shiftx), y0_ / (1 << shifty), DivCeil(xsize_, T{1} << shiftx), DivCeil(ysize_, T{1} << shifty)); } RectT CeilShiftRight(std::pair shift) const { return CeilShiftRight(shift.first, shift.second); } RectT CeilShiftRight(size_t shift) const { return CeilShiftRight(shift, shift); } template RectT As() const { return RectT(U(x0_), U(y0_), U(xsize_), U(ysize_)); } private: // Returns size_max, or whatever is left in [begin, end). static constexpr size_t ClampedSize(T begin, size_t size_max, T end) { return (static_cast(begin + size_max) <= end) ? size_max : (end > begin ? end - begin : 0); } T x0_; T y0_; size_t xsize_; size_t ysize_; }; template std::string Description(RectT r) { std::ostringstream os; os << "[" << r.x0() << ".." << r.x1() << ")x" << "[" << r.y0() << ".." << r.y1() << ")"; return os.str(); } using Rect = RectT; // Currently, we abuse Image to either refer to an image that owns its storage // or one that doesn't. In similar vein, we abuse Image* function parameters to // either mean "assign to me" or "fill the provided image with data". // Hopefully, the "assign to me" meaning will go away and most images in the // codebase will not be backed by own storage. When this happens we can redesign // Image to be a non-storage-holding view class and introduce BackedImage in // those places that actually need it. // NOTE: we can't use Image as a view because invariants are violated // (alignment and the presence of padding before/after each "row"). // A bundle of 3 same-sized images. Typically constructed by moving from three // rvalue references to Image. To overwrite an existing Image3 using // single-channel producers, we also need access to Image*. Constructing // temporary non-owning Image pointing to one plane of an existing Image3 risks // dangling references, especially if the wrapper is moved. Therefore, we // store an array of Image (which are compact enough that size is not a concern) // and provide Plane+Row accessors. template class Image3 { public: using T = ComponentType; using PlaneT = jxl::Plane; static constexpr size_t kNumPlanes = 3; Image3() : planes_{PlaneT(), PlaneT(), PlaneT()} {} Image3(const size_t xsize, const size_t ysize) : planes_{PlaneT(xsize, ysize), PlaneT(xsize, ysize), PlaneT(xsize, ysize)} {} Image3(Image3&& other) noexcept { for (size_t i = 0; i < kNumPlanes; i++) { planes_[i] = std::move(other.planes_[i]); } } Image3(PlaneT&& plane0, PlaneT&& plane1, PlaneT&& plane2) { JXL_CHECK(SameSize(plane0, plane1)); JXL_CHECK(SameSize(plane0, plane2)); planes_[0] = std::move(plane0); planes_[1] = std::move(plane1); planes_[2] = std::move(plane2); } // Copy construction/assignment is forbidden to avoid inadvertent copies, // which can be very expensive. Use CopyImageTo instead. Image3(const Image3& other) = delete; Image3& operator=(const Image3& other) = delete; Image3& operator=(Image3&& other) noexcept { for (size_t i = 0; i < kNumPlanes; i++) { planes_[i] = std::move(other.planes_[i]); } return *this; } // Returns row pointer; usage: PlaneRow(idx_plane, y)[x] = val. JXL_INLINE T* PlaneRow(const size_t c, const size_t y) { // Custom implementation instead of calling planes_[c].Row ensures only a // single multiplication is needed for PlaneRow(0..2, y). PlaneRowBoundsCheck(c, y); const size_t row_offset = y * planes_[0].bytes_per_row(); void* row = planes_[c].bytes() + row_offset; return static_cast(JXL_ASSUME_ALIGNED(row, 64)); } // Returns const row pointer; usage: val = PlaneRow(idx_plane, y)[x]. JXL_INLINE const T* PlaneRow(const size_t c, const size_t y) const { PlaneRowBoundsCheck(c, y); const size_t row_offset = y * planes_[0].bytes_per_row(); const void* row = planes_[c].bytes() + row_offset; return static_cast(JXL_ASSUME_ALIGNED(row, 64)); } // Returns const row pointer, even if called from a non-const Image3. JXL_INLINE const T* ConstPlaneRow(const size_t c, const size_t y) const { PlaneRowBoundsCheck(c, y); return PlaneRow(c, y); } JXL_INLINE const PlaneT& Plane(size_t idx) const { return planes_[idx]; } JXL_INLINE PlaneT& Plane(size_t idx) { return planes_[idx]; } void Swap(Image3& other) { for (size_t c = 0; c < 3; ++c) { other.planes_[c].Swap(planes_[c]); } } // Useful for pre-allocating image with some padding for alignment purposes // and later reporting the actual valid dimensions. May also be used to // un-shrink the image. Caller is responsible for ensuring xsize/ysize are <= // the original dimensions. void ShrinkTo(const size_t xsize, const size_t ysize) { for (PlaneT& plane : planes_) { plane.ShrinkTo(xsize, ysize); } } // Sizes of all three images are guaranteed to be equal. JXL_INLINE size_t xsize() const { return planes_[0].xsize(); } JXL_INLINE size_t ysize() const { return planes_[0].ysize(); } // Returns offset [bytes] from one row to the next row of the same plane. // WARNING: this must NOT be used to determine xsize, nor for copying rows - // the valid xsize may be much less. JXL_INLINE size_t bytes_per_row() const { return planes_[0].bytes_per_row(); } // Returns number of pixels (some of which are padding) per row. Useful for // computing other rows via pointer arithmetic. WARNING: this must NOT be used // to determine xsize. JXL_INLINE intptr_t PixelsPerRow() const { return planes_[0].PixelsPerRow(); } private: void PlaneRowBoundsCheck(const size_t c, const size_t y) const { #if defined(ADDRESS_SANITIZER) || defined(MEMORY_SANITIZER) || \ defined(THREAD_SANITIZER) if (c >= kNumPlanes || y >= ysize()) { JXL_ABORT("PlaneRow(%" PRIu64 ", %" PRIu64 ") in (%" PRIu64 " x %" PRIu64 ") image\n", static_cast(c), static_cast(y), static_cast(xsize()), static_cast(ysize())); } #endif } private: PlaneT planes_[kNumPlanes]; }; using Image3B = Image3; using Image3S = Image3; using Image3U = Image3; using Image3I = Image3; using Image3F = Image3; using Image3D = Image3; } // namespace jxl #endif // LIB_JXL_IMAGE_H_