// This file is part of OpenCV project. // It is subject to the license terms in the LICENSE file found in the top-level // directory of this distribution and at http://opencv.org/license.html #include "precomp.hpp" #ifdef HAVE_AVIF #include #include #include #include #include "opencv2/imgproc.hpp" #include "grfmt_avif.hpp" #define CV_AVIF_USE_QUALITY \ (AVIF_VERSION > ((0 * 1000000) + (11 * 10000) + (1 * 100))) #if !CV_AVIF_USE_QUALITY #define AVIF_QUALITY_LOSSLESS 100 #define AVIF_QUALITY_WORST 0 #define AVIF_QUALITY_BEST 100 #endif namespace cv { namespace { struct AvifImageDeleter { void operator()(avifImage *image) { avifImageDestroy(image); } }; using AvifImageUniquePtr = std::unique_ptr; avifResult CopyToMat(const avifImage *image, int channels, Mat *mat) { CV_Assert((int)image->height == mat->rows); CV_Assert((int)image->width == mat->cols); if (channels == 1) { const cv::Mat image_wrap = cv::Mat(image->height, image->width, CV_MAKE_TYPE((image->depth == 8) ? CV_8U : CV_16U, 1), image->yuvPlanes[0], image->yuvRowBytes[0]); if ((image->depth == 8 && mat->depth() == CV_8U) || (image->depth > 8 && mat->depth() == CV_16U)) { image_wrap.copyTo(*mat); } else { CV_Assert(image->depth > 8 && mat->depth() == CV_8U); image_wrap.convertTo(*mat, CV_8U, 1. / (1 << (image->depth - 8))); } return AVIF_RESULT_OK; } avifRGBImage rgba; avifRGBImageSetDefaults(&rgba, image); if (channels == 3) { rgba.format = AVIF_RGB_FORMAT_BGR; } else { CV_Assert(channels == 4); rgba.format = AVIF_RGB_FORMAT_BGRA; } rgba.rowBytes = mat->step[0]; rgba.depth = (mat->depth() == CV_16U) ? image->depth : 8; rgba.pixels = reinterpret_cast(mat->data); return avifImageYUVToRGB(image, &rgba); } AvifImageUniquePtr ConvertToAvif(const cv::Mat &img, bool lossless, int bit_depth) { CV_Assert(img.depth() == CV_8U || img.depth() == CV_16U); const int width = img.cols; const int height = img.rows; avifImage *result; if (img.channels() == 1) { result = avifImageCreateEmpty(); if (result == nullptr) return nullptr; result->width = width; result->height = height; result->depth = bit_depth; result->yuvFormat = AVIF_PIXEL_FORMAT_YUV400; result->colorPrimaries = AVIF_COLOR_PRIMARIES_UNSPECIFIED; result->transferCharacteristics = AVIF_TRANSFER_CHARACTERISTICS_UNSPECIFIED; result->matrixCoefficients = AVIF_MATRIX_COEFFICIENTS_IDENTITY; result->yuvRange = AVIF_RANGE_FULL; result->yuvPlanes[0] = img.data; result->yuvRowBytes[0] = img.step[0]; result->imageOwnsYUVPlanes = AVIF_FALSE; return AvifImageUniquePtr(result); } if (lossless) { result = avifImageCreate(width, height, bit_depth, AVIF_PIXEL_FORMAT_YUV444); if (result == nullptr) return nullptr; result->colorPrimaries = AVIF_COLOR_PRIMARIES_UNSPECIFIED; result->transferCharacteristics = AVIF_TRANSFER_CHARACTERISTICS_UNSPECIFIED; result->matrixCoefficients = AVIF_MATRIX_COEFFICIENTS_IDENTITY; result->yuvRange = AVIF_RANGE_FULL; } else { result = avifImageCreate(width, height, bit_depth, AVIF_PIXEL_FORMAT_YUV420); if (result == nullptr) return nullptr; result->colorPrimaries = AVIF_COLOR_PRIMARIES_BT709; result->transferCharacteristics = AVIF_TRANSFER_CHARACTERISTICS_SRGB; result->matrixCoefficients = AVIF_MATRIX_COEFFICIENTS_BT601; result->yuvRange = AVIF_RANGE_FULL; } avifRGBImage rgba; avifRGBImageSetDefaults(&rgba, result); if (img.channels() == 3) { rgba.format = AVIF_RGB_FORMAT_BGR; } else { CV_Assert(img.channels() == 4); rgba.format = AVIF_RGB_FORMAT_BGRA; } rgba.rowBytes = img.step[0]; rgba.depth = bit_depth; rgba.pixels = const_cast(reinterpret_cast(img.data)); if (avifImageRGBToYUV(result, &rgba) != AVIF_RESULT_OK) { avifImageDestroy(result); return nullptr; } return AvifImageUniquePtr(result); } } // namespace // 64Mb limit to avoid memory saturation. static const size_t kParamMaxFileSize = utils::getConfigurationParameterSizeT( "OPENCV_IMGCODECS_AVIF_MAX_FILE_SIZE", 64 * 1024 * 1024); static constexpr size_t kAvifSignatureSize = 500; AvifDecoder::AvifDecoder() { m_buf_supported = true; channels_ = 0; decoder_ = avifDecoderCreate(); } AvifDecoder::~AvifDecoder() { if (decoder_ != nullptr) avifDecoderDestroy(decoder_); } size_t AvifDecoder::signatureLength() const { return kAvifSignatureSize; } #define OPENCV_AVIF_CHECK_STATUS(X, ENCDEC) \ { \ const avifResult status = (X); \ if (status != AVIF_RESULT_OK) { \ const std::string error(ENCDEC->diag.error); \ CV_Error(Error::StsParseError, \ error + " " + avifResultToString(status)); \ return false; \ } \ } bool AvifDecoder::checkSignature(const String &signature) const { std::unique_ptr decoder( avifDecoderCreate(), avifDecoderDestroy); if (!decoder) return false; OPENCV_AVIF_CHECK_STATUS( avifDecoderSetIOMemory( decoder.get(), reinterpret_cast(signature.c_str()), signature.size()), decoder); decoder->io->sizeHint = 1e9; const avifResult status = avifDecoderParse(decoder.get()); return (status == AVIF_RESULT_OK || status == AVIF_RESULT_TRUNCATED_DATA); } ImageDecoder AvifDecoder::newDecoder() const { return makePtr(); } bool AvifDecoder::readHeader() { if (!m_buf.empty()) { CV_Assert(m_buf.type() == CV_8UC1); CV_Assert(m_buf.rows == 1); } OPENCV_AVIF_CHECK_STATUS( m_buf.empty() ? avifDecoderSetIOFile(decoder_, m_filename.c_str()) : avifDecoderSetIOMemory( decoder_, reinterpret_cast(m_buf.data), m_buf.total()), decoder_); OPENCV_AVIF_CHECK_STATUS(avifDecoderParse(decoder_), decoder_); m_width = decoder_->image->width; m_height = decoder_->image->height; channels_ = (decoder_->image->yuvFormat == AVIF_PIXEL_FORMAT_YUV400) ? 1 : 3; if (decoder_->alphaPresent) ++channels_; bit_depth_ = decoder_->image->depth; CV_Assert(bit_depth_ == 8 || bit_depth_ == 10 || bit_depth_ == 12); m_type = CV_MAKETYPE(bit_depth_ == 8 ? CV_8U : CV_16U, channels_); is_first_image_ = true; return true; } bool AvifDecoder::readData(Mat &img) { CV_CheckGE(m_width, 0, ""); CV_CheckGE(m_height, 0, ""); CV_CheckEQ(img.cols, m_width, ""); CV_CheckEQ(img.rows, m_height, ""); CV_CheckType( img.type(), (img.channels() == 1 || img.channels() == 3 || img.channels() == 4) && (img.depth() == CV_8U || img.depth() == CV_16U), "AVIF only supports 1, 3, 4 channels and CV_8U and CV_16U"); Mat read_img; if (img.channels() == channels_) { read_img = img; } else { // Use the asked depth but keep the number of channels. OpenCV and not // libavif will do the color conversion. read_img.create(m_height, m_width, CV_MAKE_TYPE(img.depth(), channels_)); } if (is_first_image_) { if (!nextPage()) return false; is_first_image_ = false; } if (CopyToMat(decoder_->image, channels_, &read_img) != AVIF_RESULT_OK) { CV_Error(Error::StsInternal, "Cannot convert from AVIF to Mat"); return false; } if (decoder_->image->exif.size > 0) { m_exif.parseExif(decoder_->image->exif.data, decoder_->image->exif.size); } if (img.channels() == channels_) { // We already wrote to the right buffer. } else { if (channels_ == 1 && img.channels() == 3) { cvtColor(read_img, img, COLOR_GRAY2BGR); } else if (channels_ == 1 && img.channels() == 4) { cvtColor(read_img, img, COLOR_GRAY2BGRA); } else if (channels_ == 3 && img.channels() == 1) { cvtColor(read_img, img, COLOR_BGR2GRAY); } else if (channels_ == 3 && img.channels() == 4) { cvtColor(read_img, img, COLOR_BGR2BGRA); } else if (channels_ == 4 && img.channels() == 1) { cvtColor(read_img, img, COLOR_BGRA2GRAY); } else if (channels_ == 4 && img.channels() == 3) { cvtColor(read_img, img, COLOR_BGRA2BGR); } else { CV_Error(Error::StsInternal, ""); } } return true; } bool AvifDecoder::nextPage() { const avifResult status = avifDecoderNextImage(decoder_); if (status == AVIF_RESULT_NO_IMAGES_REMAINING) return false; if (status != AVIF_RESULT_OK) { const std::string error(decoder_->diag.error); CV_Error(Error::StsParseError, error + " " + avifResultToString(status)); return false; } return true; } //////////////////////////////////////////////////////////////////////////////// AvifEncoder::AvifEncoder() { m_description = "AVIF files (*.avif)"; m_buf_supported = true; encoder_ = avifEncoderCreate(); } AvifEncoder::~AvifEncoder() { if (encoder_) avifEncoderDestroy(encoder_); } bool AvifEncoder::isFormatSupported(int depth) const { return (depth == CV_8U || depth == CV_16U); } bool AvifEncoder::write(const Mat &img, const std::vector ¶ms) { std::vector img_vec(1, img); return writeToOutput(img_vec, params); } bool AvifEncoder::writemulti(const std::vector &img_vec, const std::vector ¶ms) { return writeToOutput(img_vec, params); } bool AvifEncoder::writeToOutput(const std::vector &img_vec, const std::vector ¶ms) { int bit_depth = 8; int speed = AVIF_SPEED_FASTEST; for (size_t i = 0; i < params.size(); i += 2) { if (params[i] == IMWRITE_AVIF_QUALITY) { const int quality = std::min(std::max(params[i + 1], AVIF_QUALITY_WORST), AVIF_QUALITY_BEST); #if CV_AVIF_USE_QUALITY encoder_->quality = quality; #else encoder_->minQuantizer = encoder_->maxQuantizer = (AVIF_QUANTIZER_BEST_QUALITY - AVIF_QUANTIZER_WORST_QUALITY) * quality / (AVIF_QUALITY_BEST - AVIF_QUALITY_WORST) + AVIF_QUANTIZER_WORST_QUALITY; #endif } else if (params[i] == IMWRITE_AVIF_DEPTH) { bit_depth = params[i + 1]; } else if (params[i] == IMWRITE_AVIF_SPEED) { speed = params[i + 1]; } } avifRWData output_ori = AVIF_DATA_EMPTY; std::unique_ptr output(&output_ori, avifRWDataFree); #if CV_AVIF_USE_QUALITY const bool do_lossless = (encoder_->quality == AVIF_QUALITY_LOSSLESS); #else const bool do_lossless = (encoder_->minQuantizer == AVIF_QUANTIZER_BEST_QUALITY && encoder_->maxQuantizer == AVIF_QUANTIZER_BEST_QUALITY); #endif encoder_->speed = speed; const avifAddImageFlags flag = (img_vec.size() == 1) ? AVIF_ADD_IMAGE_FLAG_SINGLE : AVIF_ADD_IMAGE_FLAG_NONE; std::vector images; std::vector imgs_scaled; for (const cv::Mat &img : img_vec) { CV_CheckType( img.type(), (bit_depth == 8 && img.depth() == CV_8U) || ((bit_depth == 10 || bit_depth == 12) && img.depth() == CV_16U), "AVIF only supports bit depth of 8 with CV_8U input or " "bit depth of 10 or 12 with CV_16U input"); CV_Check(img.channels(), img.channels() == 1 || img.channels() == 3 || img.channels() == 4, "AVIF only supports 1, 3, 4 channels"); images.emplace_back(ConvertToAvif(img, do_lossless, bit_depth)); } for (const AvifImageUniquePtr &image : images) { OPENCV_AVIF_CHECK_STATUS( avifEncoderAddImage(encoder_, image.get(), /*durationInTimescale=*/1, flag), encoder_); } OPENCV_AVIF_CHECK_STATUS(avifEncoderFinish(encoder_, output.get()), encoder_); if (m_buf) { m_buf->resize(output->size); std::memcpy(m_buf->data(), output->data, output->size); } else { std::ofstream(m_filename, std::ofstream::binary) .write(reinterpret_cast(output->data), output->size); } return (output->size > 0); } ImageEncoder AvifEncoder::newEncoder() const { return makePtr(); } } // namespace cv #endif