mirror of
https://github.com/opencv/opencv.git
synced 2024-12-15 18:09:11 +08:00
934e6899f8
imgcodecs: Add rgb flag for imread and imdecode #25809 Try to `imread` images by RGB to save R-B swapping costs. ## How to use it? ``` img_rgb = cv2.imread("PATH", IMREAD_COLOR_RGB) # OpenCV decode the image by RGB format. ``` ## TODO - [x] Fix the broken code - [x] Add imread rgb test - [x] Speed test of rgb mode. ## Performance test | file name | IMREAD_COLOR | IMREAD_COLOR_RGB | | --------- | ------ | --------- | | jpg01 | 284 ms | 277 ms | | jpg02 | 376 ms | 366 ms | | png01 | 62 ms | 60 ms | | Png02 | 97 ms | 94 ms | Test with [image_test.zip](https://github.com/user-attachments/files/15982949/image_test.zip) ```.cpp string img_path = "/Users/mzh/work/data/image_test/png02.png"; int loop = 20; TickMeter t; double t0 = 10000; for (int i = 0; i < loop; i++) { t.reset(); t.start(); img_bgr = imread(img_path, IMREAD_COLOR); t.stop(); if (t.getTimeMilli() < t0) t0 = t.getTimeMilli(); } std::cout<<"bgr time = "<<t0<<std::endl; t0 = 10000; for (int i = 0; i < loop; i++) { t.reset(); t.start(); img_rgb = imread(img_path, IMREAD_COLOR_RGB); t.stop(); if (t.getTimeMilli() < t0) t0 = t.getTimeMilli(); } std::cout<<"rgb time = "<<t0<<std::endl; ``` ### Pull Request Readiness Checklist See details at https://github.com/opencv/opencv/wiki/How_to_contribute#making-a-good-pull-request - [x] I agree to contribute to the project under Apache 2 License. - [x] To the best of my knowledge, the proposed patch is not based on a code under GPL or another license that is incompatible with OpenCV - [x] The PR is proposed to the proper branch - [ ] There is a reference to the original bug report and related work - [ ] There is accuracy test, performance test and test data in opencv_extra repository, if applicable Patch to opencv_extra has the same branch name. - [ ] The feature is well documented and sample code can be built with the project CMake
265 lines
6.1 KiB
C++
265 lines
6.1 KiB
C++
// This file is part of OpenCV project.
|
|
// It is subject to the license terms in the LICENSE file found in the top-level directory
|
|
// of this distribution and at http://opencv.org/license.html.
|
|
|
|
#include "precomp.hpp"
|
|
#include "utils.hpp"
|
|
#include "grfmt_pfm.hpp"
|
|
#include <iostream>
|
|
|
|
#ifdef HAVE_IMGCODEC_PFM
|
|
|
|
namespace {
|
|
|
|
static_assert(sizeof(float) == 4, "float must be 32 bit.");
|
|
|
|
|
|
bool is_byte_order_swapped(double scale)
|
|
{
|
|
// ".pfm" format file specifies that:
|
|
// positive scale means big endianness;
|
|
// negative scale means little endianness.
|
|
|
|
#ifdef WORDS_BIGENDIAN
|
|
return scale < 0.0;
|
|
#else
|
|
return scale >= 0.0;
|
|
#endif
|
|
}
|
|
|
|
void swap_endianness(uint32_t& ui)
|
|
{
|
|
static const uint32_t A(0x000000ffU);
|
|
static const uint32_t B(0x0000ff00U);
|
|
static const uint32_t C(0x00ff0000U);
|
|
static const uint32_t D(0xff000000U);
|
|
|
|
ui = ( (ui & A) << 24 )
|
|
| ( (ui & B) << 8 )
|
|
| ( (ui & C) >> 8 )
|
|
| ( (ui & D) >> 24 );
|
|
}
|
|
|
|
template<typename T> T atoT(const std::string& s);
|
|
template<> int atoT<int>(const std::string& s) { return std::atoi(s.c_str()); }
|
|
template<> double atoT<double>(const std::string& s) { return std::atof(s.c_str()); }
|
|
|
|
template<typename T>
|
|
T read_number(cv::RLByteStream& strm)
|
|
{
|
|
// should be enough to take string representation of any number
|
|
const size_t buffer_size = 2048;
|
|
|
|
std::vector<char> buffer(buffer_size, 0);
|
|
for (size_t i = 0; i < buffer_size; ++i) {
|
|
const int intc = strm.getByte();
|
|
CV_Assert(intc >= -128 && intc < 128);
|
|
char c = static_cast<char>(intc);
|
|
if (std::isspace(c)) {
|
|
break;
|
|
}
|
|
buffer[i] = c;
|
|
}
|
|
const std::string str(buffer.begin(), buffer.end());
|
|
return atoT<T>(str);
|
|
}
|
|
|
|
template<typename T> void write_anything(cv::WLByteStream& strm, const T& t)
|
|
{
|
|
std::ostringstream ss;
|
|
ss << t;
|
|
strm.putBytes(ss.str().c_str(), static_cast<int>(ss.str().size()));
|
|
}
|
|
|
|
}
|
|
|
|
namespace cv {
|
|
|
|
PFMDecoder::~PFMDecoder()
|
|
{
|
|
}
|
|
|
|
PFMDecoder::PFMDecoder() : m_scale_factor(0), m_swap_byte_order(false)
|
|
{
|
|
m_strm.close();
|
|
}
|
|
|
|
bool PFMDecoder::readHeader()
|
|
{
|
|
if (m_buf.empty()) {
|
|
if (!m_strm.open(m_filename)) {
|
|
return false;
|
|
}
|
|
} else {
|
|
if (!m_strm.open(m_buf)) {
|
|
return false;
|
|
}
|
|
}
|
|
|
|
if (m_strm.getByte() != 'P') {
|
|
CV_Error(Error::StsError, "Unexpected file type (expected P)");
|
|
}
|
|
|
|
switch (m_strm.getByte()) {
|
|
case 'f':
|
|
m_type = CV_32FC1;
|
|
break;
|
|
case 'F':
|
|
m_type = CV_32FC3;
|
|
break;
|
|
default:
|
|
CV_Error(Error::StsError, "Unexpected file type (expected `f` or `F`)");
|
|
}
|
|
|
|
if ('\n' != m_strm.getByte()) {
|
|
CV_Error(Error::StsError, "Unexpected header format (expected line break)");
|
|
}
|
|
|
|
|
|
m_width = read_number<int>(m_strm);
|
|
m_height = read_number<int>(m_strm);
|
|
m_scale_factor = read_number<double>(m_strm);
|
|
m_swap_byte_order = is_byte_order_swapped(m_scale_factor);
|
|
|
|
return true;
|
|
}
|
|
|
|
bool PFMDecoder::readData(Mat& mat)
|
|
{
|
|
if (!m_strm.isOpened()) {
|
|
CV_Error(Error::StsError, "Unexpected status in data stream");
|
|
}
|
|
|
|
Mat buffer(mat.size(), m_type);
|
|
for (int y = m_height - 1; y >= 0; --y) {
|
|
m_strm.getBytes(buffer.ptr(y), static_cast<int>(m_width * buffer.elemSize()));
|
|
if (is_byte_order_swapped(m_scale_factor)) {
|
|
for (int i = 0; i < m_width * buffer.channels(); ++i) {
|
|
static_assert( sizeof(uint32_t) == sizeof(float),
|
|
"uint32_t and float must have same size." );
|
|
swap_endianness(buffer.ptr<uint32_t>(y)[i]);
|
|
}
|
|
}
|
|
}
|
|
|
|
if (buffer.channels() == 3 && !m_use_rgb) {
|
|
cv::cvtColor(buffer, buffer, cv::COLOR_BGR2RGB);
|
|
}
|
|
|
|
CV_Assert(fabs(m_scale_factor) > 0.0f);
|
|
buffer *= 1.f / fabs(m_scale_factor);
|
|
|
|
buffer.convertTo(mat, mat.type());
|
|
|
|
return true;
|
|
}
|
|
|
|
size_t PFMDecoder::signatureLength() const
|
|
{
|
|
return 3;
|
|
}
|
|
|
|
bool PFMDecoder::checkSignature( const String& signature ) const
|
|
{
|
|
return signature.size() >= 3
|
|
&& signature[0] == 'P'
|
|
&& ( signature[1] == 'f' || signature[1] == 'F' )
|
|
&& isspace(signature[2]);
|
|
}
|
|
|
|
void PFMDecoder::close()
|
|
{
|
|
// noop
|
|
}
|
|
|
|
//////////////////////////////////////////////////////////////////////////////////////////
|
|
|
|
PFMEncoder::PFMEncoder()
|
|
{
|
|
m_description = "Portable image format - float (*.pfm)";
|
|
}
|
|
|
|
PFMEncoder::~PFMEncoder()
|
|
{
|
|
}
|
|
|
|
bool PFMEncoder::isFormatSupported(int depth) const
|
|
{
|
|
// any depth will be converted into 32-bit float.
|
|
CV_UNUSED(depth);
|
|
return true;
|
|
}
|
|
|
|
bool PFMEncoder::write(const Mat& img, const std::vector<int>& params)
|
|
{
|
|
CV_UNUSED(params);
|
|
|
|
WLByteStream strm;
|
|
if (m_buf) {
|
|
if (!strm.open(*m_buf)) {
|
|
return false;
|
|
} else {
|
|
m_buf->reserve(alignSize(256 + sizeof(float) * img.channels() * img.total(), 256));
|
|
}
|
|
} else if (!strm.open(m_filename)) {
|
|
return false;
|
|
}
|
|
|
|
Mat float_img;
|
|
strm.putByte('P');
|
|
switch (img.channels()) {
|
|
case 1:
|
|
strm.putByte('f');
|
|
img.convertTo(float_img, CV_32FC1);
|
|
break;
|
|
case 3:
|
|
strm.putByte('F');
|
|
img.convertTo(float_img, CV_32FC3);
|
|
break;
|
|
default:
|
|
CV_Error(Error::StsBadArg, "Expected 1 or 3 channel image.");
|
|
}
|
|
strm.putByte('\n');
|
|
|
|
|
|
write_anything(strm, float_img.cols);
|
|
strm.putByte(' ');
|
|
write_anything(strm, float_img.rows);
|
|
strm.putByte('\n');
|
|
#ifdef WORDS_BIGENDIAN
|
|
write_anything(strm, 1.0);
|
|
#else
|
|
write_anything(strm, -1.0);
|
|
#endif
|
|
|
|
strm.putByte('\n');
|
|
|
|
// Comments are not officially supported in this file format.
|
|
// write_anything(strm, "# Generated by OpenCV " CV_VERSION "\n");
|
|
|
|
for (int y = float_img.rows - 1; y >= 0; --y)
|
|
{
|
|
if (float_img.channels() == 3) {
|
|
const float* bgr_row = float_img.ptr<float>(y);
|
|
size_t row_size = float_img.cols * float_img.channels();
|
|
std::vector<float> rgb_row(row_size);
|
|
for (int x = 0; x < float_img.cols; ++x) {
|
|
rgb_row[x*3+0] = bgr_row[x*3+2];
|
|
rgb_row[x*3+1] = bgr_row[x*3+1];
|
|
rgb_row[x*3+2] = bgr_row[x*3+0];
|
|
}
|
|
strm.putBytes( reinterpret_cast<const uchar*>(rgb_row.data()),
|
|
static_cast<int>(sizeof(float) * row_size) );
|
|
} else if (float_img.channels() == 1) {
|
|
strm.putBytes(float_img.ptr(y), sizeof(float) * float_img.cols);
|
|
}
|
|
}
|
|
return true;
|
|
}
|
|
|
|
|
|
}
|
|
|
|
|
|
#endif // HAVE_IMGCODEC_PFM
|