From 9f4fa671d9abb8d18e438e194759386765bdedcd Mon Sep 17 00:00:00 2001
From: Pavel Krajcevski
Date: Wed, 18 Sep 2013 18:03:44 -0400
Subject: [PATCH] Add a first pass at content aware downscaling.

---
 PVRTCEncoder/src/Image.cpp | 202 +++++++++++++++++++++++++++++++++++++
 PVRTCEncoder/src/Image.h   |  14 +++
 2 files changed, 216 insertions(+)

diff --git a/PVRTCEncoder/src/Image.cpp b/PVRTCEncoder/src/Image.cpp
index 1cc997f..fdb982b 100644
--- a/PVRTCEncoder/src/Image.cpp
+++ b/PVRTCEncoder/src/Image.cpp
@@ -55,12 +55,37 @@
 #include
 #include
 #include
+#include <cmath>
 
 #include "Pixel.h"
 
 #include "Core/include/Image.h"
 #include "IO/include/ImageFile.h"
 
+// Converts a channel value stored with bitDepth bits into a float such that
+// the largest value representable at that depth maps to 1.0.
+//
+// NOTE: bitDepth must be nonzero. With a depth of zero the denominator below
+// is zero and the result is not a finite number.
+static float ConvertChannelToFloat(uint8 channel, uint8 bitDepth) {
+  float denominator = static_cast<float>((1 << bitDepth) - 1);
+  return static_cast<float>(channel) / denominator;
+}
+
+// Converts a normalized float back into a channel value with bitDepth bits.
+// The input is clamped to [0, 1] before scaling so that overshoot (or NaN)
+// cannot wrap around when narrowed to uint8, and the scaled value is rounded
+// to the nearest integer.
+static uint8 ConvertFloatToChannel(float value, uint8 bitDepth) {
+  if(!(value > 0.0f)) {
+    return 0;
+  }
+
+  const float maxValue = static_cast<float>((1 << bitDepth) - 1);
+  const float clamped = (value > 1.0f)? 1.0f : value;
+  return static_cast<uint8>(clamped * maxValue + 0.5f);
+}
+
 namespace PVRTCC {
 
 Image::Image(uint32 height, uint32 width)
@@ -213,6 +238,183 @@ void Image::BilinearUpscale(uint32 xtimes, uint32 ytimes,
   m_Height = newHeight;
 }
 
+// Downscales the image in place by a factor of 2^xtimes horizontally and
+// 2^ytimes vertically. Each output pixel is taken from one source pixel
+// after a single smoothing step of the anisotropic diffusion equation, which
+// diffuses along edges (perpendicular to the intensity gradient) instead of
+// across them.
+//
+// xtimes, ytimes: log2 of the horizontal and vertical reduction factors.
+// wrapMode: currently not consulted; neighbours that fall outside of the
+//   image are resolved by GetPixelIndex as it is called below.
+// bOffsetNewPixels: if true, sample from the middle of each source block
+//   rather than from its first pixel.
+void Image::ContentAwareDownscale(uint32 xtimes, uint32 ytimes,
+                                  EWrapMode wrapMode, bool bOffsetNewPixels) {
+  const uint32 w = GetWidth();
+  const uint32 h = GetHeight();
+
+  const uint32 newWidth = w >> xtimes;
+  const uint32 newHeight = h >> ytimes;
+  const uint32 numDownscaledPixels = newWidth * newHeight;
+
+  Pixel *downscaledPixels = new Pixel[numDownscaledPixels];
+
+  uint8 bitDepth[4];
+  m_Pixels[0].GetBitDepth(bitDepth);
+
+  for(uint32 i = 0; i < numDownscaledPixels; i++) {
+    downscaledPixels[i].ChangeBitDepth(bitDepth);
+  }
+
+  // Allocate a single buffer and carve it into 19 planes of w*h floats:
+  // the intensity, its x and y derivatives, and the per-channel first and
+  // second derivatives.
+  const uint32 planeSize = w * h;
+  float *imgData = new float[19 * planeSize];
+  float *I = imgData;
+  // Ix[0..3] are the per-channel x derivatives, Ix[4] is that of I.
+  float *Ix[5] = {
+    imgData + planeSize,
+    imgData + (2 * planeSize),
+    imgData + (3 * planeSize),
+    imgData + (4 * planeSize),
+    imgData + (18 * planeSize),
+  };
+  float *Iy = imgData + (5 * planeSize);
+  float *Ixx[4] = {
+    imgData + (6 * planeSize),
+    imgData + (7 * planeSize),
+    imgData + (8 * planeSize),
+    imgData + (9 * planeSize)
+  };
+  float *Iyy[4] = {
+    imgData + (10 * planeSize),
+    imgData + (11 * planeSize),
+    imgData + (12 * planeSize),
+    imgData + (13 * planeSize)
+  };
+  float *Ixy[4] = {
+    imgData + (14 * planeSize),
+    imgData + (15 * planeSize),
+    imgData + (16 * planeSize),
+    imgData + (17 * planeSize)
+  };
+
+  // Then, compute the intensity of the image
+  for(uint32 i = 0; i < planeSize; i++) {
+    // First convert the pixel values to floats using
+    // premultiplied alpha...
+    float a = ConvertChannelToFloat(m_Pixels[i].A(), bitDepth[0]);
+    float r = a * ConvertChannelToFloat(m_Pixels[i].R(), bitDepth[1]);
+    float g = a * ConvertChannelToFloat(m_Pixels[i].G(), bitDepth[2]);
+    float b = a * ConvertChannelToFloat(m_Pixels[i].B(), bitDepth[3]);
+
+    I[i] = r * 0.21 + g * 0.71 + b * 0.07;
+  }
+
+  // Use central differences to calculate Ix, Iy, Ixx, Iyy...
+  for(uint32 j = 0; j < h; j++) {
+    for(uint32 i = 0; i < w; i++) {
+      uint32 hm2xidx = GetPixelIndex(i-2, j);
+      uint32 hm1xidx = GetPixelIndex(i-1, j);
+      uint32 hp1xidx = GetPixelIndex(i+1, j);
+      uint32 hp2xidx = GetPixelIndex(i+2, j);
+
+      uint32 hm2yidx = GetPixelIndex(i, j-2);
+      uint32 hm1yidx = GetPixelIndex(i, j-1);
+      uint32 hp1yidx = GetPixelIndex(i, j+1);
+      uint32 hp2yidx = GetPixelIndex(i, j+2);
+
+      uint32 idx = GetPixelIndex(i, j);
+      Ix[4][idx] = (I[hm2xidx] - 8*I[hm1xidx] + 8*I[hp1xidx] - I[hp2xidx]) / 12.0f;
+      Iy[idx] = (I[hm2yidx] - 8*I[hm1yidx] + 8*I[hp1yidx] - I[hp2yidx]) / 12.0f;
+
+      for(uint32 c = 0; c <= 3; c++) {
+        #define CPNT(dx) ConvertChannelToFloat(m_Pixels[dx].Component(c), bitDepth[c])
+        Ix[c][idx] = (CPNT(hm2xidx) - 8*CPNT(hm1xidx) + 8*CPNT(hp1xidx) - CPNT(hp2xidx)) / 12.0f;
+        Ixx[c][idx] = (-CPNT(hm2xidx) + 16*CPNT(hm1xidx) - 30*CPNT(idx) + 16*CPNT(hp1xidx) - CPNT(hp2xidx)) / 12.0f;
+        Iyy[c][idx] = (-CPNT(hm2yidx) + 16*CPNT(hm1yidx) - 30*CPNT(idx) + 16*CPNT(hp1yidx) - CPNT(hp2yidx)) / 12.0f;
+        #undef CPNT
+      }
+    }
+  }
+
+  // Finally, compute Ixy
+  for(uint32 j = 0; j < h; j++) {
+    for(uint32 i = 0; i < w; i++) {
+      uint32 hm2y = GetPixelIndex(i, j-2);
+      uint32 hm1y = GetPixelIndex(i, j-1);
+      uint32 hp1y = GetPixelIndex(i, j+1);
+      uint32 hp2y = GetPixelIndex(i, j+2);
+
+      uint32 idx = GetPixelIndex(i, j);
+      for(uint32 c = 0; c <= 3; c++) {
+        Ixy[c][idx] = (Ix[c][hm2y] - 8*Ix[c][hm1y] + 8*Ix[c][hp1y] - Ix[c][hp2y]) / 12.0f;
+      }
+    }
+  }
+
+  // Now, for each pixel that we take into consideration, use
+  // a smoothing step that is taken from the anisotropic diffusion
+  // equation:
+  // I_t = (I_x^2 I_yy - 2 I_xy I_x I_y + I_y^2 I_xx) / (I_x^2 + I_y^2)
+  // This is evaluated below as the Laplacian minus the second derivative
+  // along the gradient direction:
+  // I_t = I_xx + I_yy
+  //       - (I_x^2 I_xx + 2 I_xy I_x I_y + I_y^2 I_yy) / (I_x^2 + I_y^2)
+  const uint32 scalex = 1 << xtimes;
+  const uint32 scaley = 1 << ytimes;
+
+  for(uint32 j = 0; j < newHeight; j++) {
+    for(uint32 i = 0; i < newWidth; i++) {
+
+      // Map this new pixel back into the original space...
+      uint32 x = scalex * i;
+      uint32 y = scaley * j;
+
+      if(bOffsetNewPixels) {
+        x += scalex >> 1;
+        y += scaley >> 1;
+      }
+
+      uint32 idx = GetPixelIndex(x, y);
+      Pixel current = m_Pixels[idx];
+
+      Pixel result;
+      result.ChangeBitDepth(bitDepth);
+
+      float Ixsq = Ix[4][idx] * Ix[4][idx];
+      float Iysq = Iy[idx] * Iy[idx];
+      float denom = Ixsq + Iysq;
+
+      for(uint32 c = 0; c < 4; c++) {
+        float I0 = ConvertChannelToFloat(current.Component(c), bitDepth[c]);
+        float It = Ixx[c][idx] + Iyy[c][idx];
+        // In flat regions the gradient direction is undefined, so fall back
+        // to plain (isotropic) diffusion there.
+        if(fabs(denom) > 1e-6) {
+          It -= (Ixsq*Ixx[c][idx] +
+                 2*Ix[4][idx]*Iy[idx]*Ixy[c][idx] +
+                 Iysq*Iyy[c][idx]) / denom;
+        }
+        result.Component(c) = ConvertFloatToChannel(I0 + 0.25f*It, bitDepth[c]);
+      }
+
+      // Rows of the downscaled image are newWidth pixels long.
+      downscaledPixels[j * newWidth + i] = result;
+    }
+  }
+
+  // m_Pixels holds an array (see the new[] above), so use the array delete.
+  delete [] m_Pixels;
+  m_Pixels = downscaledPixels;
+  m_Width = newWidth;
+  m_Height = newHeight;
+
+  delete [] imgData;
+}
+
 void Image::ChangeBitDepth(const uint8 (&depths)[4]) {
   for(uint32 j = 0; j < GetHeight(); j++) {
     for(uint32 i = 0; i < GetWidth(); i++) {
diff --git a/PVRTCEncoder/src/Image.h b/PVRTCEncoder/src/Image.h
index e7b35e6..a87f95f 100644
--- a/PVRTCEncoder/src/Image.h
+++ b/PVRTCEncoder/src/Image.h
@@ -70,6 +70,20 @@ class Image {
 
   void BilinearUpscale(uint32 xtimes, uint32 ytimes,
                        EWrapMode wrapMode = eWrapMode_Wrap);
+
+  // Downscales the image by taking an anisotropic diffusion approach
+  // with respect to the gradient of the intensity. In this way, we can
+  // preserve the most important image structures by not blurring across
+  // edge boundaries, which when upscaled will retain the structural
+  // image quality...
+  //
+  // The width is divided by 2^xtimes and the height by 2^ytimes. If
+  // bOffsetNewPixels is set, each new pixel is sampled from the middle of
+  // the block of old pixels that it replaces instead of from its first pixel.
+  void ContentAwareDownscale(uint32 xtimes, uint32 ytimes,
+                             EWrapMode wrapMode = eWrapMode_Wrap,
+                             bool bOffsetNewPixels = false);
+
   void ChangeBitDepth(const uint8 (&depths)[4]);
   void ExpandTo8888();