mirror of https://github.com/bsnes-emu/bsnes.git
191 lines
5.2 KiB
C++
191 lines
5.2 KiB
C++
#ifndef NALL_IMAGE_SCALE_HPP
|
|
#define NALL_IMAGE_SCALE_HPP
|
|
|
|
namespace nall {
|
|
|
|
void image::scale(unsigned outputWidth, unsigned outputHeight, bool linear) {
|
|
if(width == outputWidth && height == outputHeight) return; //no scaling necessary
|
|
if(linear == false) return scaleNearest(outputWidth, outputHeight);
|
|
|
|
if(width == outputWidth ) return scaleLinearHeight(outputHeight);
|
|
if(height == outputHeight) return scaleLinearWidth(outputWidth);
|
|
|
|
//find fastest scaling method, based on number of interpolation operations required
|
|
//magnification usually benefits from two-pass linear interpolation
|
|
//minification usually benefits from one-pass bilinear interpolation
|
|
unsigned d1wh = ((width * outputWidth ) + (outputWidth * outputHeight)) * 1;
|
|
unsigned d1hw = ((height * outputHeight) + (outputWidth * outputHeight)) * 1;
|
|
unsigned d2wh = (outputWidth * outputHeight) * 3;
|
|
|
|
if(d1wh <= d1hw && d1wh <= d2wh) return scaleLinearWidth(outputWidth), scaleLinearHeight(outputHeight);
|
|
if(d1hw <= d2wh) return scaleLinearHeight(outputHeight), scaleLinearWidth(outputWidth);
|
|
return scaleLinear(outputWidth, outputHeight);
|
|
}
|
|
|
|
void image::scaleLinearWidth(unsigned outputWidth) {
|
|
uint8_t* outputData = allocate(outputWidth, height, stride);
|
|
unsigned outputPitch = outputWidth * stride;
|
|
uint64_t xstride = ((uint64_t)(width - 1) << 32) / max(1u, outputWidth - 1);
|
|
|
|
#pragma omp parallel for
|
|
for(unsigned y = 0; y < height; y++) {
|
|
uint64_t xfraction = 0;
|
|
|
|
const uint8_t* sp = data + pitch * y;
|
|
uint8_t* dp = outputData + outputPitch * y;
|
|
|
|
uint64_t a = read(sp);
|
|
uint64_t b = read(sp + stride);
|
|
sp += stride;
|
|
|
|
unsigned x = 0;
|
|
while(true) {
|
|
while(xfraction < 0x100000000 && x++ < outputWidth) {
|
|
write(dp, interpolate4i(a, b, xfraction));
|
|
dp += stride;
|
|
xfraction += xstride;
|
|
}
|
|
if(x >= outputWidth) break;
|
|
|
|
sp += stride;
|
|
a = b;
|
|
b = read(sp);
|
|
xfraction -= 0x100000000;
|
|
}
|
|
}
|
|
|
|
free();
|
|
data = outputData;
|
|
width = outputWidth;
|
|
pitch = outputPitch;
|
|
size = height * pitch;
|
|
}
|
|
|
|
void image::scaleLinearHeight(unsigned outputHeight) {
|
|
uint8_t* outputData = allocate(width, outputHeight, stride);
|
|
uint64_t ystride = ((uint64_t)(height - 1) << 32) / max(1u, outputHeight - 1);
|
|
|
|
#pragma omp parallel for
|
|
for(unsigned x = 0; x < width; x++) {
|
|
uint64_t yfraction = 0;
|
|
|
|
const uint8_t* sp = data + stride * x;
|
|
uint8_t* dp = outputData + stride * x;
|
|
|
|
uint64_t a = read(sp);
|
|
uint64_t b = read(sp + pitch);
|
|
sp += pitch;
|
|
|
|
unsigned y = 0;
|
|
while(true) {
|
|
while(yfraction < 0x100000000 && y++ < outputHeight) {
|
|
write(dp, interpolate4i(a, b, yfraction));
|
|
dp += pitch;
|
|
yfraction += ystride;
|
|
}
|
|
if(y >= outputHeight) break;
|
|
|
|
sp += pitch;
|
|
a = b;
|
|
b = read(sp);
|
|
yfraction -= 0x100000000;
|
|
}
|
|
}
|
|
|
|
free();
|
|
data = outputData;
|
|
height = outputHeight;
|
|
size = height * pitch;
|
|
}
|
|
|
|
void image::scaleLinear(unsigned outputWidth, unsigned outputHeight) {
|
|
uint8_t* outputData = allocate(outputWidth, outputHeight, stride);
|
|
unsigned outputPitch = outputWidth * stride;
|
|
|
|
uint64_t xstride = ((uint64_t)(width - 1) << 32) / max(1u, outputWidth - 1);
|
|
uint64_t ystride = ((uint64_t)(height - 1) << 32) / max(1u, outputHeight - 1);
|
|
|
|
#pragma omp parallel for
|
|
for(unsigned y = 0; y < outputHeight; y++) {
|
|
uint64_t yfraction = ystride * y;
|
|
uint64_t xfraction = 0;
|
|
|
|
const uint8_t* sp = data + pitch * (yfraction >> 32);
|
|
uint8_t* dp = outputData + outputPitch * y;
|
|
|
|
uint64_t a = read(sp);
|
|
uint64_t b = read(sp + stride);
|
|
uint64_t c = read(sp + pitch);
|
|
uint64_t d = read(sp + pitch + stride);
|
|
sp += stride;
|
|
|
|
unsigned x = 0;
|
|
while(true) {
|
|
while(xfraction < 0x100000000 && x++ < outputWidth) {
|
|
write(dp, interpolate4i(a, b, c, d, xfraction, yfraction));
|
|
dp += stride;
|
|
xfraction += xstride;
|
|
}
|
|
if(x >= outputWidth) break;
|
|
|
|
sp += stride;
|
|
a = b;
|
|
c = d;
|
|
b = read(sp);
|
|
d = read(sp + pitch);
|
|
xfraction -= 0x100000000;
|
|
}
|
|
}
|
|
|
|
free();
|
|
data = outputData;
|
|
width = outputWidth;
|
|
height = outputHeight;
|
|
pitch = outputPitch;
|
|
size = height * pitch;
|
|
}
|
|
|
|
void image::scaleNearest(unsigned outputWidth, unsigned outputHeight) {
|
|
uint8_t* outputData = allocate(outputWidth, outputHeight, stride);
|
|
unsigned outputPitch = outputWidth * stride;
|
|
|
|
uint64_t xstride = ((uint64_t)width << 32) / outputWidth;
|
|
uint64_t ystride = ((uint64_t)height << 32) / outputHeight;
|
|
|
|
#pragma omp parallel for
|
|
for(unsigned y = 0; y < outputHeight; y++) {
|
|
uint64_t yfraction = ystride * y;
|
|
uint64_t xfraction = 0;
|
|
|
|
const uint8_t* sp = data + pitch * (yfraction >> 32);
|
|
uint8_t* dp = outputData + outputPitch * y;
|
|
|
|
uint64_t a = read(sp);
|
|
|
|
unsigned x = 0;
|
|
while(true) {
|
|
while(xfraction < 0x100000000 && x++ < outputWidth) {
|
|
write(dp, a);
|
|
dp += stride;
|
|
xfraction += xstride;
|
|
}
|
|
if(x >= outputWidth) break;
|
|
|
|
sp += stride;
|
|
a = read(sp);
|
|
xfraction -= 0x100000000;
|
|
}
|
|
}
|
|
|
|
free();
|
|
data = outputData;
|
|
width = outputWidth;
|
|
height = outputHeight;
|
|
pitch = outputPitch;
|
|
size = height * pitch;
|
|
}
|
|
|
|
}
|
|
|
|
#endif
|