#include "traster.h"
#include "trastercm.h"
#include "tpalette.h"
#include "tcolorstyles.h"
//#include "trop.h"
#include "tropcm.h"
#include "tpixelutils.h"
#include <memory>
//------------------------------------------------------------------------------
namespace
{
//------------------------------------------------------------------------------
template <class PIXOUT, class PIXIN>
void doConvolve_row_9_i(PIXOUT *pixout, int n, PIXIN *pixarr[], long w[])
{
long w1, w2, w3, w4, w5, w6, w7, w8, w9;
PIXIN *p1, *p2, *p3, *p4, *p5, *p6, *p7, *p8, *p9;
w1 = w[0];
w2 = w[1];
w3 = w[2];
w4 = w[3];
w5 = w[4];
w6 = w[5];
w7 = w[6];
w8 = w[7];
w9 = w[8];
p1 = pixarr[0];
p2 = pixarr[1];
p3 = pixarr[2];
p4 = pixarr[3];
p5 = pixarr[4];
p6 = pixarr[5];
p7 = pixarr[6];
p8 = pixarr[7];
p9 = pixarr[8];
int rightShift = 16 + ((int)sizeof(typename PIXIN::Channel) - (int)sizeof(typename PIXOUT::Channel)) * 8;
while (n-- > 0) {
pixout->r = (typename PIXOUT::Channel)((p1->r * w1 + p2->r * w2 + p3->r * w3 +
p4->r * w4 + p5->r * w5 + p6->r * w6 +
p7->r * w7 + p8->r * w8 + p9->r * w9 + (1 << 15)) >>
rightShift);
pixout->g = (typename PIXOUT::Channel)((p1->g * w1 + p2->g * w2 + p3->g * w3 +
p4->g * w4 + p5->g * w5 + p6->g * w6 +
p7->g * w7 + p8->g * w8 + p9->g * w9 + (1 << 15)) >>
rightShift);
pixout->b = (typename PIXOUT::Channel)((p1->b * w1 + p2->b * w2 + p3->b * w3 +
p4->b * w4 + p5->b * w5 + p6->b * w6 +
p7->b * w7 + p8->b * w8 + p9->b * w9 + (1 << 15)) >>
rightShift);
pixout->m = (typename PIXOUT::Channel)((p1->m * w1 + p2->m * w2 + p3->m * w3 +
p4->m * w4 + p5->m * w5 + p6->m * w6 +
p7->m * w7 + p8->m * w8 + p9->m * w9 + (1 << 15)) >>
rightShift);
p1++;
p2++;
p3++;
p4++;
p5++;
p6++;
p7++;
p8++;
p9++;
pixout++;
}
}
//------------------------------------------------------------------------------
template <class PIXOUT>
void doConvolve_cm32_row_9_i(PIXOUT *pixout, int n,
TPixelCM32 *pixarr[], long w[],
const std::vector<TPixel32> &paints,
const std::vector<TPixel32> &inks)
{
long w1, w2, w3, w4, w5, w6, w7, w8, w9;
TPixelCM32 *p1, *p2, *p3, *p4, *p5, *p6, *p7, *p8, *p9;
TPixel32 val[9];
w1 = w[0];
w2 = w[1];
w3 = w[2];
w4 = w[3];
w5 = w[4];
w6 = w[5];
w7 = w[6];
w8 = w[7];
w9 = w[8];
p1 = pixarr[0];
p2 = pixarr[1];
p3 = pixarr[2];
p4 = pixarr[3];
p5 = pixarr[4];
p6 = pixarr[5];
p7 = pixarr[6];
p8 = pixarr[7];
p9 = pixarr[8];
while (n-- > 0) {
for (int i = 0; i < 9; ++i) {
int tone = p1->getTone();
int paint = p1->getPaint();
int ink = p1->getInk();
if (tone == TPixelCM32::getMaxTone())
val[i] = paints[paint];
else if (tone == 0)
val[i] = inks[ink];
else
val[i] = blend(inks[ink], paints[paint], tone, TPixelCM32::getMaxTone());
}
pixout->r = (typename PIXOUT::Channel)((val[1].r * w1 + val[2].r * w2 + val[3].r * w3 +
val[4].r * w4 + val[5].r * w5 + val[6].r * w6 +
val[7].r * w7 + val[8].r * w8 + val[9].r * w9 + (1 << 15)) >>
16);
pixout->g = (typename PIXOUT::Channel)((val[1].g * w1 + val[2].g * w2 + val[3].g * w3 +
val[4].g * w4 + val[5].g * w5 + val[6].g * w6 +
val[7].g * w7 + val[8].g * w8 + val[9].g * w9 + (1 << 15)) >>
16);
pixout->b = (typename PIXOUT::Channel)((val[1].b * w1 + val[2].b * w2 + val[3].b * w3 +
val[4].b * w4 + val[5].b * w5 + val[6].b * w6 +
val[7].b * w7 + val[8].b * w8 + val[9].b * w9 + (1 << 15)) >>
16);
pixout->m = (typename PIXOUT::Channel)((val[1].m * w1 + val[2].m * w2 + val[3].m * w3 +
val[4].m * w4 + val[5].m * w5 + val[6].m * w6 +
val[7].m * w7 + val[8].m * w8 + val[9].m * w9 + (1 << 15)) >>
16);
p1++;
p2++;
p3++;
p4++;
p5++;
p6++;
p7++;
p8++;
p9++;
pixout++;
}
}
//------------------------------------------------------------------------------
template <class PIXOUT, class PIXIN>
void doConvolve_row_i(PIXOUT *pixout, int n,
PIXIN *pixarr[], long w[], int pixn)
{
long ar, ag, ab, am;
int i;
int rightShift = 16 + ((int)sizeof(typename PIXIN::Channel) - (int)sizeof(typename PIXOUT::Channel)) * 8;
while (n-- > 0) {
ar = ag = ab = am = 0;
for (i = 0; i < pixn; i++) {
ar += pixarr[i]->r * w[i];
ag += pixarr[i]->g * w[i];
ab += pixarr[i]->b * w[i];
am += pixarr[i]->m * w[i];
pixarr[i]++;
}
pixout->r = (typename PIXOUT::Channel)((ar + (1 << 15)) >> rightShift);
pixout->g = (typename PIXOUT::Channel)((ag + (1 << 15)) >> rightShift);
pixout->b = (typename PIXOUT::Channel)((ab + (1 << 15)) >> rightShift);
pixout->m = (typename PIXOUT::Channel)((am + (1 << 15)) >> rightShift);
pixout++;
}
}
//------------------------------------------------------------------------------
template <class PIXOUT>
void doConvolve_cm32_row_i(PIXOUT *pixout, int n,
TPixelCM32 *pixarr[], long w[], int pixn,
const std::vector<TPixel32> &paints,
const std::vector<TPixel32> &inks)
{
long ar, ag, ab, am;
int i;
while (n-- > 0) {
ar = ag = ab = am = 0;
for (i = 0; i < pixn; i++) {
TPixel32 val;
int tone = pixarr[i]->getTone();
int paint = pixarr[i]->getPaint();
int ink = pixarr[i]->getInk();
if (tone == TPixelCM32::getMaxTone())
val = paints[paint];
else if (tone == 0)
val = inks[ink];
else
val = blend(inks[ink], paints[paint], tone, TPixelCM32::getMaxTone());
ar += val.r * w[i];
ag += val.g * w[i];
ab += val.b * w[i];
am += val.m * w[i];
pixarr[i]++;
}
pixout->r = (typename PIXOUT::Channel)((ar + (1 << 15)) >> 16);
pixout->g = (typename PIXOUT::Channel)((ag + (1 << 15)) >> 16);
pixout->b = (typename PIXOUT::Channel)((ab + (1 << 15)) >> 16);
pixout->m = (typename PIXOUT::Channel)((am + (1 << 15)) >> 16);
pixout++;
}
}
//------------------------------------------------------------------------------
template <class PIXOUT, class PIXIN>
void doConvolve_3_i(TRasterPT<PIXOUT> rout,
TRasterPT<PIXIN> rin,
int dx, int dy,
double conv[])
{
PIXIN *bufferin;
PIXOUT *bufferout;
PIXIN *pixin;
PIXOUT *pixout;
PIXIN *pixarr[9];
long w[9];
int pixn;
int wrapin, wrapout;
int x, y, n;
int x1, y1, x2, y2;
int fx1, fy1, fx2, fy2, fx, fy;
rout->clear();
wrapin = rin->getWrap();
wrapout = rout->getWrap();
/* calcolo l'area di output interessata */
x1 = std::max(0, -dx - 1);
y1 = std::max(0, -dy - 1);
x2 = std::min(rout->getLx() - 1, -dx + rin->getLx());
y2 = std::min(rout->getLy() - 1, -dy + rin->getLy());
rin->lock();
rout->lock();
bufferin = rin->pixels();
bufferout = rout->pixels();
for (y = y1; y <= y2; y++) {
fy1 = std::max(-1, -dy - y);
fy2 = std::min(1, -dy + rin->getLy() - 1 - y);
if (fy1 > fy2)
continue;
x = x1;
pixout = bufferout + wrapout * y + x;
pixin = bufferin + wrapin * (y + dy) + (x + dx);
while (x <= x2) {
fx1 = std::max(-1, -dx - x);
fx2 = std::min(1, -dx + rin->getLx() - 1 - x);
if (x > -dx && x < -dx + rin->getLx() - 1)
n = std::min(-dx + rin->getLx() - 1 - x, x2 - x + 1);
else
n = 1;
if (n < 1)
break;
pixn = 0;
for (fy = fy1; fy <= fy2; fy++)
for (fx = fx1; fx <= fx2; fx++) {
pixarr[pixn] = pixin + fy * wrapin + fx;
w[pixn] = (long)(conv[(fy + 1) * 3 + fx + 1] * (1 << 16));
pixn++;
}
if (pixn == 9)
doConvolve_row_9_i<PIXOUT, PIXIN>(pixout, n, pixarr, w);
else
doConvolve_row_i<PIXOUT, PIXIN>(pixout, n, pixarr, w, pixn);
x += n;
pixin += n;
pixout += n;
}
}
rin->unlock();
rout->unlock();
}
//------------------------------------------------------------------------------
template <class PIXOUT, class PIXIN>
void doConvolve_i(TRasterPT<PIXOUT> rout,
TRasterPT<PIXIN> rin,
int dx, int dy,
double conv[], int radius)
{
PIXIN *bufferin;
PIXOUT *bufferout;
PIXIN *pixin;
PIXOUT *pixout;
int radiusSquare = sq(radius);
std::unique_ptr<PIXIN*[]> pixarr(new PIXIN *[radiusSquare]);
std::unique_ptr<long[]> w(new long[radiusSquare]);
int pixn;
int wrapin, wrapout;
int x, y, n;
int x1, y1, x2, y2;
int fx1, fy1, fx2, fy2, fx, fy;
int radius1 = radius / 2;
int radius0 = radius1 - radius + 1;
rout->clear();
wrapin = rin->getWrap();
wrapout = rout->getWrap();
/* calcolo l'area di output interessata */
x1 = std::max(0, -dx - 1);
y1 = std::max(0, -dy - 1);
x2 = std::min(rout->getLx() - 1, -dx + rin->getLx());
y2 = std::min(rout->getLy() - 1, -dy + rin->getLy());
rin->lock();
rout->lock();
bufferin = rin->pixels();
bufferout = rout->pixels();
for (y = y1; y <= y2; y++) {
fy1 = std::max(radius0, -dy - y);
fy2 = std::min(radius1, -dy - y + rin->getLy() - 1);
if (fy1 > fy2)
continue;
x = x1;
pixout = bufferout + wrapout * y + x;
pixin = bufferin + wrapin * (y + dy) + (x + dx);
while (x <= x2) {
fx1 = std::max(radius0, -dx - x);
fx2 = std::min(radius1, -dx - x + rin->getLx() - 1);
if (x > -dx && x < -dx + rin->getLx() - 1)
n = std::min(-dx + rin->getLx() - 1 - x, x2 - x + 1);
else
n = 1;
if (n < 1)
break;
pixn = 0;
for (fy = fy1; fy <= fy2; fy++)
for (fx = fx1; fx <= fx2; fx++) {
pixarr[pixn] = pixin + fy * wrapin + fx;
w[pixn] = (long)(conv[(fy - radius0) * radius + fx - radius0] * (1 << 16));
pixn++;
}
doConvolve_row_i<PIXOUT, PIXIN>(pixout, n, pixarr.get(), w.get(), pixn);
x += n;
pixin += n;
pixout += n;
}
}
rin->unlock();
rout->unlock();
}
//------------------------------------------------------------------------------
template <class PIXOUT>
void doConvolve_cm32_3_i(TRasterPT<PIXOUT> rout,
TRasterCM32P rin,
const TPaletteP &palette,
int dx, int dy,
double conv[])
{
TPixelCM32 *pixin;
PIXOUT *pixout;
TPixelCM32 *pixarr[9];
long w[9];
int pixn;
int wrapin, wrapout;
int x, y, n;
int x1, y1, x2, y2;
int fx1, fy1, fx2, fy2, fx, fy;
rout->clear();
wrapin = rin->getWrap();
wrapout = rout->getWrap();
/* calcolo l'area di output interessata */
x1 = std::max(0, -dx - 1);
y1 = std::max(0, -dy - 1);
x2 = std::min(rout->getLx() - 1, -dx + rin->getLx());
y2 = std::min(rout->getLy() - 1, -dy + rin->getLy());
int colorCount = palette->getStyleCount();
colorCount = std::max({colorCount, TPixelCM32::getMaxInk(), TPixelCM32::getMaxPaint()});
std::vector<TPixel32> paints(colorCount);
std::vector<TPixel32> inks(colorCount);
rin->lock();
rout->lock();
TPixelCM32 *bufferin = rin->pixels();
PIXOUT *bufferout = rout->pixels();
for (int i = 0; i < palette->getStyleCount(); i++)
paints[i] = inks[i] = palette->getStyle(i)->getAverageColor();
for (y = y1; y <= y2; y++) {
fy1 = std::max(-1, -dy - y);
fy2 = std::min(1, -dy + rin->getLy() - 1 - y);
if (fy1 > fy2)
continue;
x = x1;
pixout = bufferout + wrapout * y + x;
pixin = bufferin + wrapin * (y + dy) + (x + dx);
while (x <= x2) {
fx1 = std::max(-1, -dx - x);
fx2 = std::min(1, -dx + rin->getLx() - 1 - x);
if (x > -dx && x < -dx + rin->getLx() - 1)
n = std::min(-dx + rin->getLx() - 1 - x, x2 - x + 1);
else
n = 1;
if (n < 1)
break;
pixn = 0;
for (fy = fy1; fy <= fy2; fy++)
for (fx = fx1; fx <= fx2; fx++) {
pixarr[pixn] = pixin + fy * wrapin + fx;
w[pixn] = (long)(conv[(fy + 1) * 3 + fx + 1] * (1 << 16));
pixn++;
}
if (pixn == 9)
doConvolve_cm32_row_9_i<PIXOUT>(pixout, n, pixarr, w, paints, inks);
else
doConvolve_cm32_row_i<PIXOUT>(pixout, n, pixarr, w, pixn, paints, inks);
x += n;
pixin += n;
pixout += n;
}
}
rin->unlock();
rout->unlock();
}
//------------------------------------------------------------------------------
template <class PIXOUT>
void doConvolve_cm32_i(TRasterPT<PIXOUT> rout,
TRasterCM32P rin,
const TPaletteP &palette,
int dx, int dy,
double conv[], int radius)
{
TPixelCM32 *pixin;
PIXOUT *pixout;
int radiusSquare = sq(radius);
std::unique_ptr<TPixelCM32*[]> pixarr(new TPixelCM32*[radiusSquare]);
std::unique_ptr<long[]> w(new long[radiusSquare]);
int pixn;
int wrapin, wrapout;
int x, y, n;
int x1, y1, x2, y2;
int fx1, fy1, fx2, fy2, fx, fy;
int radius1 = radius / 2;
int radius0 = radius1 - radius + 1;
rout->clear();
wrapin = rin->getWrap();
wrapout = rout->getWrap();
/* calcolo l'area di output interessata */
x1 = std::max(0, -dx - 1);
y1 = std::max(0, -dy - 1);
x2 = std::min(rout->getLx() - 1, -dx + rin->getLx());
y2 = std::min(rout->getLy() - 1, -dy + rin->getLy());
int colorCount = palette->getStyleCount();
colorCount = std::max({colorCount, TPixelCM32::getMaxInk(), TPixelCM32::getMaxPaint()});
std::vector<TPixel32> paints(colorCount);
std::vector<TPixel32> inks(colorCount);
rin->lock();
rout->lock();
TPixelCM32 *bufferin = rin->pixels();
PIXOUT *bufferout = rout->pixels();
for (int i = 0; i < palette->getStyleCount(); i++)
paints[i] = inks[i] = palette->getStyle(i)->getAverageColor();
for (y = y1; y <= y2; y++) {
fy1 = std::max(radius0, -dy - y);
fy2 = std::min(radius1, -dy + rin->getLy() - 1 - y);
if (fy1 > fy2)
continue;
x = x1;
pixout = bufferout + wrapout * y + x;
pixin = bufferin + wrapin * (y + dy) + (x + dx);
while (x <= x2) {
fx1 = std::max(radius0, -dx - x);
fx2 = std::min(radius1, -dx + rin->getLx() - 1 - x);
if (x > -dx && x < -dx + rin->getLx() - 1)
n = std::min(-dx + rin->getLx() - 1 - x, x2 - x + 1);
else
n = 1;
if (n < 1)
break;
pixn = 0;
for (fy = fy1; fy <= fy2; fy++)
for (fx = fx1; fx <= fx2; fx++) {
pixarr[pixn] = pixin + fy * wrapin + fx;
w[pixn] = (long)(conv[(fy - radius0) * radius + fx - radius0] * (1 << 16));
pixn++;
}
doConvolve_cm32_row_i<PIXOUT>(pixout, n, pixarr.get(), w.get(), pixn, paints, inks);
x += n;
pixin += n;
pixout += n;
}
}
rin->unlock();
rout->unlock();
}
} // anonymous namespace
//------------------------------------------------------------------------------
void TRop::convolve_3_i(TRasterP rout, TRasterP rin, int dx, int dy, double conv[])
{
TRaster32P rin32 = rin;
if (rin32) {
TRaster32P rout32 = rout;
if (rout32) {
doConvolve_3_i<TPixel32, TPixel32>(rout32, rin32, dx, dy, conv);
return;
}
TRaster64P rout64 = rout;
if (rout64) {
doConvolve_3_i<TPixel64, TPixel32>(rout64, rin32, dx, dy, conv);
return;
}
} else {
TRaster64P rin64 = rin;
if (rin64) {
TRaster32P rout32 = rout;
if (rout32) {
doConvolve_3_i<TPixel32, TPixel64>(rout32, rin64, dx, dy, conv);
return;
}
TRaster64P rout64 = rout;
if (rout64) {
doConvolve_3_i<TPixel64, TPixel64>(rout64, rin64, dx, dy, conv);
return;
}
}
}
throw TRopException("TRop::convolve_3_i: unsupported pixel type");
}
//------------------------------------------------------------------------------
void TRop::convolve_3_i(TRasterP rout, TRasterCM32P rin, const TPaletteP &palette,
int dx, int dy, double conv[])
{
TRaster32P rout32 = rout;
if (rout32) {
doConvolve_cm32_3_i<TPixel32>(rout32, rin, palette, dx, dy, conv);
return;
}
TRaster64P rout64 = rout;
if (rout64) {
doConvolve_cm32_3_i<TPixel64>(rout64, rin, palette, dx, dy, conv);
return;
}
throw TRopException("TRop::convolve_3_i: unsupported pixel type");
}
//------------------------------------------------------------------------------
void TRop::convolve_i(TRasterP rout, TRasterP rin, int dx, int dy, double conv[], int radius)
{
TRaster32P rin32 = rin;
if (rin32) {
TRaster32P rout32 = rout;
if (rout32) {
doConvolve_i<TPixel32, TPixel32>(rout32, rin32, dx, dy, conv, radius);
return;
}
TRaster64P rout64 = rout;
if (rout64) {
doConvolve_i<TPixel64, TPixel32>(rout64, rin32, dx, dy, conv, radius);
return;
}
} else {
TRaster64P rin64 = rin;
if (rin64) {
TRaster32P rout32 = rout;
if (rout32) {
doConvolve_i<TPixel32, TPixel64>(rout32, rin64, dx, dy, conv, radius);
return;
}
TRaster64P rout64 = rout;
if (rout64) {
doConvolve_i<TPixel64, TPixel64>(rout64, rin64, dx, dy, conv, radius);
return;
}
}
}
throw TRopException("TRop::convolve_i: unsupported pixel type");
}
//------------------------------------------------------------------------------
void TRop::convolve_i(TRasterP rout, TRasterCM32P rin, const TPaletteP &palette,
int dx, int dy, double conv[], int radius)
{
TRaster32P rout32 = rout;
if (rout32) {
doConvolve_cm32_i<TPixel32>(rout32, rin, palette, dx, dy, conv, radius);
return;
}
TRaster64P rout64 = rout;
if (rout64) {
doConvolve_cm32_i<TPixel64>(rout64, rin, palette, dx, dy, conv, radius);
return;
}
throw TRopException("TRop::convolve_i: unsupported pixel type");
}