Blob Blame Raw


#include "quickputP.h"
#include "tpixelutils.h"
#include "trastercm.h"
#include "tsystem.h"
#include "tropcm.h"
#include "tpalette.h"

#ifdef _WIN32
#include <emmintrin.h> // per SSE2
#endif

//-----------------------------------------------------------------------------
namespace
{

// Returns true when the pixel's m channel is zero; the compositing loops in
// this file treat such an "up" pixel as contributing nothing.
inline bool transp(const TPixel32 &p)
{
	return !p.m;
}
// 64-bit pixel overload of the same test.
inline bool transp(const TPixel64 &p)
{
	return !p.m;
}

//-----------------------------------------------------------------------------

// Returns true when the pixel's m channel equals 0xff, i.e. the value the
// compositing loops in this file treat as fully covering for 32-bit pixels.
inline bool opaque(const TPixel32 &p)
{
	return 0xff == p.m;
}
// 64-bit pixel overload: the fully covering value is 0xffff.
inline bool opaque(const TPixel64 &p)
{
	return 0xffff == p.m;
}

//-----------------------------------------------------------------------------

#define MODO2
#define VELOCE
// Composites rup over rdn and stores the result in rout, one row at a time.
// The number of rows comes from rout, the number of pixels per row from rdn.
// For each pixel: a transparent up pixel yields the dn pixel, an opaque up
// pixel yields the up pixel, anything else is blended through overPix().
// MODO1/MODO2 select how the row pointers are obtained; VELOCE selects whether
// the up pixel is read in place or copied into a local first.
template <class T>
void do_overT3(TRasterPT<T> rout, const TRasterPT<T> &rdn, const TRasterPT<T> &rup)
{
	const int rowCount = rout->getLy();
	for (int row = 0; row < rowCount; ++row) {
#if defined(MODO1)
		// Row pointers obtained through the raster accessor.
		const T *below = rdn->pixels(row);
		const T *above = rup->pixels(row);
		T *dest = rout->pixels(row);
#elif defined(MODO2)
		// Row pointers computed by hand from the raw buffer and the wrap.
		const T *below = ((T *)rdn->getRawData()) + row * rdn->getWrap();
		const T *above = ((T *)rup->getRawData()) + row * rup->getWrap();
		T *dest = ((T *)rout->getRawData()) + row * rout->getWrap();
#endif

		const T *const belowEnd = below + rdn->getLx();
		while (below < belowEnd) {
#ifdef VELOCE
			if (transp(*above)) {
				*dest = *below;
			} else if (opaque(*above)) {
				*dest = *above;
			} else {
				*dest = overPix(*below, *above);
			}
#else
			// Variant working on a local copy of the up pixel.
			T top = *above;
			if (transp(top)) {
				*dest = *below;
			} else if (opaque(top)) {
				*dest = top;
			} else {
				*dest = overPix(*below, top);
			}
#endif
			++below;
			++above;
			++dest;
		}
	}
}

//-----------------------------------------------------------------------------

// Masked over: for every pixel, the 8-bit mask decides how much of rup is
// placed over rdn, and the result is written to rout.
//   mask == 0x00 -> the dn pixel is copied unchanged
//   mask == 0xff -> the up pixel is copied unchanged
//   otherwise    -> a copy of the up pixel gets its m channel replaced by the
//                   mask value and is blended over the dn pixel with overPix()
// Rows and columns are counted on rout; row pointers are computed from the raw
// buffer and the wrap of each raster.
template <typename PixTypeOut, typename PixTypeDn, typename PixTypeUp>
void do_over(TRasterPT<PixTypeOut> rout, const TRasterPT<PixTypeDn> &rdn,
			 const TRasterPT<PixTypeUp> &rup, const TRasterGR8P rmask)
{
	// The mask is always 8 bit, while the up pixel may have wider channels
	// (e.g. 16 bit). Rescale the mask to the up pixel's channel range so that
	// a half mask is still a half matte: 255/255 == 1, 65535/255 == 257.
	const UINT upChannelMax = PixTypeUp::maxChannelValue;
	const UINT maskScale = upChannelMax / 0xff;

	for (int y = 0; y < rout->getLy(); y++) {
		const PixTypeDn *dn_pix = ((PixTypeDn *)rdn->getRawData()) + y * rdn->getWrap();
		const PixTypeUp *up_pix = ((PixTypeUp *)rup->getRawData()) + y * rup->getWrap();

		PixTypeOut *out_pix = ((PixTypeOut *)rout->getRawData()) + y * rout->getWrap();
		const TPixelGR8 *mask_pix = ((TPixelGR8 *)rmask->getRawData()) + y * rmask->getWrap();

		const PixTypeDn *dn_limit = dn_pix + rout->getLx();
		for (; dn_pix < dn_limit; dn_pix++, up_pix++, out_pix++, mask_pix++) {
			if (mask_pix->value == 0x00)
				*out_pix = *dn_pix;
			else if (mask_pix->value == 0xff)
				*out_pix = *up_pix;
			else {
				PixTypeUp p(*up_pix);
				// NOTE(review): only the matte is overridden; the colour
				// channels of the up pixel are left as they are - confirm this
				// is the intended blend.
				p.m = mask_pix->value * maskScale;
				*out_pix = overPix(*dn_pix, p);
			}
		}
	}
}

//-----------------------------------------------------------------------------

// In-place over between two colormap rasters of equal size (asserted).
// Per pixel:
//  - if the up pixel is not pure ink and its paint index is non-zero, it
//    replaces the out pixel entirely;
//  - otherwise, unless the up pixel is pure paint, the out pixel keeps its own
//    paint bits, takes the ink bits of the up pixel and the smaller of the
//    two tones;
//  - in every other case the out pixel is left untouched.
void do_over(TRasterCM32P rout, const TRasterCM32P &rup)
{
	assert(rout->getSize() == rup->getSize());

	const int rowCount = rout->getLy();
	for (int row = 0; row < rowCount; ++row) {
		TPixelCM32 *dst = rout->pixels(row);
		TPixelCM32 *const dstEnd = dst + rout->getLx();
		const TPixelCM32 *src = rup->pixels(row);

		for (; dst < dstEnd; ++dst, ++src) {
			if (!src->isPureInk() && src->getPaint() != 0) {
				*dst = *src;
				continue;
			}
			if (src->isPurePaint())
				continue;

			// Work on the packed 32-bit representation of both pixels.
			const TUINT32 srcBits = *(const TUINT32 *)src;
			TUINT32 *dstBits = (TUINT32 *)dst;

			*dstBits = (srcBits & (TPixelCM32::getInkMask())) |
					   ((*dstBits) & (TPixelCM32::getPaintMask())) |
					   tmin(src->getTone(), dst->getTone());
		}
	}
}

//-----------------------------------------------------------------------------

// In-place over of rup onto rout (equal sizes, asserted). T is the pixel type,
// Q the type the clamped colour channels are cast to.
// Per pixel:
//  - up.m == T::maxChannelValue : the up pixel replaces the out pixel;
//  - up.m == 0                  : the out pixel is left untouched;
//  - otherwise each channel becomes up + out * (max - up.m) / max, with the
//    colour channels clamped to max. The division is done in double and the
//    result is truncated when stored.
template <class T, class Q>
void do_overT2(TRasterPT<T> rout, const TRasterPT<T> &rup)
{
	const UINT chanMax = T::maxChannelValue;
	const double chanMaxD = chanMax;

	assert(rout->getSize() == rup->getSize());

	const int rowCount = rout->getLy();
	for (int row = 0; row < rowCount; ++row) {
		T *dst = rout->pixels(row);
		T *const dstEnd = dst + rout->getLx();
		const T *src = rup->pixels(row);

		while (dst < dstEnd) {
			if (src->m == chanMax) {
				*dst = *src;
			} else if (src->m > 0) {
				// Share of the out pixel that remains visible.
				const UINT keep = chanMax - src->m;

				const TUINT32 r = src->r + (dst->r * keep) / chanMaxD;
				const TUINT32 g = src->g + (dst->g * keep) / chanMaxD;
				const TUINT32 b = src->b + (dst->b * keep) / chanMaxD;

				dst->r = static_cast<Q>((r < chanMax) ? r : chanMax);
				dst->g = static_cast<Q>((g < chanMax) ? g : chanMax);
				dst->b = static_cast<Q>((b < chanMax) ? b : chanMax);
				dst->m = src->m + (dst->m * keep) / chanMaxD;
			}
			++dst;
			++src;
		}
	}
}

//-----------------------------------------------------------------------------

#ifdef _WIN32

// SSE2 variant of the in-place 32-bit over: rup is composited onto rout
// (equal sizes, asserted).
// Per pixel:
//  - up.m == 0xff : the up pixel replaces the out pixel;
//  - up.m == 0    : the out pixel is left untouched;
//  - otherwise all four channels are computed at once as
//    min(255, up + out * (255 - up.m) / 255) in packed single precision.
// NOTE(review): the float -> int conversion uses _mm_cvtps_epi32, which rounds
// according to the current SSE rounding mode, so results may differ by one
// from a truncating scalar implementation - confirm this is acceptable.
void do_over_SSE2(TRaster32P rout, const TRaster32P &rup)
{
	const __m128i zeros = _mm_setzero_si128();

	float maxChannelValue = 255.0f;
	const __m128 maxChannelValue_packed = _mm_load1_ps(&maxChannelValue);

	assert(rout->getSize() == rup->getSize());
	for (int y = 0; y < rout->getLy(); y++) {
		TPixel32 *out_pix = rout->pixels(y);
		TPixel32 *const out_end = out_pix + rout->getLx();
		const TPixel32 *up_pix = rup->pixels(y);

		for (; out_pix < out_end; ++out_pix, ++up_pix) {
			if (up_pix->m == 0xff)
				*out_pix = *up_pix;
			else if (up_pix->m > 0) {
				// Share of the out pixel that remains visible, broadcast to
				// the four lanes.
				float factor = (255.0f - up_pix->m) / 255.0f;
				const __m128 factor_packed = _mm_load1_ps(&factor);

				// Load up_pix and out_pix into two 128-bit registers: the four
				// bytes are widened to 16 bit, then to 32 bit, then converted
				// to float.
				__m128i up_pix_packed_i = _mm_unpacklo_epi8(_mm_cvtsi32_si128(*(DWORD *)up_pix), zeros);
				const __m128 up_pix_packed = _mm_cvtepi32_ps(_mm_unpacklo_epi16(up_pix_packed_i, zeros));

				__m128i out_pix_packed_i = _mm_unpacklo_epi8(_mm_cvtsi32_si128(*(DWORD *)out_pix), zeros);
				__m128 out_pix_packed = _mm_cvtepi32_ps(_mm_unpacklo_epi16(out_pix_packed_i, zeros));

				// up + out * factor, clamped to the maximum channel value.
				out_pix_packed = _mm_add_ps(up_pix_packed, _mm_mul_ps(out_pix_packed, factor_packed));
				out_pix_packed = _mm_min_ps(maxChannelValue_packed, out_pix_packed);

				// Back to integers and narrow 32 -> 16 -> 8 bit before storing
				// the four bytes in the out pixel.
				out_pix_packed_i = _mm_cvtps_epi32(out_pix_packed);
				out_pix_packed_i = _mm_packs_epi32(out_pix_packed_i, zeros);
				out_pix_packed_i = _mm_packus_epi16(out_pix_packed_i, zeros);
				*(DWORD *)(out_pix) = _mm_cvtsi128_si32(out_pix_packed_i);
			}
		}
	}
}

#endif

//-----------------------------------------------------------------------------

// Applies an 8-bit raster onto a 32-bit raster of the same size (asserted):
// the red channel of each out pixel is multiplied by value/255 (integer
// arithmetic) and the result is copied to green and blue. The m channel is
// not modified. Rows are visited from the last to the first.
void do_over(TRaster32P rout, const TRasterGR8P &rup)
{
	assert(rout->getSize() == rup->getSize());

	int row = rout->getLy();
	while (row-- > 0) {
		TPixel32 *dst = rout->pixels(row);
		TPixel32 *const dstEnd = dst + rout->getLx();
		const TPixelGR8 *src = rup->pixels(row);

		while (dst < dstEnd) {
			const int gray = src->value;
			dst->r = dst->r * gray / 255;
			dst->g = dst->r;
			dst->b = dst->r;
			++dst;
			++src;
		}
	}
}

//-----------------------------------------------------------------------------

// Composites a 32-bit raster over an 8-bit gray raster of the same size
// (asserted), in place. Each gray out pixel is expanded to a 32-bit pixel with
// r = g = b = value and m = 0xff, the up pixel is blended over it with
// overPix(), and the result is converted back to gray through
// TPixelGR8::from(). Rows are visited from the last to the first.
void do_over(TRasterGR8P rout, const TRaster32P &rup)
{
	assert(rout->getSize() == rup->getSize());

	// Scratch pixel kept on the stack: the previous implementation allocated
	// one with new for every row and never released it.
	TPixel32 temp_pix;
	temp_pix.m = 0xff;

	for (int y = rout->getLy(); --y >= 0;) {
		TPixelGR8 *out_pix = rout->pixels(y);
		TPixelGR8 *const out_end = out_pix + rout->getLx();
		const TPixel32 *up_pix = rup->pixels(y);

		for (; out_pix < out_end; ++out_pix, ++up_pix) {
			temp_pix.r = out_pix->value;
			temp_pix.g = out_pix->value;
			temp_pix.b = out_pix->value;
			const TPixel32 out32_pix = overPix(temp_pix, *up_pix);
			*out_pix = out_pix->from(out32_pix);
		}
	}
}

} // namespace

//-----------------------------------------------------------------------------

// Composites a tinted 8-bit raster over a 32-bit raster of the same size
// (asserted), in place. For each pixel the given color is scaled, channel by
// channel including m, by value/255 and rounded with troundp(); the resulting
// pixel is then blended over the out pixel with overPix(). Rows are visited
// from the last to the first.
void do_over(TRaster32P rout, const TRasterGR8P &rup, const TPixel32 &color)
{
	assert(rout->getSize() == rup->getSize());

	int row = rout->getLy();
	while (row-- > 0) {
		TPixel32 *dst = rout->pixels(row);
		TPixel32 *const dstEnd = dst + rout->getLx();
		const TPixelGR8 *coverage = rup->pixels(row);

		while (dst < dstEnd) {
			const double k = coverage->value / 255.0;
			const TPixel32 tinted(troundp(k * color.r), troundp(k * color.g),
								  troundp(k * color.b), troundp(k * color.m));
			*dst = overPix(*dst, tinted);
			++dst;
			++coverage;
		}
	}
}

//-----------------------------------------------------------------------------

// Composites the 8-bit raster rup, tinted with color, over rout in place.
// rout is locked for the duration of the operation; the actual work is done
// by do_over(rout, rup, color), which asserts that both rasters have the same
// size.
// NOTE(review): rup is not locked here, unlike the rasters in the other
// TRop::over overloads - confirm this is intentional.
void TRop::over(TRaster32P rout, const TRasterGR8P &rup, const TPixel32 &color)
{
	rout->lock();
	do_over(rout, rup, color);
	rout->unlock();
}

//-----------------------------------------------------------------------------

void TRop::over(const TRasterP &rout, const TRasterP &rdn, const TRasterP &rup)
{
	TRect rect = rout->getBounds() * rdn->getBounds() * rup->getBounds();
	if (rect.isEmpty())
		return;

	TRasterP cRout = rout->extract(rect);
	TRasterP cRdn = rdn->extract(rect);
	TRasterP cRup = rup->extract(rect);
	rout->lock();
	rdn->lock();
	rup->lock();
	TRaster32P rout32 = cRout, rdn32 = cRdn, rup32 = cRup;
	TRaster64P rout64 = cRout, rdn64 = cRdn, rup64 = cRup;
	if (rout32 && rdn32 && rup32)
		do_overT3<TPixel32>(rout32, rdn32, rup32);
	else if (rout64 && rdn64 && rup64)
		do_overT3<TPixel64>(rout64, rdn64, rup64);
	else {
		rout->unlock();
		rdn->unlock();
		rup->unlock();
		throw TRopException("unsupported pixel type");
	}

	rout->unlock();
	rdn->unlock();
	rup->unlock();
}

//-----------------------------------------------------------------------------

void TRop::over(const TRasterP &rout, const TRasterP &rup, const TPoint &pos)
{
	TRect outRect(rout->getBounds());
	TRect upRect(rup->getBounds() + pos);
	TRect intersection = outRect * upRect;
	if (intersection.isEmpty())
		return;

	TRasterP cRout = rout->extract(intersection);
	TRect r = intersection - pos;
	TRasterP cRup = rup->extract(r);

	TRaster32P rout32 = cRout, rup32 = cRup;
	TRaster64P rout64 = cRout, rup64 = cRup;

	TRasterGR8P rout8 = cRout, rup8 = cRup;

	TRasterCM32P routCM32 = cRout, rupCM32 = cRup;

	rout->lock();
	rup->lock();

	// TRaster64P rout64 = rout, rin64 = rin;
	if (rout32 && rup32) {
#ifdef _WIN32
		if (TSystem::getCPUExtensions() & TSystem::CpuSupportsSse2)
			do_over_SSE2(rout32, rup32);
		else
#endif
			do_overT2<TPixel32, UCHAR>(rout32, rup32);
	} else if (rout64) {
		if (!rup64) {
			TRaster64P raux(cRup->getSize());
			TRop::convert(raux, cRup);
			rup64 = raux;
		}
		do_overT2<TPixel64, USHORT>(rout64, rup64);
	} else if (rout32 && rup8)
		do_over(rout32, rup8);
	else if (rout8 && rup32)
		do_over(rout8, rup32);
	else if (rout8 && rup8)
		TRop::copy(rout8, rup8);
	else if (routCM32 && rupCM32)
		do_over(routCM32, rupCM32);
	else {
		rout->unlock();
		rup->unlock();
		throw TRopException("unsupported pixel type");
	}

	rout->unlock();
	rup->unlock();
}

//-----------------------------------------------------------------------------

// Replaces every pixel of ras with overPix(col, pixel), i.e. the existing
// pixel blended over the colour col. The raster is locked for the duration of
// the operation; rows are visited from the last to the first.
static void addBackground32(TRaster32P ras, const TPixel32 &col)
{
	ras->lock();
	for (int row = ras->getLy() - 1; row >= 0; --row) {
		TPixel32 *pix = ras->pixels(row);
		TPixel32 *const rowEnd = pix + ras->getLx();
		for (; pix < rowEnd; ++pix)
			*pix = overPix(col, *pix);
	}
	ras->unlock();
}

//-----------------------------------------------------------------------------

// Puts the colour col behind the content of ras. Only 32-bit rasters are
// supported; any other raster type throws
// TRopException("unsupported pixel type").
void TRop::addBackground(TRasterP ras, const TPixel32 &col)
{
	TRaster32P ras32 = ras;
	if (!ras32)
		throw TRopException("unsupported pixel type");

	addBackground32(ras32, col);
}

//===================================================================

// Used by tinylinetest.
// Applies an 8-bit raster onto a 32-bit raster of the same size (asserted):
// the red channel of each out pixel is multiplied by value/255 (integer
// arithmetic) and the result is copied to green and blue. The m channel is
// not modified. Rows are visited from the last to the first.
static void my_do_over(TRaster32P rout, const TRasterGR8P &rup)
{
	assert(rout->getSize() == rup->getSize());

	int row = rout->getLy();
	while (row-- > 0) {
		TPixel32 *dst = rout->pixels(row);
		TPixel32 *const dstEnd = dst + rout->getLx();
		const TPixelGR8 *src = rup->pixels(row);

		while (dst < dstEnd) {
			const int gray = src->value;
			dst->r = dst->r * gray / 255;
			dst->g = dst->r;
			dst->b = dst->r;
			++dst;
			++src;
		}
	}
}

//===================================================================

void TRop::over(const TRasterP &out,
				const TRasterP &up,
				const TAffine &aff,
				ResampleFilterType filterType)
{
	out->lock();
	up->lock();

	if (filterType == ClosestPixel || filterType == Bilinear)
		::quickPut(out, up, aff, filterType);
	else {
		TRect rasterBounds = up->getBounds();
		TRectD dbounds(rasterBounds.x0, rasterBounds.y0, rasterBounds.x1 + 1, rasterBounds.y1 + 1);
		dbounds = aff * dbounds;
		TRect bounds(tfloor(dbounds.x0), tfloor(dbounds.y0), tceil(dbounds.x1) - 1, tceil(dbounds.y1) - 1);
		TRasterP tmp = up->create(bounds.getLx(), bounds.getLy());
		resample(tmp, up, TTranslation(-bounds.x0, -bounds.y0) * aff, filterType);
		over(out, tmp, bounds.getP00());
	}
	out->unlock();
	up->unlock();
}

void TRop::over(const TRasterP &out, const TRasterP &up, const TPoint &pos, const TAffine &aff,
				ResampleFilterType filterType)
{
	if (aff.isIdentity())
		//simple over with offset
		TRop::over(out, up, pos);
	else {
		TRect rasterBounds = up->getBounds();
		TRectD dbounds(rasterBounds.x0, rasterBounds.y0, rasterBounds.x1, rasterBounds.y1);
		dbounds = aff * dbounds;
		TRect bounds(tfloor(dbounds.x0), tfloor(dbounds.y0), tceil(dbounds.x1), tceil(dbounds.y1));
		TRasterP tmp = up->create(bounds.getLx(), bounds.getLy());
		resample(tmp, up, TTranslation(-dbounds.getP00()) * aff, filterType);
		TRop::over(out, tmp, pos);
	}
}

// Composites a colormap raster onto rout: rup is first converted to a
// temporary 32-bit raster of the same size using palette, and that raster is
// then composited at point with the affine aff through the
// (out, up, pos, aff, ...) overload. The filter type is not passed, so that
// overload's default is used.
void TRop::over(TRasterP rout, const TRasterCM32P &rup, TPalette *palette, const TPoint &point, const TAffine &aff)
{
	TRaster32P app(rup->getSize());
	TRop::convert(app, rup, palette);
	TRop::over(rout, app, point, aff);
}

//===================================================================

// Public entry point that forwards to the file-external ::quickPut(), always
// with the ClosestPixel filter; all other arguments are passed through
// unchanged.
void TRop::quickPut(const TRasterP &out,
					const TRasterP &up,
					const TAffine &aff,
					const TPixel32 &colorScale,
					bool doPremultiply, bool whiteTransp, bool firstColumn,
					bool doRasterDarkenBlendedView)
{
	::quickPut(out, up, aff, ClosestPixel, colorScale, doPremultiply, whiteTransp, firstColumn, doRasterDarkenBlendedView);
}

//===================================================================

// Masked over: composites up over dn into out, using the 8-bit mask to decide
// per pixel how much of up is applied (see the masked do_over template).
// Supported combinations: out, dn and up all 32 bit, or all 64 bit. Any other
// combination throws TRopException("unsupported pixel type").
// out, up and dn are locked while the pixels are processed and are always
// unlocked before returning or throwing on an unsupported combination, as in
// the other TRop::over overloads.
// NOTE(review): mask is not locked and the raster sizes are not checked here -
// confirm callers guarantee both.
void TRop::over(const TRasterP &out, const TRasterP &dn, const TRasterP &up, const TRasterGR8P &mask)
{
	out->lock();
	up->lock();
	dn->lock();

	TRaster32P out32 = out;
	TRaster32P dn32 = dn;
	TRaster32P up32 = up;

	bool supported = true;
	if (out32 && dn32 && up32)
		do_over<TPixel32, TPixel32, TPixel32>(out32, dn32, up32, mask);
	else {
		TRaster64P out64 = out;
		TRaster64P dn64 = dn;
		TRaster64P up64 = up;
		if (out64 && dn64 && up64)
			do_over<TPixel64, TPixel64, TPixel64>(out64, dn64, up64, mask);
		else
			supported = false;
	}

	// Release the locks on every path, then report the failure if any.
	out->unlock();
	up->unlock();
	dn->unlock();

	if (!supported)
		throw TRopException("unsupported pixel type");
}