|
|
|
@ -144,21 +144,11 @@ bmcr_alpha_blend_single:
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
case BM_TRANSPARENT: {
|
|
|
|
|
/* Make the current colour a bit more black, so it looks like this image is transparent.
|
|
|
|
|
* rgb = rgb * ((256/4) * 4 - (alpha/4)) / ((256/4) * 4)
|
|
|
|
|
*/
|
|
|
|
|
/* Make the current colour a bit more black, so it looks like this image is transparent. */
|
|
|
|
|
for (uint x = (uint) bp->width / 2; x > 0; x--) {
|
|
|
|
|
__m128i srcABCD = _mm_loadl_epi64((const __m128i*) src);
|
|
|
|
|
__m128i dstABCD = _mm_loadl_epi64((__m128i*) dst);
|
|
|
|
|
__m128i srcAB = _mm_unpacklo_epi8(srcABCD, _mm_setzero_si128());
|
|
|
|
|
__m128i dstAB = _mm_unpacklo_epi8(dstABCD, _mm_setzero_si128());
|
|
|
|
|
__m128i alphaAB = _mm_shufflelo_epi16(srcAB, 0x3F);
|
|
|
|
|
alphaAB = _mm_shufflehi_epi16(alphaAB, 0x3F);
|
|
|
|
|
alphaAB = _mm_srli_epi16(alphaAB, 2); // Reduce to 64 levels of shades so the max value fits in 16 bits.
|
|
|
|
|
__m128i nom = _mm_sub_epi16(tr_nom_base, alphaAB);
|
|
|
|
|
dstAB = _mm_mullo_epi16(dstAB, nom);
|
|
|
|
|
dstAB = _mm_srli_epi16(dstAB, 8);
|
|
|
|
|
dstAB = _mm_packus_epi16(dstAB, dstAB);
|
|
|
|
|
DARKEN_2();
|
|
|
|
|
_mm_storel_epi64((__m128i *) dst, dstAB);
|
|
|
|
|
src += 2;
|
|
|
|
|
dst += 2;
|
|
|
|
@ -166,15 +156,7 @@ bmcr_alpha_blend_single:
|
|
|
|
|
if (bp->width & 1) {
|
|
|
|
|
__m128i srcABCD = _mm_cvtsi32_si128(src->data);
|
|
|
|
|
__m128i dstABCD = _mm_cvtsi32_si128(dst->data);
|
|
|
|
|
__m128i srcAB = _mm_unpacklo_epi8(srcABCD, _mm_setzero_si128());
|
|
|
|
|
__m128i dstAB = _mm_unpacklo_epi8(dstABCD, _mm_setzero_si128());
|
|
|
|
|
__m128i alphaAB = _mm_shufflelo_epi16(srcAB, 0x3F);
|
|
|
|
|
alphaAB = _mm_shufflehi_epi16(alphaAB, 0x3F);
|
|
|
|
|
alphaAB = _mm_srli_epi16(alphaAB, 2);
|
|
|
|
|
__m128i nom = _mm_sub_epi16(tr_nom_base, alphaAB);
|
|
|
|
|
dstAB = _mm_mullo_epi16(dstAB, nom);
|
|
|
|
|
dstAB = _mm_srli_epi16(dstAB, 8);
|
|
|
|
|
dstAB = _mm_packus_epi16(dstAB, dstAB);
|
|
|
|
|
DARKEN_2();
|
|
|
|
|
dst->data = _mm_cvtsi128_si32(dstAB);
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|