/* * The ManaPlus Client * Copyright (C) 2011-2016 The ManaPlus Developers * * This file is part of The ManaPlus Client. * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program. If not, see . */ std::vector::const_iterator it_end = mColors.end(); const size_t sz = mColors.size(); if (!sz || !pixels) return; if (sz % 2) -- it_end; const int mod = bufSize % 4; const int bufEnd = bufSize - mod; for (int ptr = 0; ptr < bufEnd; ptr += 4) { // __m128i base = _mm_load_si128(reinterpret_cast<__m128i*>(pixels)); __m128i base = _mm_loadu_si128(reinterpret_cast<__m128i*>( &pixels[ptr])); std::vector::const_iterator it = mColors.begin(); while (it != it_end) { const DyeColor &col = *it; ++ it; const DyeColor &col2 = *it; __m128i newMask = _mm_set1_epi32(col2.valueA); __m128i cmpMask = _mm_set1_epi32(col.valueA); __m128i cmpRes = _mm_cmpeq_epi32(base, cmpMask); __m128i srcAnd = _mm_andnot_si128(cmpRes, base); __m128i dstAnd = _mm_and_si128(cmpRes, newMask); base = _mm_or_si128(srcAnd, dstAnd); ++ it; } // _mm_store_si128(reinterpret_cast<__m128i*>(pixels), base); _mm_storeu_si128(reinterpret_cast<__m128i*>(&pixels[ptr]), base); } // complete end without simd for (int ptr = bufSize - mod; ptr < bufSize; ptr ++) { uint8_t *const p = reinterpret_cast(&pixels[ptr]); const unsigned int data = pixels[ptr]; std::vector::const_iterator it = mColors.begin(); while (it != it_end) { const DyeColor &col = *it; ++ it; const DyeColor &col2 = *it; const unsigned int coldata = (col.value[3]) | (col.value[2] << 8U) | (col.value[1] << 16U) | (col.value[0] << 24U); if (data == coldata) { p[3] = col2.value[0]; p[2] = col2.value[1]; p[1] = col2.value[2]; p[0] = col2.value[3]; break; } ++ it; } }