/* * Copyright 2017 Google Inc. * * Use of this source code is governed by a BSD-style license that can be * found in the LICENSE file. */ #ifndef SkUtils_opts_DEFINED #define SkUtils_opts_DEFINED #include #include "src/base/SkVx.h" namespace SK_OPTS_NS { template static void memsetT(T buffer[], T value, int count) { #if defined(SK_CPU_SSE_LEVEL) && SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_AVX static constexpr int VecSize = 32 / sizeof(T); #else static constexpr int VecSize = 16 / sizeof(T); #endif static_assert(VecSize > 0, "T is too big for memsetT"); // Create an vectorized version of value skvx::Vec wideValue(value); while (count >= VecSize) { // Copy the value into the destination buffer (VecSize elements at a time) wideValue.store(buffer); buffer += VecSize; count -= VecSize; } // If count was not an even multiple of VecSize, take care of the last few. while (count-- > 0) { *buffer++ = value; } } /*not static*/ inline void memset16(uint16_t buffer[], uint16_t value, int count) { memsetT(buffer, value, count); } /*not static*/ inline void memset32(uint32_t buffer[], uint32_t value, int count) { memsetT(buffer, value, count); } /*not static*/ inline void memset64(uint64_t buffer[], uint64_t value, int count) { memsetT(buffer, value, count); } template static void rect_memsetT(T buffer[], T value, int count, size_t rowBytes, int height) { while (height --> 0) { memsetT(buffer, value, count); buffer = (T*)((char*)buffer + rowBytes); } } /*not static*/ inline void rect_memset16(uint16_t buffer[], uint16_t value, int count, size_t rowBytes, int height) { rect_memsetT(buffer, value, count, rowBytes, height); } /*not static*/ inline void rect_memset32(uint32_t buffer[], uint32_t value, int count, size_t rowBytes, int height) { rect_memsetT(buffer, value, count, rowBytes, height); } /*not static*/ inline void rect_memset64(uint64_t buffer[], uint64_t value, int count, size_t rowBytes, int height) { rect_memsetT(buffer, value, count, rowBytes, height); } } // namespace SK_OPTS_NS #endif//SkUtils_opts_DEFINED