/****************************************************************************** * * Copyright (C) 2015 The Android Open Source Project * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at: * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. * ***************************************************************************** * Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore */ /** ******************************************************************************* * @file * ih264_mem_fns_atom_intr.c * * @brief * Functions used for memory operations * * @author * Ittiam * * @par List of Functions: * * @remarks * None * ******************************************************************************* */ /*****************************************************************************/ /* File Includes */ /*****************************************************************************/ #include <stdio.h> #include <stddef.h> #include <stdlib.h> #include <string.h> #include <assert.h> #include "ih264_typedefs.h" #include "ih264_mem_fns.h" #include <immintrin.h> /** ******************************************************************************* * * @brief * memcpy of a 8,16 or 32 bytes * * @par Description: * Does memcpy of 8bit data from source to destination for 8,16 or 32 number of bytes * * @param[in] pu1_dst * UWORD8 pointer to the destination * * @param[in] pu1_src * UWORD8 pointer to the source * * @param[in] num_bytes * number of bytes to copy * @returns * * @remarks * None * ******************************************************************************* */ void ih264_memcpy_mul_8_ssse3(UWORD8 *pu1_dst, UWORD8 *pu1_src, UWORD32 num_bytes) { int col; for(col = num_bytes; col >= 8; col -= 8) { __m128i src_temp16x8b; src_temp16x8b = _mm_loadl_epi64((__m128i *)(pu1_src)); pu1_src += 8; _mm_storel_epi64((__m128i *)(pu1_dst), src_temp16x8b); pu1_dst += 8; } } /** ******************************************************************************* * * @brief * memset of a 8,16 or 32 bytes * * @par Description: * Does memset of 8bit data for 8,16 or 32 number of bytes * * @param[in] pu1_dst * UWORD8 pointer to the destination * * @param[in] value * UWORD8 value used for memset * * @param[in] num_bytes * number of bytes to set * @returns * * @remarks * None * ******************************************************************************* */ void ih264_memset_mul_8_ssse3(UWORD8 *pu1_dst, UWORD8 value, UWORD32 num_bytes) { int col; __m128i src_temp16x8b; src_temp16x8b = _mm_set1_epi8(value); for(col = num_bytes; col >= 8; col -= 8) { _mm_storel_epi64((__m128i *)(pu1_dst), src_temp16x8b); pu1_dst += 8; } } /** ******************************************************************************* * * @brief * memset of 16bit data of a 8,16 or 32 bytes * * @par Description: * Does memset of 16bit data for 8,16 or 32 number of bytes * * @param[in] pu2_dst * UWORD8 pointer to the destination * * @param[in] value * UWORD16 value used for memset * * @param[in] num_words * number of words to set * @returns * * @remarks * None * ******************************************************************************* */ void ih264_memset_16bit_mul_8_ssse3(UWORD16 *pu2_dst, UWORD16 value, UWORD32 num_words) { int col; __m128i src_temp16x8b; src_temp16x8b = _mm_set1_epi16(value); for(col = num_words; col >= 8; col -= 8) { _mm_storeu_si128((__m128i *)(pu2_dst), src_temp16x8b); pu2_dst += 8; } }