mirror of
https://github.com/cemu-project/Cemu.git
synced 2024-12-29 11:11:51 +01:00
178 lines
4.2 KiB
C
178 lines
4.2 KiB
C
/******************************************************************************
|
|
*
|
|
* Copyright (C) 2015 The Android Open Source Project
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at:
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*
|
|
*****************************************************************************
|
|
* Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore
|
|
*/
|
|
/**
|
|
*******************************************************************************
|
|
* @file
|
|
* ih264_mem_fns_atom_intr.c
|
|
*
|
|
* @brief
|
|
* Functions used for memory operations
|
|
*
|
|
* @author
|
|
* Ittiam
|
|
*
|
|
* @par List of Functions:
*  - ih264_memcpy_mul_8_ssse3
*  - ih264_memset_mul_8_ssse3
*  - ih264_memset_16bit_mul_8_ssse3
|
|
*
|
|
* @remarks
|
|
* None
|
|
*
|
|
*******************************************************************************
|
|
*/
|
|
|
|
/*****************************************************************************/
|
|
/* File Includes */
|
|
/*****************************************************************************/
|
|
#include <stdio.h>
|
|
#include <stddef.h>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include <assert.h>
|
|
|
|
#include "ih264_typedefs.h"
|
|
#include "ih264_mem_fns.h"
|
|
|
|
#include <immintrin.h>
|
|
|
|
/*
 * ATTRIBUTE_SSSE3 is placed in front of the SIMD routines in this file.
 * On compilers that define __GNUC__ it expands to a per-function target
 * attribute requesting SSSE3 code generation for that function only; on any
 * other compiler it expands to nothing.
 */
#if defined(__GNUC__)
#  define ATTRIBUTE_SSSE3 __attribute__((target("ssse3")))
#else
#  define ATTRIBUTE_SSSE3
#endif
|
|
|
|
/**
|
|
*******************************************************************************
|
|
*
|
|
* @brief
|
|
* memcpy of a 8,16 or 32 bytes
|
|
*
|
|
* @par Description:
|
|
* Does memcpy of 8bit data from source to destination for 8,16 or 32 number of bytes
|
|
*
|
|
* @param[in] pu1_dst
|
|
* UWORD8 pointer to the destination
|
|
*
|
|
* @param[in] pu1_src
|
|
* UWORD8 pointer to the source
|
|
*
|
|
* @param[in] num_bytes
|
|
* number of bytes to copy
|
|
* @returns
|
|
*
|
|
* @remarks
|
|
* None
|
|
*
|
|
*******************************************************************************
|
|
*/
|
|
|
|
|
|
|
|
|
|
ATTRIBUTE_SSSE3
|
|
void ih264_memcpy_mul_8_ssse3(UWORD8 *pu1_dst, UWORD8 *pu1_src, UWORD32 num_bytes)
|
|
{
|
|
int col;
|
|
for(col = num_bytes; col >= 8; col -= 8)
|
|
{
|
|
__m128i src_temp16x8b;
|
|
src_temp16x8b = _mm_loadl_epi64((__m128i *)(pu1_src));
|
|
pu1_src += 8;
|
|
_mm_storel_epi64((__m128i *)(pu1_dst), src_temp16x8b);
|
|
pu1_dst += 8;
|
|
}
|
|
}
|
|
|
|
/**
|
|
*******************************************************************************
|
|
*
|
|
* @brief
|
|
* memset of a 8,16 or 32 bytes
|
|
*
|
|
* @par Description:
|
|
* Does memset of 8bit data for 8,16 or 32 number of bytes
|
|
*
|
|
* @param[in] pu1_dst
|
|
* UWORD8 pointer to the destination
|
|
*
|
|
* @param[in] value
|
|
* UWORD8 value used for memset
|
|
*
|
|
* @param[in] num_bytes
|
|
* number of bytes to set
|
|
* @returns
|
|
*
|
|
* @remarks
|
|
* None
|
|
*
|
|
*******************************************************************************
|
|
*/
|
|
|
|
|
|
ATTRIBUTE_SSSE3
|
|
void ih264_memset_mul_8_ssse3(UWORD8 *pu1_dst, UWORD8 value, UWORD32 num_bytes)
|
|
{
|
|
int col;
|
|
__m128i src_temp16x8b;
|
|
src_temp16x8b = _mm_set1_epi8(value);
|
|
for(col = num_bytes; col >= 8; col -= 8)
|
|
{
|
|
_mm_storel_epi64((__m128i *)(pu1_dst), src_temp16x8b);
|
|
pu1_dst += 8;
|
|
}
|
|
}
|
|
|
|
/**
|
|
*******************************************************************************
|
|
*
|
|
* @brief
|
|
* memset of 16bit data of a 8,16 or 32 bytes
|
|
*
|
|
* @par Description:
|
|
* Does memset of 16bit data for 8,16 or 32 number of bytes
|
|
*
|
|
* @param[in] pu2_dst
|
|
* UWORD8 pointer to the destination
|
|
*
|
|
* @param[in] value
|
|
* UWORD16 value used for memset
|
|
*
|
|
* @param[in] num_words
|
|
* number of words to set
|
|
* @returns
|
|
*
|
|
* @remarks
|
|
* None
|
|
*
|
|
*******************************************************************************
|
|
*/
|
|
|
|
|
|
void ih264_memset_16bit_mul_8_ssse3(UWORD16 *pu2_dst, UWORD16 value, UWORD32 num_words)
|
|
{
|
|
int col;
|
|
__m128i src_temp16x8b;
|
|
src_temp16x8b = _mm_set1_epi16(value);
|
|
for(col = num_words; col >= 8; col -= 8)
|
|
{
|
|
_mm_storeu_si128((__m128i *)(pu2_dst), src_temp16x8b);
|
|
pu2_dst += 8;
|
|
}
|
|
}
|
|
|