2023-01-18 10:49:58 +01:00

71 lines
1.9 KiB
C

/******************************************************************************
*
* Copyright 2022 Google LLC
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at:
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
******************************************************************************/
#if __ARM_FEATURE_SIMD32
#include <arm_acle.h>
/*
 * Pack two halfwords into one word using the PKHBT instruction, issued
 * through inline assembly.
 *
 * Operand mapping in the asm template: %0 is the result, %1 is `a`,
 * %2 is `b`. The portable definition of __pkhbt in the #else branch of
 * this file performs the same packing in plain C: the low 16 bits of the
 * result come from `a`, the high 16 bits come from `b`.
 */
static inline int16x2_t __pkhbt(int16x2_t a, int16x2_t b)
{
int16x2_t r;
/* "=r" / "r": result and both inputs are placed in general registers. */
__asm("pkhbt %0, %1, %2" : "=r" (r) : "r" (a), "r" (b));
return r;
}
#else
#include <stdint.h>
/* Two signed 16-bit lanes carried in one 32-bit word (portable stand-in). */
typedef int32_t int16x2_t;

/*
 * Portable replacement for the PKHBT packing operation.
 *
 * Builds a word whose bits [15:0] are taken from `a` and whose
 * bits [31:16] are taken from `b`. The masking is done on unsigned
 * values so no signed bit manipulation is involved.
 */
__attribute__((unused))
static int16x2_t __pkhbt(int16x2_t a, int16x2_t b)
{
    const uint32_t low_half_mask  = 0x0000ffffu;
    const uint32_t high_half_mask = 0xffff0000u;

    const uint32_t packed = ((uint32_t)b & high_half_mask)
                          | ((uint32_t)a & low_half_mask);

    return (int16x2_t)packed;
}
/*
 * Portable replacement for the SMLAD dual 16-bit multiply-accumulate.
 *
 * Treats `a` and `b` as pairs of signed 16-bit lanes and returns
 *     u + a.hi * b.hi + a.lo * b.lo
 * reduced modulo 2^32.
 *
 * Each product fits in 32 bits (magnitude at most 2^30), but the sum of
 * the two products and `u` may not: for example a = b = 0x80008000 gives
 * 2^30 + 2^30. Adding them as signed `int` would be undefined behaviour,
 * so the accumulation is carried out in uint32_t, where wraparound is
 * well defined, and converted back at the end.
 *
 * NOTE: the hardware instruction also reports accumulate overflow through
 * the Q status flag; this emulation has no flag to set.
 */
__attribute__((unused))
static int32_t __smlad(int16x2_t a, int16x2_t b, int32_t u)
{
    const int16_t a_hi = (int16_t)(a >> 16), a_lo = (int16_t)(a & 0xffff);
    const int16_t b_hi = (int16_t)(b >> 16), b_lo = (int16_t)(b & 0xffff);

    /* int16 * int16 is computed in int and cannot overflow. */
    uint32_t acc = (uint32_t)u;
    acc += (uint32_t)(a_hi * b_hi);
    acc += (uint32_t)(a_lo * b_lo);

    return (int32_t)acc;
}
/*
 * Portable replacement for the SMLALD dual 16-bit multiply with 64-bit
 * accumulate.
 *
 * Treats `a` and `b` as pairs of signed 16-bit lanes and returns
 *     u + a.hi * b.hi + a.lo * b.lo
 * with the running sum held in 64 bits.
 */
__attribute__((unused))
static int64_t __smlald(int16x2_t a, int16x2_t b, int64_t u)
{
    /* Unpack the upper and lower signed lanes of each operand. */
    const int16_t a_top = (int16_t)(a >> 16);
    const int16_t a_bot = (int16_t)(a & 0xffff);
    const int16_t b_top = (int16_t)(b >> 16);
    const int16_t b_bot = (int16_t)(b & 0xffff);

    /* Same-lane products, added to the accumulator top lane first. */
    int64_t acc = u;
    acc += a_top * b_top;
    acc += a_bot * b_bot;

    return acc;
}
/*
 * Portable replacement for the SMLALDX cross-lane dual 16-bit multiply
 * with 64-bit accumulate.
 *
 * Treats `a` and `b` as pairs of signed 16-bit lanes and returns
 *     u + a.hi * b.lo + a.lo * b.hi
 * i.e. each lane of `a` is multiplied by the opposite lane of `b`.
 */
__attribute__((unused))
static int64_t __smlaldx(int16x2_t a, int16x2_t b, int64_t u)
{
    /* Unpack the upper and lower signed lanes of each operand. */
    const int16_t a_top = (int16_t)(a >> 16);
    const int16_t a_bot = (int16_t)(a & 0xffff);
    const int16_t b_top = (int16_t)(b >> 16);
    const int16_t b_bot = (int16_t)(b & 0xffff);

    /* Crossed products: top of `a` with bottom of `b`, then the reverse. */
    int64_t acc = u;
    acc += a_top * b_bot;
    acc += a_bot * b_top;

    return acc;
}
#endif /* __ARM_FEATURE_SIMD32 */