1 /******************************************************************************
2 *
3 * Copyright 2022 Google LLC
4 *
5 * Licensed under the Apache License, Version 2.0 (the "License");
6 * you may not use this file except in compliance with the License.
7 * You may obtain a copy of the License at:
8 *
9 * http://www.apache.org/licenses/LICENSE-2.0
10 *
11 * Unless required by applicable law or agreed to in writing, software
12 * distributed under the License is distributed on an "AS IS" BASIS,
13 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14 * See the License for the specific language governing permissions and
15 * limitations under the License.
16 *
17 ******************************************************************************/
18
19 #if __ARM_FEATURE_SIMD32
20
21 #include <arm_acle.h>
22
/**
 * Pack two halfword pairs with a single `pkhbt` instruction.
 *
 * a, b            Packed 16-bit pairs, each passed in a general-purpose
 *                 register as the first and second source operand
 * return          Value of the destination register written by `pkhbt`
 *
 * The portable definition in the `#else` branch of this file spells out the
 * intended result: bits [15:0] come from `a`, bits [31:16] come from `b`.
 */
static inline int16x2_t __pkhbt(int16x2_t a, int16x2_t b)
{
    int16x2_t packed;

    __asm("pkhbt %0, %1, %2"
        : "=r" (packed)
        : "r" (a), "r" (b));

    return packed;
}
29
30 #else
31
32 #include <stdint.h>
33
/**
 * Portable stand-ins for the SIMD32 helpers, compiled when
 * `__ARM_FEATURE_SIMD32` is not set.
 *
 * A packed pair keeps one signed 16-bit lane in bits [15:0] (bottom) and
 * another in bits [31:16] (top) of a 32-bit word.
 */
typedef int32_t int16x2_t;

/**
 * Sign-extended bottom lane (bits [15:0]) of a packed pair.
 *
 * The xor/subtract form sign-extends without relying on
 * implementation-defined narrowing conversions.
 */
static inline int32_t int16x2_lo(int16x2_t v)
{
    return (int32_t)(((uint32_t)v & 0xffffu) ^ 0x8000u) - 0x8000;
}

/**
 * Sign-extended top lane (bits [31:16]) of a packed pair.
 *
 * The shift is done on the unsigned bit pattern, so it does not depend on
 * how the compiler right-shifts negative values.
 */
static inline int32_t int16x2_hi(int16x2_t v)
{
    return (int32_t)(((uint32_t)v >> 16) ^ 0x8000u) - 0x8000;
}

/**
 * Pack the bottom lane of `a` with the top lane of `b`.
 *
 * a               Supplies bits [15:0] of the result
 * b               Supplies bits [31:16] of the result
 * return          The combined packed pair
 *
 * `unused` keeps the compiler quiet when this file is included without
 * the function being called.
 */
__attribute__((unused))
static int16x2_t __pkhbt(int16x2_t a, int16x2_t b)
{
    uint32_t packed = ((uint32_t)a & 0x0000ffffu)
                    | ((uint32_t)b & 0xffff0000u);

    /* Bit-pattern reinterpretation (two's-complement conversion) */
    return (int16x2_t)packed;
}

/**
 * Dual 16-bit multiply with 32-bit accumulate.
 *
 * a, b            Packed pairs to multiply lane by lane
 * u               32-bit accumulator
 * return          u + a.top * b.top + a.bottom * b.bottom, wrapped
 *                 modulo 2^32
 *
 * The sum can exceed the `int32_t` range (both lanes at -32768 already give
 * 2^31), so it is accumulated on unsigned values where wrap-around is
 * defined. This matches the wrapping result of the SMLAD instruction; its
 * Q flag side effect is not modelled.
 */
__attribute__((unused))
static int32_t __smlad(int16x2_t a, int16x2_t b, int32_t u)
{
    /* Each product is at most 2^30 in magnitude; the pair needs 64 bits */
    int64_t dot = (int64_t)int16x2_hi(a) * int16x2_hi(b)
                + (int64_t)int16x2_lo(a) * int16x2_lo(b);

    /* Final conversion assumes two's-complement wrap, as in __pkhbt() */
    return (int32_t)((uint32_t)u + (uint32_t)dot);
}

/**
 * Dual 16-bit multiply with 64-bit accumulate.
 *
 * a, b            Packed pairs to multiply lane by lane
 * u               64-bit accumulator
 * return          u + a.top * b.top + a.bottom * b.bottom, wrapped
 *                 modulo 2^64
 *
 * The accumulate is done on unsigned values so that an accumulator close to
 * the `int64_t` limits wraps instead of triggering signed-overflow
 * undefined behaviour.
 */
__attribute__((unused))
static int64_t __smlald(int16x2_t a, int16x2_t b, int64_t u)
{
    int64_t dot = (int64_t)int16x2_hi(a) * int16x2_hi(b)
                + (int64_t)int16x2_lo(a) * int16x2_lo(b);

    return (int64_t)((uint64_t)u + (uint64_t)dot);
}

/**
 * Dual 16-bit multiply with exchanged lanes and 64-bit accumulate.
 *
 * a, b            Packed pairs; the top lane of one is multiplied by the
 *                 bottom lane of the other
 * u               64-bit accumulator
 * return          u + a.top * b.bottom + a.bottom * b.top, wrapped
 *                 modulo 2^64
 *
 * The accumulate is done on unsigned values so that an accumulator close to
 * the `int64_t` limits wraps instead of triggering signed-overflow
 * undefined behaviour.
 */
__attribute__((unused))
static int64_t __smlaldx(int16x2_t a, int16x2_t b, int64_t u)
{
    int64_t cross = (int64_t)int16x2_hi(a) * int16x2_lo(b)
                  + (int64_t)int16x2_lo(a) * int16x2_hi(b);

    return (int64_t)((uint64_t)u + (uint64_t)cross);
}
69
70 #endif /* __ARM_FEATURE_SIMD32 */
71