annotate gcc/config/arm/mmintrin.h @ 111:04ced10e8804

gcc 7
author kono
date Fri, 27 Oct 2017 22:46:09 +0900
parents a06113de4d67
children 84e7813d76e9
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
111
kono
parents: 0
diff changeset
1 /* Copyright (C) 2002-2017 Free Software Foundation, Inc.
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
2
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
3 This file is part of GCC.
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
4
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
5 GCC is free software; you can redistribute it and/or modify it
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
6 under the terms of the GNU General Public License as published
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
7 by the Free Software Foundation; either version 3, or (at your
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
8 option) any later version.
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
9
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
10 GCC is distributed in the hope that it will be useful, but WITHOUT
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
11 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
12 or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
13 License for more details.
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
14
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
15 Under Section 7 of GPL version 3, you are granted additional
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
16 permissions described in the GCC Runtime Library Exception, version
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
17 3.1, as published by the Free Software Foundation.
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
18
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
19 You should have received a copy of the GNU General Public License and
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
20 a copy of the GCC Runtime Library Exception along with this program;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
21 see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
22 <http://www.gnu.org/licenses/>. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
23
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
24 #ifndef _MMINTRIN_H_INCLUDED
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
25 #define _MMINTRIN_H_INCLUDED
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
26
111
kono
parents: 0
diff changeset
27 #ifndef __IWMMXT__
kono
parents: 0
diff changeset
28 #error mmintrin.h included without enabling WMMX/WMMX2 instructions (e.g. -march=iwmmxt or -march=iwmmxt2)
kono
parents: 0
diff changeset
29 #endif
kono
parents: 0
diff changeset
30
kono
parents: 0
diff changeset
31
kono
parents: 0
diff changeset
32 #if defined __cplusplus
kono
parents: 0
diff changeset
33 extern "C" {
kono
parents: 0
diff changeset
34 /* Intrinsics use C name-mangling. */
kono
parents: 0
diff changeset
35 #endif /* __cplusplus */
kono
parents: 0
diff changeset
36
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
37 /* The data type intended for user use. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
38 typedef unsigned long long __m64, __int64;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
39
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
40 /* Internal data types for implementing the intrinsics. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
41 typedef int __v2si __attribute__ ((vector_size (8)));
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
42 typedef short __v4hi __attribute__ ((vector_size (8)));
111
kono
parents: 0
diff changeset
43 typedef signed char __v8qi __attribute__ ((vector_size (8)));
kono
parents: 0
diff changeset
44
kono
parents: 0
diff changeset
45 /* Provided for source compatibility with MMX. */
kono
parents: 0
diff changeset
46 extern __inline void __attribute__((__gnu_inline__, __always_inline__, __artificial__))
kono
parents: 0
diff changeset
47 _mm_empty (void)
kono
parents: 0
diff changeset
48 {
kono
parents: 0
diff changeset
49 }
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
50
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
51 /* "Convert" __m64 and __int64 into each other. */
111
kono
parents: 0
diff changeset
52 static __inline __m64
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
53 _mm_cvtsi64_m64 (__int64 __i)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
54 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
55 return __i;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
56 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
57
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
58 static __inline __int64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
59 _mm_cvtm64_si64 (__m64 __i)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
60 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
61 return __i;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
62 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
63
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
64 static __inline int
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
65 _mm_cvtsi64_si32 (__int64 __i)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
66 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
67 return __i;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
68 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
69
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
70 static __inline __int64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
71 _mm_cvtsi32_si64 (int __i)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
72 {
111
kono
parents: 0
diff changeset
73 return (__i & 0xffffffff);
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
74 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
75
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
76 /* Pack the four 16-bit values from M1 into the lower four 8-bit values of
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
77 the result, and the four 16-bit values from M2 into the upper four 8-bit
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
78 values of the result, all with signed saturation. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
79 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
80 _mm_packs_pi16 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
81 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
82 return (__m64) __builtin_arm_wpackhss ((__v4hi)__m1, (__v4hi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
83 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
84
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
85 /* Pack the two 32-bit values from M1 into the lower two 16-bit values of
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
86 the result, and the two 32-bit values from M2 into the upper two 16-bit
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
87 values of the result, all with signed saturation. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
88 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
89 _mm_packs_pi32 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
90 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
91 return (__m64) __builtin_arm_wpackwss ((__v2si)__m1, (__v2si)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
92 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
93
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
94 /* Copy the 64-bit value from M1 into the lower 32 bits of the result, and
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
95 the 64-bit value from M2 into the upper 32 bits of the result, all with
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
96 signed saturation for values that do not fit exactly into 32 bits. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
97 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
98 _mm_packs_pi64 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
99 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
100 return (__m64) __builtin_arm_wpackdss ((long long)__m1, (long long)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
101 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
102
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
103 /* Pack the four 16-bit values from M1 into the lower four 8-bit values of
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
104 the result, and the four 16-bit values from M2 into the upper four 8-bit
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
105 values of the result, all with unsigned saturation. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
106 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
107 _mm_packs_pu16 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
108 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
109 return (__m64) __builtin_arm_wpackhus ((__v4hi)__m1, (__v4hi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
110 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
111
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
112 /* Pack the two 32-bit values from M1 into the lower two 16-bit values of
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
113 the result, and the two 32-bit values from M2 into the upper two 16-bit
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
114 values of the result, all with unsigned saturation. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
115 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
116 _mm_packs_pu32 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
117 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
118 return (__m64) __builtin_arm_wpackwus ((__v2si)__m1, (__v2si)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
119 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
120
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
121 /* Copy the 64-bit value from M1 into the lower 32 bits of the result, and
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
122 the 64-bit value from M2 into the upper 32 bits of the result, all with
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
123 unsigned saturation for values that do not fit exactly into 32 bits. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
124 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
125 _mm_packs_pu64 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
126 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
127 return (__m64) __builtin_arm_wpackdus ((long long)__m1, (long long)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
128 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
129
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
130 /* Interleave the four 8-bit values from the high half of M1 with the four
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
131 8-bit values from the high half of M2. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
132 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
133 _mm_unpackhi_pi8 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
134 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
135 return (__m64) __builtin_arm_wunpckihb ((__v8qi)__m1, (__v8qi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
136 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
137
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
138 /* Interleave the two 16-bit values from the high half of M1 with the two
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
139 16-bit values from the high half of M2. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
140 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
141 _mm_unpackhi_pi16 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
142 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
143 return (__m64) __builtin_arm_wunpckihh ((__v4hi)__m1, (__v4hi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
144 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
145
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
146 /* Interleave the 32-bit value from the high half of M1 with the 32-bit
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
147 value from the high half of M2. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
148 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
149 _mm_unpackhi_pi32 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
150 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
151 return (__m64) __builtin_arm_wunpckihw ((__v2si)__m1, (__v2si)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
152 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
153
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
154 /* Interleave the four 8-bit values from the low half of M1 with the four
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
155 8-bit values from the low half of M2. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
156 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
157 _mm_unpacklo_pi8 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
158 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
159 return (__m64) __builtin_arm_wunpckilb ((__v8qi)__m1, (__v8qi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
160 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
161
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
162 /* Interleave the two 16-bit values from the low half of M1 with the two
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
163 16-bit values from the low half of M2. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
164 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
165 _mm_unpacklo_pi16 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
166 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
167 return (__m64) __builtin_arm_wunpckilh ((__v4hi)__m1, (__v4hi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
168 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
169
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
170 /* Interleave the 32-bit value from the low half of M1 with the 32-bit
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
171 value from the low half of M2. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
172 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
173 _mm_unpacklo_pi32 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
174 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
175 return (__m64) __builtin_arm_wunpckilw ((__v2si)__m1, (__v2si)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
176 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
177
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
178 /* Take the four 8-bit values from the low half of M1, sign extend them,
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
179 and return the result as a vector of four 16-bit quantities. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
180 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
181 _mm_unpackel_pi8 (__m64 __m1)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
182 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
183 return (__m64) __builtin_arm_wunpckelsb ((__v8qi)__m1);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
184 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
185
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
186 /* Take the two 16-bit values from the low half of M1, sign extend them,
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
187 and return the result as a vector of two 32-bit quantities. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
188 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
189 _mm_unpackel_pi16 (__m64 __m1)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
190 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
191 return (__m64) __builtin_arm_wunpckelsh ((__v4hi)__m1);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
192 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
193
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
194 /* Take the 32-bit value from the low half of M1, and return it sign extended
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
195 to 64 bits. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
196 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
197 _mm_unpackel_pi32 (__m64 __m1)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
198 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
199 return (__m64) __builtin_arm_wunpckelsw ((__v2si)__m1);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
200 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
201
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
202 /* Take the four 8-bit values from the high half of M1, sign extend them,
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
203 and return the result as a vector of four 16-bit quantities. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
204 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
205 _mm_unpackeh_pi8 (__m64 __m1)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
206 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
207 return (__m64) __builtin_arm_wunpckehsb ((__v8qi)__m1);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
208 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
209
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
210 /* Take the two 16-bit values from the high half of M1, sign extend them,
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
211 and return the result as a vector of two 32-bit quantities. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
212 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
213 _mm_unpackeh_pi16 (__m64 __m1)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
214 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
215 return (__m64) __builtin_arm_wunpckehsh ((__v4hi)__m1);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
216 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
217
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
218 /* Take the 32-bit value from the high half of M1, and return it sign extended
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
219 to 64 bits. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
220 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
221 _mm_unpackeh_pi32 (__m64 __m1)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
222 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
223 return (__m64) __builtin_arm_wunpckehsw ((__v2si)__m1);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
224 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
225
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
226 /* Take the four 8-bit values from the low half of M1, zero extend them,
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
227 and return the result as a vector of four 16-bit quantities. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
228 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
229 _mm_unpackel_pu8 (__m64 __m1)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
230 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
231 return (__m64) __builtin_arm_wunpckelub ((__v8qi)__m1);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
232 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
233
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
234 /* Take the two 16-bit values from the low half of M1, zero extend them,
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
235 and return the result as a vector of two 32-bit quantities. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
236 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
237 _mm_unpackel_pu16 (__m64 __m1)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
238 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
239 return (__m64) __builtin_arm_wunpckeluh ((__v4hi)__m1);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
240 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
241
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
242 /* Take the 32-bit value from the low half of M1, and return it zero extended
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
243 to 64 bits. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
244 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
245 _mm_unpackel_pu32 (__m64 __m1)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
246 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
247 return (__m64) __builtin_arm_wunpckeluw ((__v2si)__m1);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
248 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
249
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
250 /* Take the four 8-bit values from the high half of M1, zero extend them,
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
251 and return the result as a vector of four 16-bit quantities. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
252 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
253 _mm_unpackeh_pu8 (__m64 __m1)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
254 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
255 return (__m64) __builtin_arm_wunpckehub ((__v8qi)__m1);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
256 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
257
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
258 /* Take the two 16-bit values from the high half of M1, zero extend them,
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
259 and return the result as a vector of two 32-bit quantities. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
260 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
261 _mm_unpackeh_pu16 (__m64 __m1)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
262 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
263 return (__m64) __builtin_arm_wunpckehuh ((__v4hi)__m1);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
264 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
265
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
266 /* Take the 32-bit value from the high half of M1, and return it zero extended
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
267 to 64 bits. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
268 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
269 _mm_unpackeh_pu32 (__m64 __m1)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
270 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
271 return (__m64) __builtin_arm_wunpckehuw ((__v2si)__m1);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
272 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
273
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
274 /* Add the 8-bit values in M1 to the 8-bit values in M2. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
275 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
276 _mm_add_pi8 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
277 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
278 return (__m64) __builtin_arm_waddb ((__v8qi)__m1, (__v8qi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
279 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
280
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
281 /* Add the 16-bit values in M1 to the 16-bit values in M2. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
282 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
283 _mm_add_pi16 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
284 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
285 return (__m64) __builtin_arm_waddh ((__v4hi)__m1, (__v4hi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
286 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
287
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
288 /* Add the 32-bit values in M1 to the 32-bit values in M2. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
289 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
290 _mm_add_pi32 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
291 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
292 return (__m64) __builtin_arm_waddw ((__v2si)__m1, (__v2si)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
293 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
294
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
295 /* Add the 8-bit values in M1 to the 8-bit values in M2 using signed
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
296 saturated arithmetic. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
297 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
298 _mm_adds_pi8 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
299 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
300 return (__m64) __builtin_arm_waddbss ((__v8qi)__m1, (__v8qi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
301 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
302
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
303 /* Add the 16-bit values in M1 to the 16-bit values in M2 using signed
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
304 saturated arithmetic. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
305 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
306 _mm_adds_pi16 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
307 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
308 return (__m64) __builtin_arm_waddhss ((__v4hi)__m1, (__v4hi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
309 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
310
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
311 /* Add the 32-bit values in M1 to the 32-bit values in M2 using signed
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
312 saturated arithmetic. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
313 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
314 _mm_adds_pi32 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
315 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
316 return (__m64) __builtin_arm_waddwss ((__v2si)__m1, (__v2si)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
317 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
318
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
319 /* Add the 8-bit values in M1 to the 8-bit values in M2 using unsigned
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
320 saturated arithmetic. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
321 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
322 _mm_adds_pu8 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
323 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
324 return (__m64) __builtin_arm_waddbus ((__v8qi)__m1, (__v8qi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
325 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
326
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
327 /* Add the 16-bit values in M1 to the 16-bit values in M2 using unsigned
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
328 saturated arithmetic. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
329 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
330 _mm_adds_pu16 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
331 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
332 return (__m64) __builtin_arm_waddhus ((__v4hi)__m1, (__v4hi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
333 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
334
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
335 /* Add the 32-bit values in M1 to the 32-bit values in M2 using unsigned
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
336 saturated arithmetic. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
337 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
338 _mm_adds_pu32 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
339 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
340 return (__m64) __builtin_arm_waddwus ((__v2si)__m1, (__v2si)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
341 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
342
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
343 /* Subtract the 8-bit values in M2 from the 8-bit values in M1. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
344 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
345 _mm_sub_pi8 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
346 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
347 return (__m64) __builtin_arm_wsubb ((__v8qi)__m1, (__v8qi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
348 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
349
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
350 /* Subtract the 16-bit values in M2 from the 16-bit values in M1. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
351 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
352 _mm_sub_pi16 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
353 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
354 return (__m64) __builtin_arm_wsubh ((__v4hi)__m1, (__v4hi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
355 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
356
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
357 /* Subtract the 32-bit values in M2 from the 32-bit values in M1. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
358 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
359 _mm_sub_pi32 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
360 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
361 return (__m64) __builtin_arm_wsubw ((__v2si)__m1, (__v2si)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
362 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
363
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
364 /* Subtract the 8-bit values in M2 from the 8-bit values in M1 using signed
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
365 saturating arithmetic. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
366 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
367 _mm_subs_pi8 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
368 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
369 return (__m64) __builtin_arm_wsubbss ((__v8qi)__m1, (__v8qi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
370 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
371
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
372 /* Subtract the 16-bit values in M2 from the 16-bit values in M1 using
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
373 signed saturating arithmetic. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
374 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
375 _mm_subs_pi16 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
376 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
377 return (__m64) __builtin_arm_wsubhss ((__v4hi)__m1, (__v4hi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
378 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
379
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
380 /* Subtract the 32-bit values in M2 from the 32-bit values in M1 using
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
381 signed saturating arithmetic. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
382 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
383 _mm_subs_pi32 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
384 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
385 return (__m64) __builtin_arm_wsubwss ((__v2si)__m1, (__v2si)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
386 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
387
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
388 /* Subtract the 8-bit values in M2 from the 8-bit values in M1 using
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
389 unsigned saturating arithmetic. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
390 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
391 _mm_subs_pu8 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
392 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
393 return (__m64) __builtin_arm_wsubbus ((__v8qi)__m1, (__v8qi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
394 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
395
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
396 /* Subtract the 16-bit values in M2 from the 16-bit values in M1 using
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
397 unsigned saturating arithmetic. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
398 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
399 _mm_subs_pu16 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
400 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
401 return (__m64) __builtin_arm_wsubhus ((__v4hi)__m1, (__v4hi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
402 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
403
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
404 /* Subtract the 32-bit values in M2 from the 32-bit values in M1 using
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
405 unsigned saturating arithmetic. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
406 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
407 _mm_subs_pu32 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
408 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
409 return (__m64) __builtin_arm_wsubwus ((__v2si)__m1, (__v2si)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
410 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
411
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
412 /* Multiply four 16-bit values in M1 by four 16-bit values in M2 producing
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
413 four 32-bit intermediate results, which are then summed by pairs to
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
414 produce two 32-bit results. The 16-bit values are treated as signed. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
415 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
416 _mm_madd_pi16 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
417 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
418 return (__m64) __builtin_arm_wmadds ((__v4hi)__m1, (__v4hi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
419 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
420
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
421 /* Multiply four 16-bit values in M1 by four 16-bit values in M2 producing
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
422 four 32-bit intermediate results, which are then summed by pairs to
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
423 produce two 32-bit results. The 16-bit values are treated as unsigned. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
424 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
425 _mm_madd_pu16 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
426 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
427 return (__m64) __builtin_arm_wmaddu ((__v4hi)__m1, (__v4hi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
428 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
429
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
430 /* Multiply four signed 16-bit values in M1 by four signed 16-bit values in
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
431 M2 and produce the high 16 bits of the 32-bit results. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
432 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
433 _mm_mulhi_pi16 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
434 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
435 return (__m64) __builtin_arm_wmulsm ((__v4hi)__m1, (__v4hi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
436 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
437
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
438 /* Multiply four unsigned 16-bit values in M1 by four unsigned 16-bit values in
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
439 M2 and produce the high 16 bits of the 32-bit results. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
440 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
441 _mm_mulhi_pu16 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
442 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
443 return (__m64) __builtin_arm_wmulum ((__v4hi)__m1, (__v4hi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
444 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
445
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
446 /* Multiply four 16-bit values in M1 by four 16-bit values in M2 and produce
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
447 the low 16 bits of the results. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
448 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
449 _mm_mullo_pi16 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
450 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
451 return (__m64) __builtin_arm_wmulul ((__v4hi)__m1, (__v4hi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
452 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
453
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
454 /* Shift four 16-bit values in M left by COUNT. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
455 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
456 _mm_sll_pi16 (__m64 __m, __m64 __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
457 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
458 return (__m64) __builtin_arm_wsllh ((__v4hi)__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
459 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
460
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
461 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
462 _mm_slli_pi16 (__m64 __m, int __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
463 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
464 return (__m64) __builtin_arm_wsllhi ((__v4hi)__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
465 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
466
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
467 /* Shift two 32-bit values in M left by COUNT. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
468 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
469 _mm_sll_pi32 (__m64 __m, __m64 __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
470 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
471 return (__m64) __builtin_arm_wsllw ((__v2si)__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
472 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
473
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
474 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
475 _mm_slli_pi32 (__m64 __m, int __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
476 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
477 return (__m64) __builtin_arm_wsllwi ((__v2si)__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
478 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
479
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
480 /* Shift the 64-bit value in M left by COUNT. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
481 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
482 _mm_sll_si64 (__m64 __m, __m64 __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
483 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
484 return (__m64) __builtin_arm_wslld (__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
485 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
486
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
487 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
488 _mm_slli_si64 (__m64 __m, int __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
489 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
490 return (__m64) __builtin_arm_wslldi (__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
491 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
492
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
493 /* Shift four 16-bit values in M right by COUNT; shift in the sign bit. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
494 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
495 _mm_sra_pi16 (__m64 __m, __m64 __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
496 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
497 return (__m64) __builtin_arm_wsrah ((__v4hi)__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
498 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
499
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
500 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
501 _mm_srai_pi16 (__m64 __m, int __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
502 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
503 return (__m64) __builtin_arm_wsrahi ((__v4hi)__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
504 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
505
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
506 /* Shift two 32-bit values in M right by COUNT; shift in the sign bit. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
507 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
508 _mm_sra_pi32 (__m64 __m, __m64 __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
509 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
510 return (__m64) __builtin_arm_wsraw ((__v2si)__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
511 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
512
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
513 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
514 _mm_srai_pi32 (__m64 __m, int __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
515 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
516 return (__m64) __builtin_arm_wsrawi ((__v2si)__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
517 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
518
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
519 /* Shift the 64-bit value in M right by COUNT; shift in the sign bit. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
520 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
521 _mm_sra_si64 (__m64 __m, __m64 __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
522 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
523 return (__m64) __builtin_arm_wsrad (__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
524 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
525
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
526 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
527 _mm_srai_si64 (__m64 __m, int __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
528 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
529 return (__m64) __builtin_arm_wsradi (__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
530 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
531
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
532 /* Shift four 16-bit values in M right by COUNT; shift in zeros. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
533 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
534 _mm_srl_pi16 (__m64 __m, __m64 __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
535 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
536 return (__m64) __builtin_arm_wsrlh ((__v4hi)__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
537 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
538
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
539 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
540 _mm_srli_pi16 (__m64 __m, int __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
541 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
542 return (__m64) __builtin_arm_wsrlhi ((__v4hi)__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
543 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
544
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
545 /* Shift two 32-bit values in M right by COUNT; shift in zeros. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
546 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
547 _mm_srl_pi32 (__m64 __m, __m64 __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
548 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
549 return (__m64) __builtin_arm_wsrlw ((__v2si)__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
550 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
551
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
552 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
553 _mm_srli_pi32 (__m64 __m, int __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
554 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
555 return (__m64) __builtin_arm_wsrlwi ((__v2si)__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
556 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
557
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
558 /* Shift the 64-bit value in M right by COUNT; shift in zeros. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
559 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
560 _mm_srl_si64 (__m64 __m, __m64 __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
561 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
562 return (__m64) __builtin_arm_wsrld (__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
563 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
564
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
565 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
566 _mm_srli_si64 (__m64 __m, int __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
567 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
568 return (__m64) __builtin_arm_wsrldi (__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
569 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
570
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
571 /* Rotate four 16-bit values in M right by COUNT. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
572 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
573 _mm_ror_pi16 (__m64 __m, __m64 __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
574 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
575 return (__m64) __builtin_arm_wrorh ((__v4hi)__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
576 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
577
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
578 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
579 _mm_rori_pi16 (__m64 __m, int __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
580 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
581 return (__m64) __builtin_arm_wrorhi ((__v4hi)__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
582 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
583
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
584 /* Rotate two 32-bit values in M right by COUNT. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
585 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
586 _mm_ror_pi32 (__m64 __m, __m64 __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
587 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
588 return (__m64) __builtin_arm_wrorw ((__v2si)__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
589 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
590
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
591 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
592 _mm_rori_pi32 (__m64 __m, int __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
593 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
594 return (__m64) __builtin_arm_wrorwi ((__v2si)__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
595 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
596
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
597 /* Rotate the 64-bit value in M right by COUNT. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
598 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
599 _mm_ror_si64 (__m64 __m, __m64 __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
600 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
601 return (__m64) __builtin_arm_wrord (__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
602 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
603
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
604 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
605 _mm_rori_si64 (__m64 __m, int __count)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
606 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
607 return (__m64) __builtin_arm_wrordi (__m, __count);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
608 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
609
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
610 /* Bit-wise AND the 64-bit values in M1 and M2. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
611 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
612 _mm_and_si64 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
613 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
614 return __builtin_arm_wand (__m1, __m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
615 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
616
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
617 /* Bit-wise complement the 64-bit value in M1 and bit-wise AND it with the
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
618 64-bit value in M2. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
619 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
620 _mm_andnot_si64 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
621 {
111
kono
parents: 0
diff changeset
622 return __builtin_arm_wandn (__m2, __m1);
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
623 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
624
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
625 /* Bit-wise inclusive OR the 64-bit values in M1 and M2. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
626 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
627 _mm_or_si64 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
628 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
629 return __builtin_arm_wor (__m1, __m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
630 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
631
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
632 /* Bit-wise exclusive OR the 64-bit values in M1 and M2. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
633 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
634 _mm_xor_si64 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
635 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
636 return __builtin_arm_wxor (__m1, __m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
637 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
638
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
639 /* Compare eight 8-bit values. The result of the comparison is 0xFF if the
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
640 test is true and zero if false. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
641 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
642 _mm_cmpeq_pi8 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
643 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
644 return (__m64) __builtin_arm_wcmpeqb ((__v8qi)__m1, (__v8qi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
645 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
646
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
647 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
648 _mm_cmpgt_pi8 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
649 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
650 return (__m64) __builtin_arm_wcmpgtsb ((__v8qi)__m1, (__v8qi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
651 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
652
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
653 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
654 _mm_cmpgt_pu8 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
655 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
656 return (__m64) __builtin_arm_wcmpgtub ((__v8qi)__m1, (__v8qi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
657 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
658
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
659 /* Compare four 16-bit values. The result of the comparison is 0xFFFF if
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
660 the test is true and zero if false. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
661 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
662 _mm_cmpeq_pi16 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
663 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
664 return (__m64) __builtin_arm_wcmpeqh ((__v4hi)__m1, (__v4hi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
665 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
666
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
667 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
668 _mm_cmpgt_pi16 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
669 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
670 return (__m64) __builtin_arm_wcmpgtsh ((__v4hi)__m1, (__v4hi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
671 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
672
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
673 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
674 _mm_cmpgt_pu16 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
675 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
676 return (__m64) __builtin_arm_wcmpgtuh ((__v4hi)__m1, (__v4hi)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
677 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
678
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
679 /* Compare two 32-bit values. The result of the comparison is 0xFFFFFFFF if
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
680 the test is true and zero if false. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
681 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
682 _mm_cmpeq_pi32 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
683 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
684 return (__m64) __builtin_arm_wcmpeqw ((__v2si)__m1, (__v2si)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
685 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
686
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
687 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
688 _mm_cmpgt_pi32 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
689 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
690 return (__m64) __builtin_arm_wcmpgtsw ((__v2si)__m1, (__v2si)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
691 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
692
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
693 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
694 _mm_cmpgt_pu32 (__m64 __m1, __m64 __m2)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
695 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
696 return (__m64) __builtin_arm_wcmpgtuw ((__v2si)__m1, (__v2si)__m2);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
697 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
698
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
699 /* Element-wise multiplication of unsigned 16-bit values __B and __C, followed
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
700 by accumulate across all elements and __A. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
701 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
702 _mm_mac_pu16 (__m64 __A, __m64 __B, __m64 __C)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
703 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
704 return __builtin_arm_wmacu (__A, (__v4hi)__B, (__v4hi)__C);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
705 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
706
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
707 /* Element-wise multiplication of signed 16-bit values __B and __C, followed
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
708 by accumulate across all elements and __A. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
709 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
710 _mm_mac_pi16 (__m64 __A, __m64 __B, __m64 __C)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
711 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
712 return __builtin_arm_wmacs (__A, (__v4hi)__B, (__v4hi)__C);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
713 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
714
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
715 /* Element-wise multiplication of unsigned 16-bit values __A and __B, followed
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
716 by accumulate across all elements. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
717 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
718 _mm_macz_pu16 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
719 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
720 return __builtin_arm_wmacuz ((__v4hi)__A, (__v4hi)__B);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
721 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
722
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
723 /* Element-wise multiplication of signed 16-bit values __A and __B, followed
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
724 by accumulate across all elements. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
725 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
726 _mm_macz_pi16 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
727 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
728 return __builtin_arm_wmacsz ((__v4hi)__A, (__v4hi)__B);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
729 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
730
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
731 /* Accumulate across all unsigned 8-bit values in __A. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
732 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
733 _mm_acc_pu8 (__m64 __A)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
734 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
735 return __builtin_arm_waccb ((__v8qi)__A);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
736 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
737
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
738 /* Accumulate across all unsigned 16-bit values in __A. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
739 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
740 _mm_acc_pu16 (__m64 __A)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
741 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
742 return __builtin_arm_wacch ((__v4hi)__A);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
743 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
744
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
745 /* Accumulate across all unsigned 32-bit values in __A. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
746 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
747 _mm_acc_pu32 (__m64 __A)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
748 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
749 return __builtin_arm_waccw ((__v2si)__A);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
750 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
751
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
752 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
753 _mm_mia_si64 (__m64 __A, int __B, int __C)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
754 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
755 return __builtin_arm_tmia (__A, __B, __C);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
756 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
757
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
758 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
759 _mm_miaph_si64 (__m64 __A, int __B, int __C)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
760 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
761 return __builtin_arm_tmiaph (__A, __B, __C);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
762 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
763
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
764 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
765 _mm_miabb_si64 (__m64 __A, int __B, int __C)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
766 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
767 return __builtin_arm_tmiabb (__A, __B, __C);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
768 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
769
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
770 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
771 _mm_miabt_si64 (__m64 __A, int __B, int __C)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
772 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
773 return __builtin_arm_tmiabt (__A, __B, __C);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
774 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
775
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
776 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
777 _mm_miatb_si64 (__m64 __A, int __B, int __C)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
778 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
779 return __builtin_arm_tmiatb (__A, __B, __C);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
780 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
781
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
782 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
783 _mm_miatt_si64 (__m64 __A, int __B, int __C)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
784 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
785 return __builtin_arm_tmiatt (__A, __B, __C);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
786 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
787
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
788 /* Extract one of the elements of A and sign extend. The selector N must
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
789 be immediate. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
790 #define _mm_extract_pi8(A, N) __builtin_arm_textrmsb ((__v8qi)(A), (N))
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
791 #define _mm_extract_pi16(A, N) __builtin_arm_textrmsh ((__v4hi)(A), (N))
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
792 #define _mm_extract_pi32(A, N) __builtin_arm_textrmsw ((__v2si)(A), (N))
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
793
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
794 /* Extract one of the elements of A and zero extend. The selector N must
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
795 be immediate. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
796 #define _mm_extract_pu8(A, N) __builtin_arm_textrmub ((__v8qi)(A), (N))
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
797 #define _mm_extract_pu16(A, N) __builtin_arm_textrmuh ((__v4hi)(A), (N))
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
798 #define _mm_extract_pu32(A, N) __builtin_arm_textrmuw ((__v2si)(A), (N))
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
799
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
800 /* Inserts word D into one of the elements of A. The selector N must be
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
801 immediate. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
802 #define _mm_insert_pi8(A, D, N) \
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
803 ((__m64) __builtin_arm_tinsrb ((__v8qi)(A), (D), (N)))
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
804 #define _mm_insert_pi16(A, D, N) \
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
805 ((__m64) __builtin_arm_tinsrh ((__v4hi)(A), (D), (N)))
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
806 #define _mm_insert_pi32(A, D, N) \
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
807 ((__m64) __builtin_arm_tinsrw ((__v2si)(A), (D), (N)))
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
808
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
809 /* Compute the element-wise maximum of signed 8-bit values. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
810 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
811 _mm_max_pi8 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
812 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
813 return (__m64) __builtin_arm_wmaxsb ((__v8qi)__A, (__v8qi)__B);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
814 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
815
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
816 /* Compute the element-wise maximum of signed 16-bit values. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
817 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
818 _mm_max_pi16 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
819 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
820 return (__m64) __builtin_arm_wmaxsh ((__v4hi)__A, (__v4hi)__B);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
821 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
822
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
823 /* Compute the element-wise maximum of signed 32-bit values. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
824 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
825 _mm_max_pi32 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
826 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
827 return (__m64) __builtin_arm_wmaxsw ((__v2si)__A, (__v2si)__B);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
828 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
829
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
830 /* Compute the element-wise maximum of unsigned 8-bit values. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
831 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
832 _mm_max_pu8 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
833 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
834 return (__m64) __builtin_arm_wmaxub ((__v8qi)__A, (__v8qi)__B);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
835 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
836
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
837 /* Compute the element-wise maximum of unsigned 16-bit values. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
838 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
839 _mm_max_pu16 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
840 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
841 return (__m64) __builtin_arm_wmaxuh ((__v4hi)__A, (__v4hi)__B);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
842 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
843
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
844 /* Compute the element-wise maximum of unsigned 32-bit values. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
845 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
846 _mm_max_pu32 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
847 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
848 return (__m64) __builtin_arm_wmaxuw ((__v2si)__A, (__v2si)__B);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
849 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
850
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
851 /* Compute the element-wise minimum of signed 8-bit values. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
852 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
853 _mm_min_pi8 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
854 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
855 return (__m64) __builtin_arm_wminsb ((__v8qi)__A, (__v8qi)__B);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
856 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
857
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
858 /* Compute the element-wise minimum of signed 16-bit values. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
859 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
860 _mm_min_pi16 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
861 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
862 return (__m64) __builtin_arm_wminsh ((__v4hi)__A, (__v4hi)__B);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
863 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
864
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
865 /* Compute the element-wise minimum of signed 32-bit values. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
866 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
867 _mm_min_pi32 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
868 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
869 return (__m64) __builtin_arm_wminsw ((__v2si)__A, (__v2si)__B);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
870 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
871
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
872 /* Compute the element-wise minimum of unsigned 8-bit values. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
873 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
874 _mm_min_pu8 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
875 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
876 return (__m64) __builtin_arm_wminub ((__v8qi)__A, (__v8qi)__B);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
877 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
878
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
879 /* Compute the element-wise minimum of unsigned 16-bit values. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
880 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
881 _mm_min_pu16 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
882 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
883 return (__m64) __builtin_arm_wminuh ((__v4hi)__A, (__v4hi)__B);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
884 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
885
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
886 /* Compute the element-wise minimum of unsigned 32-bit values. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
887 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
888 _mm_min_pu32 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
889 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
890 return (__m64) __builtin_arm_wminuw ((__v2si)__A, (__v2si)__B);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
891 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
892
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
893 /* Create an 8-bit mask of the signs of 8-bit values. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
894 static __inline int
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
895 _mm_movemask_pi8 (__m64 __A)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
896 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
897 return __builtin_arm_tmovmskb ((__v8qi)__A);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
898 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
899
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
900 /* Create a 4-bit mask of the signs of 16-bit values. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
901 static __inline int
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
902 _mm_movemask_pi16 (__m64 __A)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
903 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
904 return __builtin_arm_tmovmskh ((__v4hi)__A);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
905 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
906
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
907 /* Create a 2-bit mask of the signs of 32-bit values. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
908 static __inline int
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
909 _mm_movemask_pi32 (__m64 __A)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
910 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
911 return __builtin_arm_tmovmskw ((__v2si)__A);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
912 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
913
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
914 /* Return a combination of the four 16-bit values in A. The selector
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
915 must be an immediate. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
916 #define _mm_shuffle_pi16(A, N) \
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
917 ((__m64) __builtin_arm_wshufh ((__v4hi)(A), (N)))
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
918
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
919
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
920 /* Compute the rounded averages of the unsigned 8-bit values in A and B. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
921 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
922 _mm_avg_pu8 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
923 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
924 return (__m64) __builtin_arm_wavg2br ((__v8qi)__A, (__v8qi)__B);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
925 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
926
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
927 /* Compute the rounded averages of the unsigned 16-bit values in A and B. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
928 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
929 _mm_avg_pu16 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
930 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
931 return (__m64) __builtin_arm_wavg2hr ((__v4hi)__A, (__v4hi)__B);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
932 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
933
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
934 /* Compute the averages of the unsigned 8-bit values in A and B. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
935 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
936 _mm_avg2_pu8 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
937 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
938 return (__m64) __builtin_arm_wavg2b ((__v8qi)__A, (__v8qi)__B);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
939 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
940
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
941 /* Compute the averages of the unsigned 16-bit values in A and B. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
942 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
943 _mm_avg2_pu16 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
944 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
945 return (__m64) __builtin_arm_wavg2h ((__v4hi)__A, (__v4hi)__B);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
946 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
947
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
948 /* Compute the sum of the absolute differences of the unsigned 8-bit
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
949 values in A and B. Return the value in the lower 16-bit word; the
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
950 upper words are cleared. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
951 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
952 _mm_sad_pu8 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
953 {
111
kono
parents: 0
diff changeset
954 return (__m64) __builtin_arm_wsadbz ((__v8qi)__A, (__v8qi)__B);
kono
parents: 0
diff changeset
955 }
kono
parents: 0
diff changeset
956
kono
parents: 0
diff changeset
957 static __inline __m64
kono
parents: 0
diff changeset
958 _mm_sada_pu8 (__m64 __A, __m64 __B, __m64 __C)
kono
parents: 0
diff changeset
959 {
kono
parents: 0
diff changeset
960 return (__m64) __builtin_arm_wsadb ((__v2si)__A, (__v8qi)__B, (__v8qi)__C);
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
961 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
962
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
963 /* Compute the sum of the absolute differences of the unsigned 16-bit
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
964 values in A and B. Return the value in the lower 32-bit word; the
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
965 upper words are cleared. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
966 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
967 _mm_sad_pu16 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
968 {
111
kono
parents: 0
diff changeset
969 return (__m64) __builtin_arm_wsadhz ((__v4hi)__A, (__v4hi)__B);
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
970 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
971
111
kono
parents: 0
diff changeset
972 static __inline __m64
kono
parents: 0
diff changeset
973 _mm_sada_pu16 (__m64 __A, __m64 __B, __m64 __C)
kono
parents: 0
diff changeset
974 {
kono
parents: 0
diff changeset
975 return (__m64) __builtin_arm_wsadh ((__v2si)__A, (__v4hi)__B, (__v4hi)__C);
kono
parents: 0
diff changeset
976 }
kono
parents: 0
diff changeset
977
kono
parents: 0
diff changeset
978
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
979 /* Compute the sum of the absolute differences of the unsigned 8-bit
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
980 values in A and B. Return the value in the lower 16-bit word; the
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
981 upper words are cleared. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
982 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
983 _mm_sadz_pu8 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
984 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
985 return (__m64) __builtin_arm_wsadbz ((__v8qi)__A, (__v8qi)__B);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
986 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
987
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
988 /* Compute the sum of the absolute differences of the unsigned 16-bit
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
989 values in A and B. Return the value in the lower 32-bit word; the
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
990 upper words are cleared. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
991 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
992 _mm_sadz_pu16 (__m64 __A, __m64 __B)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
993 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
994 return (__m64) __builtin_arm_wsadhz ((__v4hi)__A, (__v4hi)__B);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
995 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
996
111
kono
parents: 0
diff changeset
997 #define _mm_align_si64(__A,__B, N) \
kono
parents: 0
diff changeset
998 (__m64) __builtin_arm_walign ((__v8qi) (__A),(__v8qi) (__B), (N))
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
999
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1000 /* Creates a 64-bit zero. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1001 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1002 _mm_setzero_si64 (void)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1003 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1004 return __builtin_arm_wzero ();
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1005 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1006
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1007 /* Set and Get arbitrary iWMMXt Control registers.
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1008 Note only registers 0-3 and 8-11 are currently defined,
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1009 the rest are reserved. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1010
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1011 static __inline void
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1012 _mm_setwcx (const int __value, const int __regno)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1013 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1014 switch (__regno)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1015 {
111
kono
parents: 0
diff changeset
1016 case 0:
kono
parents: 0
diff changeset
1017 __asm __volatile ("tmcr wcid, %0" :: "r"(__value));
kono
parents: 0
diff changeset
1018 break;
kono
parents: 0
diff changeset
1019 case 1:
kono
parents: 0
diff changeset
1020 __asm __volatile ("tmcr wcon, %0" :: "r"(__value));
kono
parents: 0
diff changeset
1021 break;
kono
parents: 0
diff changeset
1022 case 2:
kono
parents: 0
diff changeset
1023 __asm __volatile ("tmcr wcssf, %0" :: "r"(__value));
kono
parents: 0
diff changeset
1024 break;
kono
parents: 0
diff changeset
1025 case 3:
kono
parents: 0
diff changeset
1026 __asm __volatile ("tmcr wcasf, %0" :: "r"(__value));
kono
parents: 0
diff changeset
1027 break;
kono
parents: 0
diff changeset
1028 case 8:
kono
parents: 0
diff changeset
1029 __builtin_arm_setwcgr0 (__value);
kono
parents: 0
diff changeset
1030 break;
kono
parents: 0
diff changeset
1031 case 9:
kono
parents: 0
diff changeset
1032 __builtin_arm_setwcgr1 (__value);
kono
parents: 0
diff changeset
1033 break;
kono
parents: 0
diff changeset
1034 case 10:
kono
parents: 0
diff changeset
1035 __builtin_arm_setwcgr2 (__value);
kono
parents: 0
diff changeset
1036 break;
kono
parents: 0
diff changeset
1037 case 11:
kono
parents: 0
diff changeset
1038 __builtin_arm_setwcgr3 (__value);
kono
parents: 0
diff changeset
1039 break;
kono
parents: 0
diff changeset
1040 default:
kono
parents: 0
diff changeset
1041 break;
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1042 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1043 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1044
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1045 static __inline int
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1046 _mm_getwcx (const int __regno)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1047 {
111
kono
parents: 0
diff changeset
1048 int __value;
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1049 switch (__regno)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1050 {
111
kono
parents: 0
diff changeset
1051 case 0:
kono
parents: 0
diff changeset
1052 __asm __volatile ("tmrc %0, wcid" : "=r"(__value));
kono
parents: 0
diff changeset
1053 break;
kono
parents: 0
diff changeset
1054 case 1:
kono
parents: 0
diff changeset
1055 __asm __volatile ("tmrc %0, wcon" : "=r"(__value));
kono
parents: 0
diff changeset
1056 break;
kono
parents: 0
diff changeset
1057 case 2:
kono
parents: 0
diff changeset
1058 __asm __volatile ("tmrc %0, wcssf" : "=r"(__value));
kono
parents: 0
diff changeset
1059 break;
kono
parents: 0
diff changeset
1060 case 3:
kono
parents: 0
diff changeset
1061 __asm __volatile ("tmrc %0, wcasf" : "=r"(__value));
kono
parents: 0
diff changeset
1062 break;
kono
parents: 0
diff changeset
1063 case 8:
kono
parents: 0
diff changeset
1064 return __builtin_arm_getwcgr0 ();
kono
parents: 0
diff changeset
1065 case 9:
kono
parents: 0
diff changeset
1066 return __builtin_arm_getwcgr1 ();
kono
parents: 0
diff changeset
1067 case 10:
kono
parents: 0
diff changeset
1068 return __builtin_arm_getwcgr2 ();
kono
parents: 0
diff changeset
1069 case 11:
kono
parents: 0
diff changeset
1070 return __builtin_arm_getwcgr3 ();
kono
parents: 0
diff changeset
1071 default:
kono
parents: 0
diff changeset
1072 break;
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1073 }
111
kono
parents: 0
diff changeset
1074 return __value;
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1075 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1076
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1077 /* Creates a vector of two 32-bit values; I0 is least significant. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1078 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1079 _mm_set_pi32 (int __i1, int __i0)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1080 {
111
kono
parents: 0
diff changeset
1081 union
kono
parents: 0
diff changeset
1082 {
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1083 __m64 __q;
111
kono
parents: 0
diff changeset
1084 struct
kono
parents: 0
diff changeset
1085 {
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1086 unsigned int __i0;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1087 unsigned int __i1;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1088 } __s;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1089 } __u;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1090
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1091 __u.__s.__i0 = __i0;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1092 __u.__s.__i1 = __i1;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1093
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1094 return __u.__q;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1095 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1096
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1097 /* Creates a vector of four 16-bit values; W0 is least significant. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1098 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1099 _mm_set_pi16 (short __w3, short __w2, short __w1, short __w0)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1100 {
111
kono
parents: 0
diff changeset
1101 unsigned int __i1 = (unsigned short) __w3 << 16 | (unsigned short) __w2;
kono
parents: 0
diff changeset
1102 unsigned int __i0 = (unsigned short) __w1 << 16 | (unsigned short) __w0;
kono
parents: 0
diff changeset
1103
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1104 return _mm_set_pi32 (__i1, __i0);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1105 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1106
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1107 /* Creates a vector of eight 8-bit values; B0 is least significant. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1108 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1109 _mm_set_pi8 (char __b7, char __b6, char __b5, char __b4,
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1110 char __b3, char __b2, char __b1, char __b0)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1111 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1112 unsigned int __i1, __i0;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1113
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1114 __i1 = (unsigned char)__b7;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1115 __i1 = __i1 << 8 | (unsigned char)__b6;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1116 __i1 = __i1 << 8 | (unsigned char)__b5;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1117 __i1 = __i1 << 8 | (unsigned char)__b4;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1118
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1119 __i0 = (unsigned char)__b3;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1120 __i0 = __i0 << 8 | (unsigned char)__b2;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1121 __i0 = __i0 << 8 | (unsigned char)__b1;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1122 __i0 = __i0 << 8 | (unsigned char)__b0;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1123
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1124 return _mm_set_pi32 (__i1, __i0);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1125 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1126
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1127 /* Similar, but with the arguments in reverse order. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1128 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1129 _mm_setr_pi32 (int __i0, int __i1)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1130 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1131 return _mm_set_pi32 (__i1, __i0);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1132 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1133
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1134 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1135 _mm_setr_pi16 (short __w0, short __w1, short __w2, short __w3)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1136 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1137 return _mm_set_pi16 (__w3, __w2, __w1, __w0);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1138 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1139
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1140 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1141 _mm_setr_pi8 (char __b0, char __b1, char __b2, char __b3,
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1142 char __b4, char __b5, char __b6, char __b7)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1143 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1144 return _mm_set_pi8 (__b7, __b6, __b5, __b4, __b3, __b2, __b1, __b0);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1145 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1146
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1147 /* Creates a vector of two 32-bit values, both elements containing I. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1148 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1149 _mm_set1_pi32 (int __i)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1150 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1151 return _mm_set_pi32 (__i, __i);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1152 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1153
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1154 /* Creates a vector of four 16-bit values, all elements containing W. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1155 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1156 _mm_set1_pi16 (short __w)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1157 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1158 unsigned int __i = (unsigned short)__w << 16 | (unsigned short)__w;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1159 return _mm_set1_pi32 (__i);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1160 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1161
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1162 /* Creates a vector of eight 8-bit values, all elements containing B. */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1163 static __inline __m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1164 _mm_set1_pi8 (char __b)
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1165 {
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1166 unsigned int __w = (unsigned char)__b << 8 | (unsigned char)__b;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1167 unsigned int __i = __w << 16 | __w;
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1168 return _mm_set1_pi32 (__i);
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1169 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1170
111
kono
parents: 0
diff changeset
1171 #ifdef __IWMMXT2__
kono
parents: 0
diff changeset
1172 static __inline __m64
kono
parents: 0
diff changeset
1173 _mm_abs_pi8 (__m64 m1)
kono
parents: 0
diff changeset
1174 {
kono
parents: 0
diff changeset
1175 return (__m64) __builtin_arm_wabsb ((__v8qi)m1);
kono
parents: 0
diff changeset
1176 }
kono
parents: 0
diff changeset
1177
kono
parents: 0
diff changeset
1178 static __inline __m64
kono
parents: 0
diff changeset
1179 _mm_abs_pi16 (__m64 m1)
kono
parents: 0
diff changeset
1180 {
kono
parents: 0
diff changeset
1181 return (__m64) __builtin_arm_wabsh ((__v4hi)m1);
kono
parents: 0
diff changeset
1182
kono
parents: 0
diff changeset
1183 }
kono
parents: 0
diff changeset
1184
kono
parents: 0
diff changeset
1185 static __inline __m64
kono
parents: 0
diff changeset
1186 _mm_abs_pi32 (__m64 m1)
kono
parents: 0
diff changeset
1187 {
kono
parents: 0
diff changeset
1188 return (__m64) __builtin_arm_wabsw ((__v2si)m1);
kono
parents: 0
diff changeset
1189
kono
parents: 0
diff changeset
1190 }
kono
parents: 0
diff changeset
1191
kono
parents: 0
diff changeset
1192 static __inline __m64
kono
parents: 0
diff changeset
1193 _mm_addsubhx_pi16 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1194 {
kono
parents: 0
diff changeset
1195 return (__m64) __builtin_arm_waddsubhx ((__v4hi)a, (__v4hi)b);
kono
parents: 0
diff changeset
1196 }
kono
parents: 0
diff changeset
1197
kono
parents: 0
diff changeset
1198 static __inline __m64
kono
parents: 0
diff changeset
1199 _mm_absdiff_pu8 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1200 {
kono
parents: 0
diff changeset
1201 return (__m64) __builtin_arm_wabsdiffb ((__v8qi)a, (__v8qi)b);
kono
parents: 0
diff changeset
1202 }
kono
parents: 0
diff changeset
1203
kono
parents: 0
diff changeset
1204 static __inline __m64
kono
parents: 0
diff changeset
1205 _mm_absdiff_pu16 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1206 {
kono
parents: 0
diff changeset
1207 return (__m64) __builtin_arm_wabsdiffh ((__v4hi)a, (__v4hi)b);
kono
parents: 0
diff changeset
1208 }
kono
parents: 0
diff changeset
1209
kono
parents: 0
diff changeset
1210 static __inline __m64
kono
parents: 0
diff changeset
1211 _mm_absdiff_pu32 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1212 {
kono
parents: 0
diff changeset
1213 return (__m64) __builtin_arm_wabsdiffw ((__v2si)a, (__v2si)b);
kono
parents: 0
diff changeset
1214 }
kono
parents: 0
diff changeset
1215
kono
parents: 0
diff changeset
1216 static __inline __m64
kono
parents: 0
diff changeset
1217 _mm_addc_pu16 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1218 {
kono
parents: 0
diff changeset
1219 __m64 result;
kono
parents: 0
diff changeset
1220 __asm__ __volatile__ ("waddhc %0, %1, %2" : "=y" (result) : "y" (a), "y" (b));
kono
parents: 0
diff changeset
1221 return result;
kono
parents: 0
diff changeset
1222 }
kono
parents: 0
diff changeset
1223
kono
parents: 0
diff changeset
1224 static __inline __m64
kono
parents: 0
diff changeset
1225 _mm_addc_pu32 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1226 {
kono
parents: 0
diff changeset
1227 __m64 result;
kono
parents: 0
diff changeset
1228 __asm__ __volatile__ ("waddwc %0, %1, %2" : "=y" (result) : "y" (a), "y" (b));
kono
parents: 0
diff changeset
1229 return result;
kono
parents: 0
diff changeset
1230 }
kono
parents: 0
diff changeset
1231
kono
parents: 0
diff changeset
1232 static __inline __m64
kono
parents: 0
diff changeset
1233 _mm_avg4_pu8 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1234 {
kono
parents: 0
diff changeset
1235 return (__m64) __builtin_arm_wavg4 ((__v8qi)a, (__v8qi)b);
kono
parents: 0
diff changeset
1236 }
kono
parents: 0
diff changeset
1237
kono
parents: 0
diff changeset
1238 static __inline __m64
kono
parents: 0
diff changeset
1239 _mm_avg4r_pu8 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1240 {
kono
parents: 0
diff changeset
1241 return (__m64) __builtin_arm_wavg4r ((__v8qi)a, (__v8qi)b);
kono
parents: 0
diff changeset
1242 }
kono
parents: 0
diff changeset
1243
kono
parents: 0
diff changeset
1244 static __inline __m64
kono
parents: 0
diff changeset
1245 _mm_maddx_pi16 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1246 {
kono
parents: 0
diff changeset
1247 return (__m64) __builtin_arm_wmaddsx ((__v4hi)a, (__v4hi)b);
kono
parents: 0
diff changeset
1248 }
kono
parents: 0
diff changeset
1249
kono
parents: 0
diff changeset
1250 static __inline __m64
kono
parents: 0
diff changeset
1251 _mm_maddx_pu16 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1252 {
kono
parents: 0
diff changeset
1253 return (__m64) __builtin_arm_wmaddux ((__v4hi)a, (__v4hi)b);
kono
parents: 0
diff changeset
1254 }
kono
parents: 0
diff changeset
1255
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1256 static __inline __m64
111
kono
parents: 0
diff changeset
1257 _mm_msub_pi16 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1258 {
kono
parents: 0
diff changeset
1259 return (__m64) __builtin_arm_wmaddsn ((__v4hi)a, (__v4hi)b);
kono
parents: 0
diff changeset
1260 }
kono
parents: 0
diff changeset
1261
kono
parents: 0
diff changeset
1262 static __inline __m64
kono
parents: 0
diff changeset
1263 _mm_msub_pu16 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1264 {
kono
parents: 0
diff changeset
1265 return (__m64) __builtin_arm_wmaddun ((__v4hi)a, (__v4hi)b);
kono
parents: 0
diff changeset
1266 }
kono
parents: 0
diff changeset
1267
kono
parents: 0
diff changeset
1268 static __inline __m64
kono
parents: 0
diff changeset
1269 _mm_mulhi_pi32 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1270 {
kono
parents: 0
diff changeset
1271 return (__m64) __builtin_arm_wmulwsm ((__v2si)a, (__v2si)b);
kono
parents: 0
diff changeset
1272 }
kono
parents: 0
diff changeset
1273
kono
parents: 0
diff changeset
1274 static __inline __m64
kono
parents: 0
diff changeset
1275 _mm_mulhi_pu32 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1276 {
kono
parents: 0
diff changeset
1277 return (__m64) __builtin_arm_wmulwum ((__v2si)a, (__v2si)b);
kono
parents: 0
diff changeset
1278 }
kono
parents: 0
diff changeset
1279
kono
parents: 0
diff changeset
1280 static __inline __m64
kono
parents: 0
diff changeset
1281 _mm_mulhir_pi16 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1282 {
kono
parents: 0
diff changeset
1283 return (__m64) __builtin_arm_wmulsmr ((__v4hi)a, (__v4hi)b);
kono
parents: 0
diff changeset
1284 }
kono
parents: 0
diff changeset
1285
kono
parents: 0
diff changeset
1286 static __inline __m64
kono
parents: 0
diff changeset
1287 _mm_mulhir_pi32 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1288 {
kono
parents: 0
diff changeset
1289 return (__m64) __builtin_arm_wmulwsmr ((__v2si)a, (__v2si)b);
kono
parents: 0
diff changeset
1290 }
kono
parents: 0
diff changeset
1291
kono
parents: 0
diff changeset
1292 static __inline __m64
kono
parents: 0
diff changeset
1293 _mm_mulhir_pu16 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1294 {
kono
parents: 0
diff changeset
1295 return (__m64) __builtin_arm_wmulumr ((__v4hi)a, (__v4hi)b);
kono
parents: 0
diff changeset
1296 }
kono
parents: 0
diff changeset
1297
kono
parents: 0
diff changeset
1298 static __inline __m64
kono
parents: 0
diff changeset
1299 _mm_mulhir_pu32 (__m64 a, __m64 b)
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1300 {
111
kono
parents: 0
diff changeset
1301 return (__m64) __builtin_arm_wmulwumr ((__v2si)a, (__v2si)b);
kono
parents: 0
diff changeset
1302 }
kono
parents: 0
diff changeset
1303
kono
parents: 0
diff changeset
1304 static __inline __m64
kono
parents: 0
diff changeset
1305 _mm_mullo_pi32 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1306 {
kono
parents: 0
diff changeset
1307 return (__m64) __builtin_arm_wmulwl ((__v2si)a, (__v2si)b);
kono
parents: 0
diff changeset
1308 }
kono
parents: 0
diff changeset
1309
kono
parents: 0
diff changeset
1310 static __inline __m64
kono
parents: 0
diff changeset
1311 _mm_qmulm_pi16 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1312 {
kono
parents: 0
diff changeset
1313 return (__m64) __builtin_arm_wqmulm ((__v4hi)a, (__v4hi)b);
kono
parents: 0
diff changeset
1314 }
kono
parents: 0
diff changeset
1315
kono
parents: 0
diff changeset
1316 static __inline __m64
kono
parents: 0
diff changeset
1317 _mm_qmulm_pi32 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1318 {
kono
parents: 0
diff changeset
1319 return (__m64) __builtin_arm_wqmulwm ((__v2si)a, (__v2si)b);
kono
parents: 0
diff changeset
1320 }
kono
parents: 0
diff changeset
1321
kono
parents: 0
diff changeset
1322 static __inline __m64
kono
parents: 0
diff changeset
1323 _mm_qmulmr_pi16 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1324 {
kono
parents: 0
diff changeset
1325 return (__m64) __builtin_arm_wqmulmr ((__v4hi)a, (__v4hi)b);
kono
parents: 0
diff changeset
1326 }
kono
parents: 0
diff changeset
1327
kono
parents: 0
diff changeset
1328 static __inline __m64
kono
parents: 0
diff changeset
1329 _mm_qmulmr_pi32 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1330 {
kono
parents: 0
diff changeset
1331 return (__m64) __builtin_arm_wqmulwmr ((__v2si)a, (__v2si)b);
kono
parents: 0
diff changeset
1332 }
kono
parents: 0
diff changeset
1333
kono
parents: 0
diff changeset
1334 static __inline __m64
kono
parents: 0
diff changeset
1335 _mm_subaddhx_pi16 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1336 {
kono
parents: 0
diff changeset
1337 return (__m64) __builtin_arm_wsubaddhx ((__v4hi)a, (__v4hi)b);
kono
parents: 0
diff changeset
1338 }
kono
parents: 0
diff changeset
1339
kono
parents: 0
diff changeset
1340 static __inline __m64
kono
parents: 0
diff changeset
1341 _mm_addbhusl_pu8 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1342 {
kono
parents: 0
diff changeset
1343 return (__m64) __builtin_arm_waddbhusl ((__v4hi)a, (__v8qi)b);
kono
parents: 0
diff changeset
1344 }
kono
parents: 0
diff changeset
1345
kono
parents: 0
diff changeset
1346 static __inline __m64
kono
parents: 0
diff changeset
1347 _mm_addbhusm_pu8 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1348 {
kono
parents: 0
diff changeset
1349 return (__m64) __builtin_arm_waddbhusm ((__v4hi)a, (__v8qi)b);
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1350 }
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1351
111
kono
parents: 0
diff changeset
1352 #define _mm_qmiabb_pi32(acc, m1, m2) \
kono
parents: 0
diff changeset
1353 ({\
kono
parents: 0
diff changeset
1354 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1355 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1356 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1357 _acc = (__m64) __builtin_arm_wqmiabb ((__v2si)_acc, (__v4hi)_m1, (__v4hi)_m2);\
kono
parents: 0
diff changeset
1358 _acc;\
kono
parents: 0
diff changeset
1359 })
kono
parents: 0
diff changeset
1360
kono
parents: 0
diff changeset
1361 #define _mm_qmiabbn_pi32(acc, m1, m2) \
kono
parents: 0
diff changeset
1362 ({\
kono
parents: 0
diff changeset
1363 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1364 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1365 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1366 _acc = (__m64) __builtin_arm_wqmiabbn ((__v2si)_acc, (__v4hi)_m1, (__v4hi)_m2);\
kono
parents: 0
diff changeset
1367 _acc;\
kono
parents: 0
diff changeset
1368 })
kono
parents: 0
diff changeset
1369
kono
parents: 0
diff changeset
1370 #define _mm_qmiabt_pi32(acc, m1, m2) \
kono
parents: 0
diff changeset
1371 ({\
kono
parents: 0
diff changeset
1372 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1373 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1374 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1375 _acc = (__m64) __builtin_arm_wqmiabt ((__v2si)_acc, (__v4hi)_m1, (__v4hi)_m2);\
kono
parents: 0
diff changeset
1376 _acc;\
kono
parents: 0
diff changeset
1377 })
kono
parents: 0
diff changeset
1378
kono
parents: 0
diff changeset
1379 #define _mm_qmiabtn_pi32(acc, m1, m2) \
kono
parents: 0
diff changeset
1380 ({\
kono
parents: 0
diff changeset
1381 __m64 _acc=acc;\
kono
parents: 0
diff changeset
1382 __m64 _m1=m1;\
kono
parents: 0
diff changeset
1383 __m64 _m2=m2;\
kono
parents: 0
diff changeset
1384 _acc = (__m64) __builtin_arm_wqmiabtn ((__v2si)_acc, (__v4hi)_m1, (__v4hi)_m2);\
kono
parents: 0
diff changeset
1385 _acc;\
kono
parents: 0
diff changeset
1386 })
kono
parents: 0
diff changeset
1387
kono
parents: 0
diff changeset
1388 #define _mm_qmiatb_pi32(acc, m1, m2) \
kono
parents: 0
diff changeset
1389 ({\
kono
parents: 0
diff changeset
1390 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1391 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1392 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1393 _acc = (__m64) __builtin_arm_wqmiatb ((__v2si)_acc, (__v4hi)_m1, (__v4hi)_m2);\
kono
parents: 0
diff changeset
1394 _acc;\
kono
parents: 0
diff changeset
1395 })
kono
parents: 0
diff changeset
1396
kono
parents: 0
diff changeset
1397 #define _mm_qmiatbn_pi32(acc, m1, m2) \
kono
parents: 0
diff changeset
1398 ({\
kono
parents: 0
diff changeset
1399 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1400 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1401 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1402 _acc = (__m64) __builtin_arm_wqmiatbn ((__v2si)_acc, (__v4hi)_m1, (__v4hi)_m2);\
kono
parents: 0
diff changeset
1403 _acc;\
kono
parents: 0
diff changeset
1404 })
kono
parents: 0
diff changeset
1405
kono
parents: 0
diff changeset
1406 #define _mm_qmiatt_pi32(acc, m1, m2) \
kono
parents: 0
diff changeset
1407 ({\
kono
parents: 0
diff changeset
1408 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1409 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1410 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1411 _acc = (__m64) __builtin_arm_wqmiatt ((__v2si)_acc, (__v4hi)_m1, (__v4hi)_m2);\
kono
parents: 0
diff changeset
1412 _acc;\
kono
parents: 0
diff changeset
1413 })
kono
parents: 0
diff changeset
1414
kono
parents: 0
diff changeset
1415 #define _mm_qmiattn_pi32(acc, m1, m2) \
kono
parents: 0
diff changeset
1416 ({\
kono
parents: 0
diff changeset
1417 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1418 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1419 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1420 _acc = (__m64) __builtin_arm_wqmiattn ((__v2si)_acc, (__v4hi)_m1, (__v4hi)_m2);\
kono
parents: 0
diff changeset
1421 _acc;\
kono
parents: 0
diff changeset
1422 })
kono
parents: 0
diff changeset
1423
kono
parents: 0
diff changeset
1424 #define _mm_wmiabb_si64(acc, m1, m2) \
kono
parents: 0
diff changeset
1425 ({\
kono
parents: 0
diff changeset
1426 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1427 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1428 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1429 _acc = (__m64) __builtin_arm_wmiabb (_acc, (__v4hi)_m1, (__v4hi)_m2);\
kono
parents: 0
diff changeset
1430 _acc;\
kono
parents: 0
diff changeset
1431 })
kono
parents: 0
diff changeset
1432
kono
parents: 0
diff changeset
1433 #define _mm_wmiabbn_si64(acc, m1, m2) \
kono
parents: 0
diff changeset
1434 ({\
kono
parents: 0
diff changeset
1435 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1436 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1437 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1438 _acc = (__m64) __builtin_arm_wmiabbn (_acc, (__v4hi)_m1, (__v4hi)_m2);\
kono
parents: 0
diff changeset
1439 _acc;\
kono
parents: 0
diff changeset
1440 })
kono
parents: 0
diff changeset
1441
kono
parents: 0
diff changeset
1442 #define _mm_wmiabt_si64(acc, m1, m2) \
kono
parents: 0
diff changeset
1443 ({\
kono
parents: 0
diff changeset
1444 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1445 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1446 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1447 _acc = (__m64) __builtin_arm_wmiabt (_acc, (__v4hi)_m1, (__v4hi)_m2);\
kono
parents: 0
diff changeset
1448 _acc;\
kono
parents: 0
diff changeset
1449 })
kono
parents: 0
diff changeset
1450
kono
parents: 0
diff changeset
1451 #define _mm_wmiabtn_si64(acc, m1, m2) \
kono
parents: 0
diff changeset
1452 ({\
kono
parents: 0
diff changeset
1453 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1454 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1455 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1456 _acc = (__m64) __builtin_arm_wmiabtn (_acc, (__v4hi)_m1, (__v4hi)_m2);\
kono
parents: 0
diff changeset
1457 _acc;\
kono
parents: 0
diff changeset
1458 })
kono
parents: 0
diff changeset
1459
kono
parents: 0
diff changeset
1460 #define _mm_wmiatb_si64(acc, m1, m2) \
kono
parents: 0
diff changeset
1461 ({\
kono
parents: 0
diff changeset
1462 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1463 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1464 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1465 _acc = (__m64) __builtin_arm_wmiatb (_acc, (__v4hi)_m1, (__v4hi)_m2);\
kono
parents: 0
diff changeset
1466 _acc;\
kono
parents: 0
diff changeset
1467 })
kono
parents: 0
diff changeset
1468
kono
parents: 0
diff changeset
1469 #define _mm_wmiatbn_si64(acc, m1, m2) \
kono
parents: 0
diff changeset
1470 ({\
kono
parents: 0
diff changeset
1471 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1472 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1473 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1474 _acc = (__m64) __builtin_arm_wmiatbn (_acc, (__v4hi)_m1, (__v4hi)_m2);\
kono
parents: 0
diff changeset
1475 _acc;\
kono
parents: 0
diff changeset
1476 })
kono
parents: 0
diff changeset
1477
kono
parents: 0
diff changeset
1478 #define _mm_wmiatt_si64(acc, m1, m2) \
kono
parents: 0
diff changeset
1479 ({\
kono
parents: 0
diff changeset
1480 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1481 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1482 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1483 _acc = (__m64) __builtin_arm_wmiatt (_acc, (__v4hi)_m1, (__v4hi)_m2);\
kono
parents: 0
diff changeset
1484 _acc;\
kono
parents: 0
diff changeset
1485 })
kono
parents: 0
diff changeset
1486
kono
parents: 0
diff changeset
1487 #define _mm_wmiattn_si64(acc, m1, m2) \
kono
parents: 0
diff changeset
1488 ({\
kono
parents: 0
diff changeset
1489 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1490 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1491 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1492 _acc = (__m64) __builtin_arm_wmiattn (_acc, (__v4hi)_m1, (__v4hi)_m2);\
kono
parents: 0
diff changeset
1493 _acc;\
kono
parents: 0
diff changeset
1494 })
kono
parents: 0
diff changeset
1495
kono
parents: 0
diff changeset
1496 #define _mm_wmiawbb_si64(acc, m1, m2) \
kono
parents: 0
diff changeset
1497 ({\
kono
parents: 0
diff changeset
1498 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1499 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1500 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1501 _acc = (__m64) __builtin_arm_wmiawbb (_acc, (__v2si)_m1, (__v2si)_m2);\
kono
parents: 0
diff changeset
1502 _acc;\
kono
parents: 0
diff changeset
1503 })
kono
parents: 0
diff changeset
1504
kono
parents: 0
diff changeset
1505 #define _mm_wmiawbbn_si64(acc, m1, m2) \
kono
parents: 0
diff changeset
1506 ({\
kono
parents: 0
diff changeset
1507 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1508 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1509 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1510 _acc = (__m64) __builtin_arm_wmiawbbn (_acc, (__v2si)_m1, (__v2si)_m2);\
kono
parents: 0
diff changeset
1511 _acc;\
kono
parents: 0
diff changeset
1512 })
kono
parents: 0
diff changeset
1513
kono
parents: 0
diff changeset
1514 #define _mm_wmiawbt_si64(acc, m1, m2) \
kono
parents: 0
diff changeset
1515 ({\
kono
parents: 0
diff changeset
1516 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1517 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1518 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1519 _acc = (__m64) __builtin_arm_wmiawbt (_acc, (__v2si)_m1, (__v2si)_m2);\
kono
parents: 0
diff changeset
1520 _acc;\
kono
parents: 0
diff changeset
1521 })
kono
parents: 0
diff changeset
1522
kono
parents: 0
diff changeset
1523 #define _mm_wmiawbtn_si64(acc, m1, m2) \
kono
parents: 0
diff changeset
1524 ({\
kono
parents: 0
diff changeset
1525 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1526 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1527 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1528 _acc = (__m64) __builtin_arm_wmiawbtn (_acc, (__v2si)_m1, (__v2si)_m2);\
kono
parents: 0
diff changeset
1529 _acc;\
kono
parents: 0
diff changeset
1530 })
kono
parents: 0
diff changeset
1531
kono
parents: 0
diff changeset
1532 #define _mm_wmiawtb_si64(acc, m1, m2) \
kono
parents: 0
diff changeset
1533 ({\
kono
parents: 0
diff changeset
1534 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1535 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1536 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1537 _acc = (__m64) __builtin_arm_wmiawtb (_acc, (__v2si)_m1, (__v2si)_m2);\
kono
parents: 0
diff changeset
1538 _acc;\
kono
parents: 0
diff changeset
1539 })
kono
parents: 0
diff changeset
1540
kono
parents: 0
diff changeset
1541 #define _mm_wmiawtbn_si64(acc, m1, m2) \
kono
parents: 0
diff changeset
1542 ({\
kono
parents: 0
diff changeset
1543 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1544 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1545 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1546 _acc = (__m64) __builtin_arm_wmiawtbn (_acc, (__v2si)_m1, (__v2si)_m2);\
kono
parents: 0
diff changeset
1547 _acc;\
kono
parents: 0
diff changeset
1548 })
kono
parents: 0
diff changeset
1549
kono
parents: 0
diff changeset
1550 #define _mm_wmiawtt_si64(acc, m1, m2) \
kono
parents: 0
diff changeset
1551 ({\
kono
parents: 0
diff changeset
1552 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1553 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1554 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1555 _acc = (__m64) __builtin_arm_wmiawtt (_acc, (__v2si)_m1, (__v2si)_m2);\
kono
parents: 0
diff changeset
1556 _acc;\
kono
parents: 0
diff changeset
1557 })
kono
parents: 0
diff changeset
1558
kono
parents: 0
diff changeset
1559 #define _mm_wmiawttn_si64(acc, m1, m2) \
kono
parents: 0
diff changeset
1560 ({\
kono
parents: 0
diff changeset
1561 __m64 _acc = acc;\
kono
parents: 0
diff changeset
1562 __m64 _m1 = m1;\
kono
parents: 0
diff changeset
1563 __m64 _m2 = m2;\
kono
parents: 0
diff changeset
1564 _acc = (__m64) __builtin_arm_wmiawttn (_acc, (__v2si)_m1, (__v2si)_m2);\
kono
parents: 0
diff changeset
1565 _acc;\
kono
parents: 0
diff changeset
1566 })
kono
parents: 0
diff changeset
1567
kono
parents: 0
diff changeset
1568 /* The third argument should be an immediate. */
kono
parents: 0
diff changeset
1569 #define _mm_merge_si64(a, b, n) \
kono
parents: 0
diff changeset
1570 ({\
kono
parents: 0
diff changeset
1571 __m64 result;\
kono
parents: 0
diff changeset
1572 result = (__m64) __builtin_arm_wmerge ((__m64) (a), (__m64) (b), (n));\
kono
parents: 0
diff changeset
1573 result;\
kono
parents: 0
diff changeset
1574 })
kono
parents: 0
diff changeset
1575 #endif /* __IWMMXT2__ */
kono
parents: 0
diff changeset
1576
kono
parents: 0
diff changeset
1577 static __inline __m64
kono
parents: 0
diff changeset
1578 _mm_alignr0_si64 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1579 {
kono
parents: 0
diff changeset
1580 return (__m64) __builtin_arm_walignr0 ((__v8qi) a, (__v8qi) b);
kono
parents: 0
diff changeset
1581 }
kono
parents: 0
diff changeset
1582
kono
parents: 0
diff changeset
1583 static __inline __m64
kono
parents: 0
diff changeset
1584 _mm_alignr1_si64 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1585 {
kono
parents: 0
diff changeset
1586 return (__m64) __builtin_arm_walignr1 ((__v8qi) a, (__v8qi) b);
kono
parents: 0
diff changeset
1587 }
kono
parents: 0
diff changeset
1588
kono
parents: 0
diff changeset
1589 static __inline __m64
kono
parents: 0
diff changeset
1590 _mm_alignr2_si64 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1591 {
kono
parents: 0
diff changeset
1592 return (__m64) __builtin_arm_walignr2 ((__v8qi) a, (__v8qi) b);
kono
parents: 0
diff changeset
1593 }
kono
parents: 0
diff changeset
1594
kono
parents: 0
diff changeset
1595 static __inline __m64
kono
parents: 0
diff changeset
1596 _mm_alignr3_si64 (__m64 a, __m64 b)
kono
parents: 0
diff changeset
1597 {
kono
parents: 0
diff changeset
1598 return (__m64) __builtin_arm_walignr3 ((__v8qi) a, (__v8qi) b);
kono
parents: 0
diff changeset
1599 }
kono
parents: 0
diff changeset
1600
kono
parents: 0
diff changeset
1601 static __inline void
kono
parents: 0
diff changeset
1602 _mm_tandcb ()
kono
parents: 0
diff changeset
1603 {
kono
parents: 0
diff changeset
1604 __asm __volatile ("tandcb r15");
kono
parents: 0
diff changeset
1605 }
kono
parents: 0
diff changeset
1606
kono
parents: 0
diff changeset
1607 static __inline void
kono
parents: 0
diff changeset
1608 _mm_tandch ()
kono
parents: 0
diff changeset
1609 {
kono
parents: 0
diff changeset
1610 __asm __volatile ("tandch r15");
kono
parents: 0
diff changeset
1611 }
kono
parents: 0
diff changeset
1612
kono
parents: 0
diff changeset
1613 static __inline void
kono
parents: 0
diff changeset
1614 _mm_tandcw ()
kono
parents: 0
diff changeset
1615 {
kono
parents: 0
diff changeset
1616 __asm __volatile ("tandcw r15");
kono
parents: 0
diff changeset
1617 }
kono
parents: 0
diff changeset
1618
kono
parents: 0
diff changeset
1619 #define _mm_textrcb(n) \
kono
parents: 0
diff changeset
1620 ({\
kono
parents: 0
diff changeset
1621 __asm__ __volatile__ (\
kono
parents: 0
diff changeset
1622 "textrcb r15, %0" : : "i" (n));\
kono
parents: 0
diff changeset
1623 })
kono
parents: 0
diff changeset
1624
kono
parents: 0
diff changeset
1625 #define _mm_textrch(n) \
kono
parents: 0
diff changeset
1626 ({\
kono
parents: 0
diff changeset
1627 __asm__ __volatile__ (\
kono
parents: 0
diff changeset
1628 "textrch r15, %0" : : "i" (n));\
kono
parents: 0
diff changeset
1629 })
kono
parents: 0
diff changeset
1630
kono
parents: 0
diff changeset
1631 #define _mm_textrcw(n) \
kono
parents: 0
diff changeset
1632 ({\
kono
parents: 0
diff changeset
1633 __asm__ __volatile__ (\
kono
parents: 0
diff changeset
1634 "textrcw r15, %0" : : "i" (n));\
kono
parents: 0
diff changeset
1635 })
kono
parents: 0
diff changeset
1636
kono
parents: 0
diff changeset
1637 static __inline void
kono
parents: 0
diff changeset
1638 _mm_torcb ()
kono
parents: 0
diff changeset
1639 {
kono
parents: 0
diff changeset
1640 __asm __volatile ("torcb r15");
kono
parents: 0
diff changeset
1641 }
kono
parents: 0
diff changeset
1642
kono
parents: 0
diff changeset
1643 static __inline void
kono
parents: 0
diff changeset
1644 _mm_torch ()
kono
parents: 0
diff changeset
1645 {
kono
parents: 0
diff changeset
1646 __asm __volatile ("torch r15");
kono
parents: 0
diff changeset
1647 }
kono
parents: 0
diff changeset
1648
kono
parents: 0
diff changeset
1649 static __inline void
kono
parents: 0
diff changeset
1650 _mm_torcw ()
kono
parents: 0
diff changeset
1651 {
kono
parents: 0
diff changeset
1652 __asm __volatile ("torcw r15");
kono
parents: 0
diff changeset
1653 }
kono
parents: 0
diff changeset
1654
kono
parents: 0
diff changeset
1655 #ifdef __IWMMXT2__
kono
parents: 0
diff changeset
1656 static __inline void
kono
parents: 0
diff changeset
1657 _mm_torvscb ()
kono
parents: 0
diff changeset
1658 {
kono
parents: 0
diff changeset
1659 __asm __volatile ("torvscb r15");
kono
parents: 0
diff changeset
1660 }
kono
parents: 0
diff changeset
1661
kono
parents: 0
diff changeset
1662 static __inline void
kono
parents: 0
diff changeset
1663 _mm_torvsch ()
kono
parents: 0
diff changeset
1664 {
kono
parents: 0
diff changeset
1665 __asm __volatile ("torvsch r15");
kono
parents: 0
diff changeset
1666 }
kono
parents: 0
diff changeset
1667
kono
parents: 0
diff changeset
1668 static __inline void
kono
parents: 0
diff changeset
1669 _mm_torvscw ()
kono
parents: 0
diff changeset
1670 {
kono
parents: 0
diff changeset
1671 __asm __volatile ("torvscw r15");
kono
parents: 0
diff changeset
1672 }
kono
parents: 0
diff changeset
1673 #endif /* __IWMMXT2__ */
kono
parents: 0
diff changeset
1674
kono
parents: 0
diff changeset
1675 static __inline __m64
kono
parents: 0
diff changeset
1676 _mm_tbcst_pi8 (int value)
kono
parents: 0
diff changeset
1677 {
kono
parents: 0
diff changeset
1678 return (__m64) __builtin_arm_tbcstb ((signed char) value);
kono
parents: 0
diff changeset
1679 }
kono
parents: 0
diff changeset
1680
kono
parents: 0
diff changeset
1681 static __inline __m64
kono
parents: 0
diff changeset
1682 _mm_tbcst_pi16 (int value)
kono
parents: 0
diff changeset
1683 {
kono
parents: 0
diff changeset
1684 return (__m64) __builtin_arm_tbcsth ((short) value);
kono
parents: 0
diff changeset
1685 }
kono
parents: 0
diff changeset
1686
kono
parents: 0
diff changeset
1687 static __inline __m64
kono
parents: 0
diff changeset
1688 _mm_tbcst_pi32 (int value)
kono
parents: 0
diff changeset
1689 {
kono
parents: 0
diff changeset
1690 return (__m64) __builtin_arm_tbcstw (value);
kono
parents: 0
diff changeset
1691 }
kono
parents: 0
diff changeset
1692
kono
parents: 0
diff changeset
1693 #define _m_empty _mm_empty
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1694 #define _m_packsswb _mm_packs_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1695 #define _m_packssdw _mm_packs_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1696 #define _m_packuswb _mm_packs_pu16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1697 #define _m_packusdw _mm_packs_pu32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1698 #define _m_packssqd _mm_packs_pi64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1699 #define _m_packusqd _mm_packs_pu64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1700 #define _mm_packs_si64 _mm_packs_pi64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1701 #define _mm_packs_su64 _mm_packs_pu64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1702 #define _m_punpckhbw _mm_unpackhi_pi8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1703 #define _m_punpckhwd _mm_unpackhi_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1704 #define _m_punpckhdq _mm_unpackhi_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1705 #define _m_punpcklbw _mm_unpacklo_pi8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1706 #define _m_punpcklwd _mm_unpacklo_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1707 #define _m_punpckldq _mm_unpacklo_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1708 #define _m_punpckehsbw _mm_unpackeh_pi8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1709 #define _m_punpckehswd _mm_unpackeh_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1710 #define _m_punpckehsdq _mm_unpackeh_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1711 #define _m_punpckehubw _mm_unpackeh_pu8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1712 #define _m_punpckehuwd _mm_unpackeh_pu16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1713 #define _m_punpckehudq _mm_unpackeh_pu32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1714 #define _m_punpckelsbw _mm_unpackel_pi8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1715 #define _m_punpckelswd _mm_unpackel_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1716 #define _m_punpckelsdq _mm_unpackel_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1717 #define _m_punpckelubw _mm_unpackel_pu8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1718 #define _m_punpckeluwd _mm_unpackel_pu16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1719 #define _m_punpckeludq _mm_unpackel_pu32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1720 #define _m_paddb _mm_add_pi8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1721 #define _m_paddw _mm_add_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1722 #define _m_paddd _mm_add_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1723 #define _m_paddsb _mm_adds_pi8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1724 #define _m_paddsw _mm_adds_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1725 #define _m_paddsd _mm_adds_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1726 #define _m_paddusb _mm_adds_pu8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1727 #define _m_paddusw _mm_adds_pu16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1728 #define _m_paddusd _mm_adds_pu32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1729 #define _m_psubb _mm_sub_pi8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1730 #define _m_psubw _mm_sub_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1731 #define _m_psubd _mm_sub_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1732 #define _m_psubsb _mm_subs_pi8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1733 #define _m_psubsw _mm_subs_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1734 #define _m_psubuw _mm_subs_pi32 /* NOTE(review): name departs from the neighbouring aliases (_m_paddsd -> _mm_adds_pi32, _m_psubusd -> _mm_subs_pu32); possibly meant _m_psubsd -- confirm before changing, since existing users may rely on _m_psubuw.  */
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1735 #define _m_psubusb _mm_subs_pu8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1736 #define _m_psubusw _mm_subs_pu16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1737 #define _m_psubusd _mm_subs_pu32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1738 #define _m_pmaddwd _mm_madd_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1739 #define _m_pmadduwd _mm_madd_pu16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1740 #define _m_pmulhw _mm_mulhi_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1741 #define _m_pmulhuw _mm_mulhi_pu16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1742 #define _m_pmullw _mm_mullo_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1743 #define _m_pmacsw _mm_mac_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1744 #define _m_pmacuw _mm_mac_pu16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1745 #define _m_pmacszw _mm_macz_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1746 #define _m_pmacuzw _mm_macz_pu16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1747 #define _m_paccb _mm_acc_pu8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1748 #define _m_paccw _mm_acc_pu16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1749 #define _m_paccd _mm_acc_pu32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1750 #define _m_pmia _mm_mia_si64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1751 #define _m_pmiaph _mm_miaph_si64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1752 #define _m_pmiabb _mm_miabb_si64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1753 #define _m_pmiabt _mm_miabt_si64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1754 #define _m_pmiatb _mm_miatb_si64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1755 #define _m_pmiatt _mm_miatt_si64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1756 #define _m_psllw _mm_sll_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1757 #define _m_psllwi _mm_slli_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1758 #define _m_pslld _mm_sll_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1759 #define _m_pslldi _mm_slli_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1760 #define _m_psllq _mm_sll_si64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1761 #define _m_psllqi _mm_slli_si64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1762 #define _m_psraw _mm_sra_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1763 #define _m_psrawi _mm_srai_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1764 #define _m_psrad _mm_sra_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1765 #define _m_psradi _mm_srai_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1766 #define _m_psraq _mm_sra_si64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1767 #define _m_psraqi _mm_srai_si64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1768 #define _m_psrlw _mm_srl_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1769 #define _m_psrlwi _mm_srli_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1770 #define _m_psrld _mm_srl_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1771 #define _m_psrldi _mm_srli_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1772 #define _m_psrlq _mm_srl_si64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1773 #define _m_psrlqi _mm_srli_si64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1774 #define _m_prorw _mm_ror_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1775 #define _m_prorwi _mm_rori_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1776 #define _m_prord _mm_ror_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1777 #define _m_prordi _mm_rori_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1778 #define _m_prorq _mm_ror_si64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1779 #define _m_prorqi _mm_rori_si64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1780 #define _m_pand _mm_and_si64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1781 #define _m_pandn _mm_andnot_si64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1782 #define _m_por _mm_or_si64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1783 #define _m_pxor _mm_xor_si64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1784 #define _m_pcmpeqb _mm_cmpeq_pi8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1785 #define _m_pcmpeqw _mm_cmpeq_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1786 #define _m_pcmpeqd _mm_cmpeq_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1787 #define _m_pcmpgtb _mm_cmpgt_pi8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1788 #define _m_pcmpgtub _mm_cmpgt_pu8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1789 #define _m_pcmpgtw _mm_cmpgt_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1790 #define _m_pcmpgtuw _mm_cmpgt_pu16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1791 #define _m_pcmpgtd _mm_cmpgt_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1792 #define _m_pcmpgtud _mm_cmpgt_pu32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1793 #define _m_pextrb _mm_extract_pi8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1794 #define _m_pextrw _mm_extract_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1795 #define _m_pextrd _mm_extract_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1796 #define _m_pextrub _mm_extract_pu8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1797 #define _m_pextruw _mm_extract_pu16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1798 #define _m_pextrud _mm_extract_pu32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1799 #define _m_pinsrb _mm_insert_pi8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1800 #define _m_pinsrw _mm_insert_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1801 #define _m_pinsrd _mm_insert_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1802 #define _m_pmaxsb _mm_max_pi8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1803 #define _m_pmaxsw _mm_max_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1804 #define _m_pmaxsd _mm_max_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1805 #define _m_pmaxub _mm_max_pu8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1806 #define _m_pmaxuw _mm_max_pu16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1807 #define _m_pmaxud _mm_max_pu32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1808 #define _m_pminsb _mm_min_pi8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1809 #define _m_pminsw _mm_min_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1810 #define _m_pminsd _mm_min_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1811 #define _m_pminub _mm_min_pu8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1812 #define _m_pminuw _mm_min_pu16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1813 #define _m_pminud _mm_min_pu32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1814 #define _m_pmovmskb _mm_movemask_pi8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1815 #define _m_pmovmskw _mm_movemask_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1816 #define _m_pmovmskd _mm_movemask_pi32
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1817 #define _m_pshufw _mm_shuffle_pi16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1818 #define _m_pavgb _mm_avg_pu8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1819 #define _m_pavgw _mm_avg_pu16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1820 #define _m_pavg2b _mm_avg2_pu8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1821 #define _m_pavg2w _mm_avg2_pu16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1822 #define _m_psadbw _mm_sad_pu8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1823 #define _m_psadwd _mm_sad_pu16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1824 #define _m_psadzbw _mm_sadz_pu8
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1825 #define _m_psadzwd _mm_sadz_pu16
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1826 #define _m_paligniq _mm_align_si64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1827 #define _m_cvt_si2pi _mm_cvtsi64_m64
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1828 #define _m_cvt_pi2si _mm_cvtm64_si64
111
kono
parents: 0
diff changeset
1829 #define _m_from_int _mm_cvtsi32_si64
kono
parents: 0
diff changeset
1830 #define _m_to_int _mm_cvtsi64_si32
kono
parents: 0
diff changeset
1831
kono
parents: 0
diff changeset
1832 #if defined __cplusplus
kono
parents: 0
diff changeset
1833 }; /* End "C" */
kono
parents: 0
diff changeset
1834 #endif /* __cplusplus */
0
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1835
a06113de4d67 first commit
kent <kent@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1836 #endif /* _MMINTRIN_H_INCLUDED */