28 #ifndef __ARCH_ARM_AAPCS64_HH__
29 #define __ARCH_ARM_AAPCS64_HH__
33 #include <type_traits>
77 template <
typename T,
typename Enabled=
void>
80 template <
typename E,
size_t N>
82 typename
std::enable_if_t<
83 (std::is_integral<E>::value || std::is_floating_point<E>::value) &&
84 (sizeof(E) * N == 8 || sizeof(E) * N == 16)>> :
92 template <
typename T,
typename Enabled=
void>
97 (std::is_array<T>::value ||
98 std::is_class<T>::value ||
99 std::is_union<T>::value) &&
101 !IsVarArgs<T>::value &&
103 !IsAapcs64ShortVector<T>::value
104 >> :
public std::true_type
116 template <
typename T,
typename Enabled=
void>
119 template <
typename E,
size_t N>
121 typename
std::enable_if_t<std::is_floating_point<E>::value && N <= 4>> :
122 public std::true_type
129 template <
typename T,
typename Enabled=
void>
130 struct IsAapcs64Hva :
public std::false_type {};
132 template <
typename E,
size_t N>
133 struct IsAapcs64Hva<
E[N],
134 typename
std::enable_if_t<IsAapcs64ShortVector<E>::value && N <= 4>> :
135 public std::true_type
139 template <
typename T,
typename Enabled=
void>
140 struct IsAapcs64Hxa :
public std::false_type {};
142 template <
typename T>
143 struct IsAapcs64Hxa<T, typename
std::enable_if_t<
144 IsAapcs64Hfa<T>::value || IsAapcs64Hva<T>::value>> :
145 public std::true_type
148 struct Aapcs64ArgumentBase
150 template <
typename T>
155 size_t align = std::max<size_t>(8,
alignof(T));
157 size_t size =
roundUp(
sizeof(T), 8);
178 template <
typename Float>
179 struct Argument<
Aapcs64, Float, typename
std::enable_if_t<
180 std::is_floating_point<Float>::value ||
181 IsAapcs64ShortVector<Float>::value>> :
182 public Aapcs64ArgumentBase
189 return tc->
readVecReg(
id).laneView<Float, 0>();
192 return loadFromStack<Float>(tc, state);
196 template <
typename Float>
198 std::is_floating_point<Float>::value ||
199 IsAapcs64ShortVector<Float>::value>>
206 reg.laneView<Float, 0>() =
f;
217 template <
typename Integer>
219 std::is_integral<Integer>::value && (sizeof(Integer) <= 8)>> :
220 public Aapcs64ArgumentBase
231 return loadFromStack<Integer>(tc, state);
235 template <
typename Integer>
237 std::is_integral<Integer>::value && (sizeof(Integer) > 8)>> :
238 public Aapcs64ArgumentBase
243 if (
alignof(Integer) == 16 && (state.
ngrn % 2))
246 if (
sizeof(Integer) == 16 && state.
ngrn + 1 <= state.
MAX_GRN) {
256 return loadFromStack<Integer>(tc, state);
260 template <
typename Integer>
262 std::is_integral<Integer>::value && (sizeof(Integer) <= 8)>>
271 template <
typename Integer>
273 std::is_integral<Integer>::value && (sizeof(Integer) > 8)>>
289 template <
typename T>
292 template <
typename E,
size_t N>
295 template <
typename HA>
297 IsAapcs64Hxa<HA>::value>> :
public Aapcs64ArgumentBase
303 constexpr
size_t Count =
sizeof(HA) /
sizeof(Elem);
307 for (
int i = 0;
i < Count;
i++)
315 return loadFromStack<HA>(tc, state);
319 template <
typename HA>
321 typename
std::enable_if_t<IsAapcs64Hxa<HA>::value>>
327 constexpr
size_t Count =
sizeof(HA) /
sizeof(Elem);
329 for (
int i = 0;
i < Count;
i++)
339 template <
typename Composite>
341 IsAapcs64Composite<Composite>::value && !IsAapcs64Hxa<Composite>::value>> :
342 public Aapcs64ArgumentBase
347 if (
sizeof(Composite) > 16) {
358 size_t bytes =
sizeof(Composite);
359 using Chunk = uint64_t;
361 const int chunk_size =
sizeof(Chunk);
362 const int regs = (bytes + chunk_size - 1) / chunk_size;
366 alignas(
alignof(Composite)) uint8_t buf[bytes];
367 for (
int i = 0;
i < regs;
i++) {
370 size_t to_copy = std::min<size_t>(bytes, chunk_size);
371 memcpy(buf +
i * chunk_size, &
val, to_copy);
380 return loadFromStack<Composite>(tc, state);
384 template <
typename Composite>
386 IsAapcs64Composite<Composite>::value && !IsAapcs64Hxa<Composite>::value>>
391 if (
sizeof(Composite) > 16) {
400 size_t bytes =
sizeof(Composite);
401 using Chunk = uint64_t;
403 const int chunk_size =
sizeof(Chunk);
404 const int regs = (bytes + chunk_size - 1) / chunk_size;
407 uint8_t *buf = (uint8_t *)&
cp;
408 for (
int i = 0;
i < regs;
i++) {
409 size_t to_copy = std::min<size_t>(bytes, chunk_size);
412 memcpy(&
val, buf, to_copy);
425 #endif // __ARCH_ARM_AAPCS64_HH__