49 lines
2.2 KiB
C++
49 lines
2.2 KiB
C++
/*===-------- amxmovrsintrin.h - AMX MOVRS intrinsics -*- C++ -*---------===
|
|
*
|
|
* Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
* See https://llvm.org/LICENSE.txt for license information.
|
|
* SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
*
|
|
* ===-------------------------------------------------------------------=== */
|
|
|
|
#ifndef __IMMINTRIN_H
|
|
#error "Never use <amxmovrsintrin.h> directly; include <immintrin.h> instead."
|
|
#endif /* __IMMINTRIN_H */
|
|
|
|
#ifndef __AMXMOVRSINTRIN_H
|
|
#define __AMXMOVRSINTRIN_H
|
|
#ifdef __x86_64__
|
|
|
|
#define __DEFAULT_FN_ATTRS_MOVRS \
|
|
__attribute__((__always_inline__, __nodebug__, __target__("amx-movrs")))
|
|
|
|
#define _tile_loaddrs(dst, base, stride) \
|
|
__builtin_ia32_tileloaddrs64((dst), ((const void *)(base)), \
|
|
(__SIZE_TYPE__)(stride))
|
|
#define _tile_stream_loaddrs(dst, base, stride) \
|
|
__builtin_ia32_tileloaddrst164((dst), ((const void *)(base)), \
|
|
(__SIZE_TYPE__)(stride))
|
|
static __inline__ _tile1024i __DEFAULT_FN_ATTRS_MOVRS
|
|
_tile_loaddrs_internal(unsigned short m, unsigned short n, const void *base,
|
|
__SIZE_TYPE__ stride) {
|
|
return __builtin_ia32_tileloaddrs64_internal(m, n, base,
|
|
(__SIZE_TYPE__)(stride));
|
|
}
|
|
static __inline__ _tile1024i __DEFAULT_FN_ATTRS_MOVRS
|
|
_tile_loaddrst1_internal(unsigned short m, unsigned short n, const void *base,
|
|
__SIZE_TYPE__ stride) {
|
|
return __builtin_ia32_tileloaddrst164_internal(m, n, base,
|
|
(__SIZE_TYPE__)(stride));
|
|
}
|
|
static __inline__ void __DEFAULT_FN_ATTRS_MOVRS
|
|
__tile_loaddrs(__tile1024i *dst, const void *base, __SIZE_TYPE__ stride) {
|
|
dst->tile = _tile_loaddrs_internal(dst->row, dst->col, base, stride);
|
|
}
|
|
static __inline__ void __DEFAULT_FN_ATTRS_MOVRS __tile_stream_loaddrs(
|
|
__tile1024i *dst, const void *base, __SIZE_TYPE__ stride) {
|
|
dst->tile = _tile_loaddrst1_internal(dst->row, dst->col, base, stride);
|
|
}
|
|
#undef __DEFAULT_FN_ATTRS_MOVRS
|
|
#endif /* __x86_64__ */
|
|
#endif /* __AMXMOVRSINTRIN_H */
|