6060/// \headerfile <x86intrin.h>
6161///
6262/// \code
63- /// __m512i _tile_cvtrowps2pbf16h (__tile tsrc, unsigned int row);
63+ /// __m512i _tile_cvtrowps2bf16h (__tile tsrc, unsigned int row);
6464/// \endcode
6565///
6666/// \code{.operation}
8080/// zero_tileconfig_start()
8181/// \endcode
8282///
83- /// This intrinsic corresponds to the \c TCVTROWPS2PBF16H instruction.
83+ /// This intrinsic corresponds to the \c TCVTROWPS2BF16H instruction.
8484///
8585/// \param tsrc
8686/// The source tile. Max size is 1024 Bytes.
8787/// \param row
8888/// The row of the source tile.
89- #define _tile_cvtrowps2pbf16h (tsrc , row ) \
90- __builtin_ia32_tcvtrowps2pbf16h (tsrc, row)
89+ #define _tile_cvtrowps2bf16h (tsrc , row ) \
90+ __builtin_ia32_tcvtrowps2bf16h (tsrc, row)
9191
9292/// Moves a row from a tile register to a zmm destination register, converting
9393/// the fp32 source elements to bf16. It places the resulting bf16 elements
9797/// \headerfile <x86intrin.h>
9898///
9999/// \code
100- /// __m512i _tile_cvtrowps2pbf16l (__tile tsrc, unsigned int row);
100+ /// __m512i _tile_cvtrowps2bf16l (__tile tsrc, unsigned int row);
101101/// \endcode
102102///
103103/// \code{.operation}
117117/// zero_tileconfig_start()
118118/// \endcode
119119///
120- /// This intrinsic corresponds to the \c TCVTROWPS2PBF16L instruction.
120+ /// This intrinsic corresponds to the \c TCVTROWPS2BF16L instruction.
121121///
122122/// \param tsrc
123123/// The source tile. Max size is 1024 Bytes.
124124/// \param row
125125/// The row of the source tile.
126- #define _tile_cvtrowps2pbf16l (tsrc , row ) \
127- __builtin_ia32_tcvtrowps2pbf16l (tsrc, row)
126+ #define _tile_cvtrowps2bf16l (tsrc , row ) \
127+ __builtin_ia32_tcvtrowps2bf16l (tsrc, row)
128128
129129/// Moves a row from a tile register to a zmm destination register, converting
130130/// the fp32 source elements to fp16. It places the resulting fp16 elements
@@ -238,15 +238,15 @@ static __inline__ __m512 __DEFAULT_FN_ATTRS_AVX512 _tile_cvtrowd2ps_internal(
238238}
239239
240240static __inline__ __m512bh __DEFAULT_FN_ATTRS_AVX512
241- _tile_cvtrowps2pbf16h_internal (unsigned short m , unsigned short n ,
242- _tile1024i src , unsigned u ) {
243- return __builtin_ia32_tcvtrowps2pbf16h_internal (m , n , src , u );
241+ _tile_cvtrowps2bf16h_internal (unsigned short m , unsigned short n ,
242+ _tile1024i src , unsigned u ) {
243+ return __builtin_ia32_tcvtrowps2bf16h_internal (m , n , src , u );
244244}
245245
246246static __inline__ __m512bh __DEFAULT_FN_ATTRS_AVX512
247- _tile_cvtrowps2pbf16l_internal (unsigned short m , unsigned short n ,
248- _tile1024i src , unsigned u ) {
249- return __builtin_ia32_tcvtrowps2pbf16l_internal (m , n , src , u );
247+ _tile_cvtrowps2bf16l_internal (unsigned short m , unsigned short n ,
248+ _tile1024i src , unsigned u ) {
249+ return __builtin_ia32_tcvtrowps2bf16l_internal (m , n , src , u );
250250}
251251
252252static __inline__ __m512h __DEFAULT_FN_ATTRS_AVX512 _tile_cvtrowps2phh_internal (
@@ -290,7 +290,7 @@ static __m512 __tile_cvtrowd2ps(__tile1024i src0, unsigned src1) {
290290///
291291/// \headerfile <immintrin.h>
292292///
293- /// This intrinsic corresponds to the <c> TCVTROWPS2PBF16H </c> instruction.
293+ /// This intrinsic corresponds to the <c> TCVTROWPS2BF16H </c> instruction.
294294///
295295/// \param src0
296296/// The 1st source tile. Max size is 1024 Bytes.
@@ -299,8 +299,8 @@ static __m512 __tile_cvtrowd2ps(__tile1024i src0, unsigned src1) {
299299/// \returns
300300/// The destination v32bf16 data. Size is 64 Bytes.
301301__DEFAULT_FN_ATTRS_AVX512
302- static __m512bh __tile_cvtrowps2pbf16h (__tile1024i src0 , unsigned src1 ) {
303- return _tile_cvtrowps2pbf16h_internal (src0 .row , src0 .col , src0 .tile , src1 );
302+ static __m512bh __tile_cvtrowps2bf16h (__tile1024i src0 , unsigned src1 ) {
303+ return _tile_cvtrowps2bf16h_internal (src0 .row , src0 .col , src0 .tile , src1 );
304304}
305305
306306/// Move a row from a tile (src0) to a v32bf16 dst, converting the fp32 source
@@ -309,7 +309,7 @@ static __m512bh __tile_cvtrowps2pbf16h(__tile1024i src0, unsigned src1) {
309309///
310310/// \headerfile <immintrin.h>
311311///
312- /// This intrinsic corresponds to the <c> TCVTROWPS2PBF16L </c> instruction.
312+ /// This intrinsic corresponds to the <c> TCVTROWPS2BF16L </c> instruction.
313313///
314314/// \param src0
315315/// The 1st source tile. Max size is 1024 Bytes.
@@ -318,8 +318,8 @@ static __m512bh __tile_cvtrowps2pbf16h(__tile1024i src0, unsigned src1) {
318318/// \returns
319319/// The destination v32bf16 data. Size is 64 Bytes.
320320__DEFAULT_FN_ATTRS_AVX512
321- static __m512bh __tile_cvtrowps2pbf16l (__tile1024i src0 , unsigned src1 ) {
322- return _tile_cvtrowps2pbf16l_internal (src0 .row , src0 .col , src0 .tile , src1 );
321+ static __m512bh __tile_cvtrowps2bf16l (__tile1024i src0 , unsigned src1 ) {
322+ return _tile_cvtrowps2bf16l_internal (src0 .row , src0 .col , src0 .tile , src1 );
323323}
324324
325325/// Move a row from a tile (src0) to a v32fp16 dst, converting the fp32 source
0 commit comments